I have 2 nodes, g09r4n[07-08], and configured multisched in the following order:
(1) qmgr -c "set node g09r4n08 partition=test01"
(2) qmgr -c "create queue test01 queue_type=E"
qmgr -c "set queue test01 started=true"
qmgr -c "set queue test01 enabled=true"
(3) qmgr -c "create sched multisched_1"
(4) qmgr -c "set sched multisched_1 partition=tetst01"
(5) qmgr -c 'set sched multisched_1 scheduling=1'
(6)pbs_sched -I multisched_1 -S 15555
Then I submit a job to the test01 queue:
qsub -q test01
The job always stays in state Q.
Viewing the status of the schedulers shows that the state of multisched_1 is down:
[root@g09r4n07 server_logs]# qmgr
Max open servers: 49
Qmgr: list sched
Sched default
sched_host = g09r4n07
pbs_version = 20.0.0
sched_cycle_length = 00:20:00
sched_port = 15004
sched_priv = /var/spool/pbs/sched_priv
sched_log = /var/spool/pbs/sched_logs
scheduling = True
scheduler_iteration = 600
state = idle
preempt_queue_prio = 150
preempt_prio = express_queue, normal_jobs
preempt_order = SCR
preempt_sort = min_time_since_start
log_events = 767
server_dyn_res_alarm = 30
Sched multisched_1
sched_cycle_length = 00:20:00
partition = tetst01
sched_priv = /var/spool/pbs/sched_priv_multisched_1
sched_log = /var/spool/pbs/sched_logs_multisched_1
scheduling = True
scheduler_iteration = 600
state = down
preempt_queue_prio = 150
preempt_prio = express_queue, normal_jobs
preempt_order = SCR
preempt_sort = min_time_since_start
log_events = 767
server_dyn_res_alarm = 30
There are some errors in /var/spool/pbs/server_logs/20221013:
10/13/2022 14:51:35;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:35;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:37;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:37;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:39;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:39;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:41;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:41;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:43;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:43;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:45;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:45;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:47;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
10/13/2022 14:51:47;0001;Server@g09r4n07;Svr;Server@g09r4n07;Operation now in progress (115) in contact_sched, Could not contact Scheduler
So what should I do to get the multisched working?