[GE users] why qmaster is computing job?

wushi8 wushi8 at qq.com
Tue Nov 2 07:44:20 GMT 2010


I have 5 computers: one is the head node and four are compute nodes.
The SGE package is sge62u6_linux24-x64_rpm.zip.

When I use Intel MPI, everything is OK!

When I use MPICH2, sometimes the qmaster host (the head node) is also computing the job. Why?
------------------------------------------
[root at n01 ~]# qconf -sp mpich
pe_name            mpich
slots              9999
user_lists         NONE
xuser_lists        NONE
start_proc_args    /gridware/sge/mpi/startmpi.sh -catch_rsh $pe_hostfile
stop_proc_args     /gridware/sge/mpi/stopmpi.sh
allocation_rule    $fill_up
control_slaves     TRUE
job_is_first_task  FALSE
urgency_slots      min
accounting_summary TRUE
---------------------------------------------
[root at n01 ~]# qconf -shgrp @grp1
group_name @grp1
hostlist n02 n03 n04 n05
-------------------------------------------
[root at n01 ~]# qconf -su acl
name    acl
type    ACL
fshare  0
oticket 0
entries test,test2

-------------------------------------------
[root at n01 ~]# qconf -sq q1.q
qname                 q1.q
hostlist              @grp1
seq_no                0
load_thresholds       np_load_avg=1.75
suspend_thresholds    NONE
nsuspend              1
suspend_interval      00:05:00
priority              0
min_cpu_interval      00:05:00
processors            UNDEFINED
qtype                 BATCH INTERACTIVE
ckpt_list             NONE
pe_list               mpich
rerun                 FALSE
slots                 1,[n02=1],[n03=1],[n04=1],[n05=1]
tmpdir                /tmp
shell                 /bin/csh
prolog                NONE
epilog                NONE
shell_start_mode      posix_compliant
starter_method        NONE
suspend_method        NONE
resume_method         NONE
terminate_method      NONE
notify                00:00:60
owner_list            NONE
user_lists            acl
xuser_lists           NONE
subordinate_list      NONE
complex_values        NONE
projects              NONE
xprojects             NONE
calendar              NONE
initial_state         default
s_rt                  INFINITY
h_rt                  INFINITY
s_cpu                 INFINITY
h_cpu                 INFINITY
s_fsize               INFINITY
h_fsize               INFINITY
s_data                INFINITY
h_data                INFINITY
s_stack               INFINITY
h_stack               INFINITY
s_core                INFINITY
h_core                INFINITY
s_rss                 INFINITY
h_rss                 INFINITY
s_vmem                INFINITY
h_vmem                INFINITY
----------------------------------------


#!/bin/bash
#
# Grid Engine job script: launches ./xhpl_em64t through MPICH's mpiexec
# from /disk1/test2/em64t/, using the "mpich" parallel environment.
#
# Scheduler directives. All of them are kept together ahead of the first
# command so they do not depend on how far into the script the scheduler
# scans for directive lines.
#$ -j y
#$ -cwd
#$ -N b
#$ -S /bin/bash
#$ -pe mpich 4
#$ -v MPICH_HOME=/disk1/bin,SGE_QMASTER_PORT

# Fail early with a clear message if the environment the launch line relies
# on is missing; otherwise the command would silently expand to "/mpiexec"
# or lose the value of -np.
: "${MPICH_HOME:?MPICH_HOME is not set (expected from the -v directive)}"
: "${NSLOTS:?NSLOTS is not set (expected from the scheduler)}"

# Abort if the working directory is unavailable on this host rather than
# running the benchmark from whatever directory the job started in.
cd /disk1/test2/em64t/ || exit 1

# Earlier launch variants, kept for reference:
###$MPICH_HOME/mpiexec -genv I_MPI_DEVICE sock -machinefile $TMPDIR/machines -np $NSLOTS ./xhpl_em64t 
##$MPICH_HOME/mpiexec -genv I_MPI_DEVICE sock -machinefile $MACHINES -np $NSLOTS ./xhpl_em64t 

# NOTE(review): the active command passes no -machinefile, unlike the
# variants above. Presumably mpiexec then chooses hosts on its own instead
# of using the hosts granted by the scheduler, which may be why processes
# end up on the head node -- confirm against the MPICH2 setup in use.
"$MPICH_HOME"/mpiexec -genv I_MPI_DEVICE sock -np "$NSLOTS" ./xhpl_em64t
--------------------------------------------

------------------------------------------------------
http://gridengine.sunsource.net/ds/viewMessage.do?dsForumId=38&dsMessageId=292047

To unsubscribe from this discussion, e-mail: [users-unsubscribe at gridengine.sunsource.net].



More information about the gridengine-users mailing list