Simplest Enterprise Continuous Integration Solutions

Monday, May 16, 2011

Enterprise Linux - SGE installation verification

  • #add user
qconf -auser
or 
[root@linux64-server ~]# cat /tmp/add_sge_user
name sgeuser
oticket 0
fshare 0
delete_time 0
default_project NONE
[root@linux64-server ~]# qconf -Auser /tmp/add_sge_user
root@linux64-server added "sgeuser" to user list
[root@linux64-server ~]# qconf -suserl
sgeuser
root
  • #add hosts
#SGE administrator host
[root@linux64-server ~]# qconf -sh
[root@linux64-server ~]# qconf -ah linux64-server


#SGE execution hosts
[root@linux64-server ~]# qconf -sel
[root@linux64-server ~]# qconf -ae linux64-server,linux64-client1

#SGE submit hosts
[root@linux64-server ~]# qconf -ss
[root@linux64-server ~]# qconf -as linux64-server,linux64-client1
  • #add new host group entry
qconf -ahgrp @allhosts
or 
[root@linux64-server ~]# cat /tmp/add_new_host_grp
group_name @allhosts
hostlist linux64-server linux64-client1
[root@linux64-server ~]# qconf -Ahgrp /tmp/add_new_host_grp
root@linux64-server added "@allhosts " to host group list
[root@linux64-server ~]# qconf -shgrp @allhosts
group_name @allhosts
hostlist linux64-server linux64-client1
  • #add new queue
[root@linux64-server ~]# cat /usr/local/bin/epilogsh
#!/bin/bash
#
# This is the global epilog script that will run after each task is complete.
#
# It reads the variable $epilogsh from its environment (presumably exported
# by the job that was submitted -- confirm against how jobs set it):
#   * unset or empty        -> nothing to do, exit status 0
#   * names an executable   -> run it; its exit status becomes ours
#   * anything else         -> log a message via logger with tag "sge-epilog"
#

# Run the per-job epilog named by $epilogsh, if one was passed.
run_job_epilog() {
  # Nothing was passed: no per-job epilog requested.
  [ -n "${epilogsh:-}" ] || return 0

  # Every expansion is quoted: unquoted, a path containing whitespace made
  # `[` fail with "too many arguments", so the epilog was skipped silently
  # and the problem was never logged.
  if [ -x "$epilogsh" ]; then
    "$epilogsh"
  else
    /usr/bin/logger -t sge-epilog "$epilogsh - File not found or not executable"
  fi
}

run_job_epilog
[root@linux64-server ~]# chmod 555 /usr/local/bin/epilogsh
[root@linux64-server ~]# cat /tmp/add_new_queue
qname                 all.q
hostlist              @allhosts
seq_no                0
load_thresholds       np_load_avg=1.75
suspend_thresholds    NONE
nsuspend              1
suspend_interval      00:05:00
priority              0
min_cpu_interval      00:05:00
processors            UNDEFINED
qtype                 BATCH INTERACTIVE
ckpt_list             NONE
pe_list               make
rerun                 FALSE
slots                 1,[linux64-server=24],[linux64-client1=24]
tmpdir                /tmp
shell                 /bin/csh
prolog                NONE
epilog                /usr/local/bin/epilogsh
shell_start_mode      posix_compliant
starter_method        NONE
suspend_method        NONE
resume_method         NONE
terminate_method      NONE
notify                00:00:60
owner_list            NONE
user_lists            NONE
xuser_lists           NONE
subordinate_list      NONE
complex_values        NONE
projects              NONE
xprojects             NONE
calendar              NONE
initial_state         default
s_rt                  INFINITY
h_rt                  INFINITY
s_cpu                 INFINITY
h_cpu                 INFINITY
s_fsize               INFINITY
h_fsize               INFINITY
s_data                INFINITY
h_data                INFINITY
s_stack               INFINITY
h_stack               INFINITY
s_core                INFINITY
h_core                INFINITY
s_rss                 INFINITY
h_rss                 INFINITY
s_vmem                INFINITY
h_vmem                INFINITY
[root@linux64-server ~]# qconf -Aq /tmp/add_new_queue
root@linux64-server added "all.q" to cluster queue list
  • #make sure sge qmaster daemon is running
[root@linux64-server ~]# ps -ef | grep sge
sgeadmin      8752     1  0 16:16 ?        00:00:02 /opt/SGE/bin/lx24-amd64/sge_qmaster
  • #qstat check host state
[root@linux64-server ~]# qstat -f
queuename                      qtype resv/used/tot. load_avg arch          states
---------------------------------------------------------------------------------
all.q@linux64-server          BIP   0/0/2          -NA-     -NA-          au
---------------------------------------------------------------------------------
all.q@linux64-client1          BIP   0/0/3          0.00     lx24-amd64
  • #qrsh verification on master host
[root@linux64-server ~]# qrsh hostname
linux64-client1
  • #qsub verification on master host
[root@linux64-server ~]# cat /mnt/work/test.sh
#!/bin/bash

# Minimal job used to verify submission: writes one fixed marker line to
# /mnt/work/testSGE.results, replacing any previous content of that file.
printf '%s\n' "this is a test" > /mnt/work/testSGE.results
[root@linux64-server ~]# qsub /mnt/work/test.sh
Your job 33 ("test.sh") has been submitted
[root@linux64-server ~]# qstat
job-ID  prior   name       user         state submit/start at     queue                          slots ja-task-ID
-----------------------------------------------------------------------------------------------------------------
     42 0.50000 test.sh    root         r     05/16/2011 20:01:42 all.q@linux64-client1              1
[root@linux64-server ~]# qstat
[root@linux64-server ~]# ls /mnt/work
test.sh testSGE.results

  • #make sure sge execd daemon is running
[root@linux64-client1 ~]# ps -ef | grep sge
sgeadmin      4920     1  0 16:18 ?        00:00:01 /opt/SGE/bin/lx24-amd64/sge_execd
  • #qstat check host state
[root@linux64-client1 ~]# qstat -f
queuename                      qtype resv/used/tot. load_avg arch          states
---------------------------------------------------------------------------------
all.q@linux64-server          BIP   0/0/2          -NA-     -NA-          au
---------------------------------------------------------------------------------
all.q@linux64-client1          BIP   0/0/3          0.00     lx24-amd64
  • #qrsh verification on execution host
[root@linux64-client1 ~]# qrsh hostname
linux64-client1
  • #qsub verification on execution host
[root@linux64-client1 ~]# qsub /mnt/work/test.sh
Your job 35 ("test.sh") has been submitted
[root@linux64-client1 ~]# qstat
job-ID  prior   name       user         state submit/start at     queue                          slots ja-task-ID
-----------------------------------------------------------------------------------------------------------------
     35 0.50000 test.sh    root         r     05/16/2011 13:57:08 all.q@linux64-client1              1
[root@linux64-client1 ~]# qstat
[root@linux64-client1 ~]# ls /mnt/work
test.sh testSGE.results

No comments:

Post a Comment