반응형

1. Install master node

master# hostnamectl set-hostname qmaster.local

master# echo '192.168.56.101 qmaster.local qmaster' >> /etc/hosts

master# echo '192.168.56.102 compute01.local compute01' >> /etc/hosts

master# mkdir -p /BiO/src

master# yum -y install epel-release

master# yum -y install jemalloc-devel openssl-devel ncurses-devel pam-devel libXmu-devel hwloc-devel hwloc hwloc-libs java-devel javacc ant-junit libdb-devel motif-devel csh ksh xterm db4-utils perl-XML-Simple perl-Env xorg-x11-fonts-ISO8859-1-100dpi xorg-x11-fonts-ISO8859-1-75dpi

master# groupadd -g 490 sgeadmin

master# useradd -u 495 -g 490 -r -m -d /home/sgeadmin -s /bin/bash -c "SGE Admin" sgeadmin

master# visudo

%sgeadmin ALL=(ALL) NOPASSWD: ALL


master# yum -y install ant

master# cd /BiO/src

master# wget https://arc.liv.ac.uk/downloads/SGE/releases/8.1.9/sge-8.1.9.tar.gz

master# tar zxvfp sge-8.1.9.tar.gz

master# cd sge-8.1.9/source/

master# sh scripts/bootstrap.sh && ./aimk && ./aimk man

master# export SGE_ROOT=/BiO/gridengine && mkdir $SGE_ROOT

master# echo Y | ./scripts/distinst -local -allall -libs -noexit

master# chown -R sgeadmin:sgeadmin /BiO/gridengine

master# cd $SGE_ROOT

master# vi config.conf

SGE_ROOT="/BiO/gridengine"

SGE_QMASTER_PORT="6444"

SGE_EXECD_PORT="6445"

SGE_ENABLE_SMF="false"

SGE_CLUSTER_NAME="cluster"

SGE_JMX_PORT=""

SGE_JMX_SSL="false"

SGE_JMX_SSL_CLIENT="false"

SGE_JMX_SSL_KEYSTORE=""

SGE_JMX_SSL_KEYSTORE_PW=""

SGE_JVM_LIB_PATH=""

SGE_ADDITIONAL_JVM_ARGS=""

CELL_NAME="default"

ADMIN_USER=sgeadmin

QMASTER_SPOOL_DIR=$SGE_ROOT/$CELL_NAME/spool/qmaster

EXECD_SPOOL_DIR=$SGE_ROOT/$CELL_NAME/default/spool

GID_RANGE="20000-20100"

SPOOLING_METHOD="classic"

DB_SPOOLING_DIR="$SGE_ROOT/$CELL_NAME/spool/spooldb"

PAR_EXECD_INST_COUNT="20"

ADMIN_HOST_LIST="qmaster"

SUBMIT_HOST_LIST="qmaster"

EXEC_HOST_LIST=""

EXECD_SPOOL_DIR_LOCAL=""

HOSTNAME_RESOLVING="true"

SHELL_NAME="ssh"

COPY_COMMAND="scp"

DEFAULT_DOMAIN="none"

ADMIN_MAIL="root"

ADD_TO_RC="true"

SET_FILE_PERMS="true"

RESCHEDULE_JOBS="wait"

SCHEDD_CONF="1"

SHADOW_HOST=""

EXEC_HOST_LIST_RM=""

REMOVE_RC="true"

WINDOWS_SUPPORT="false"

WIN_ADMIN_NAME="Administrator"

WIN_DOMAIN_ACCESS="false"

CSP_RECREATE="true"

CSP_COPY_CERTS="false"

CSP_COUNTRY_CODE="KR"

CSP_STATE="Daejeon"

CSP_LOCATION="YUSEONG-GU"

CSP_ORGA="KRIBB"

CSP_ORGA_UNIT="KOBIC"

CSP_MAIL_ADDRESS=isbyeon@kribb.re.kr


 

master# ./inst_sge -m -auto ./config.conf

master# cp default/common/settings.sh /etc/profile.d/

master# source /etc/profile

master# yum -y install nfs-utils

master# vi /etc/exports

/BiO 192.168.56.0/24(rw,no_root_squash)


master# systemctl start rpcbind nfs-server

master# systemctl enable rpcbind nfs-server

 

2. Add an administrative host

master# qconf -ah compute01

compute01.local added to administrative host list


 

3. SSH Public Key Authentication

master <=> compute01  // set up key-based SSH login in both directions: run ssh-keygen on each host, then ssh-copy-id to the other host

 

4. Install compute node

compute01# yum -y install hwloc-devel

compute01# hostnamectl set-hostname compute01.local

compute01# groupadd -g 490 sgeadmin

compute01# useradd -u 495 -g 490 -r -m -d /home/sgeadmin -s /bin/bash -c "SGE Admin" sgeadmin

compute01# yum -y install nfs-utils

compute01# systemctl start rpcbind && systemctl enable rpcbind

compute01# mkdir /BiO

compute01# mount -t nfs 192.168.56.101:/BiO /BiO

compute01# vi /etc/fstab

192.168.56.101:/BiO /BiO nfs defaults 0 0


compute01# echo '192.168.56.101 qmaster.local qmaster' >> /etc/hosts

compute01# echo '192.168.56.102 compute01.local compute01' >> /etc/hosts

compute01# export SGE_ROOT=/BiO/gridengine; export SGE_CELL=default

compute01# SGE_ARCH=`$SGE_ROOT/util/arch`; export SGE_ARCH

compute01# cd $SGE_ROOT

 

compute01# vi compute.conf

SGE_ROOT="/BiO/gridengine"

SGE_QMASTER_PORT="6444"

SGE_EXECD_PORT="6445"

SGE_ENABLE_SMF="false"

SGE_CLUSTER_NAME="cluster"

SGE_JMX_PORT=""

SGE_JMX_SSL="false"

SGE_JMX_SSL_CLIENT="false"

SGE_JMX_SSL_KEYSTORE=""

SGE_JMX_SSL_KEYSTORE_PW=""

SGE_JVM_LIB_PATH=""

SGE_ADDITIONAL_JVM_ARGS=""

CELL_NAME="default"

ADMIN_USER=sgeadmin

QMASTER_SPOOL_DIR=$SGE_ROOT/$CELL_NAME/spool/qmaster

EXECD_SPOOL_DIR=$SGE_ROOT/$CELL_NAME/default/spool

GID_RANGE="20000-20100"

SPOOLING_METHOD="classic"

DB_SPOOLING_DIR="$SGE_ROOT/$CELL_NAME/spool/spooldb"

PAR_EXECD_INST_COUNT="20"

ADMIN_HOST_LIST="qmaster"

SUBMIT_HOST_LIST="qmaster"

EXEC_HOST_LIST="compute01"

EXECD_SPOOL_DIR_LOCAL=""

HOSTNAME_RESOLVING="true"

SHELL_NAME="ssh"

COPY_COMMAND="scp"

DEFAULT_DOMAIN="none"

ADMIN_MAIL="root"

ADD_TO_RC="true"

SET_FILE_PERMS="true"

RESCHEDULE_JOBS="wait"

SCHEDD_CONF="1"

SHADOW_HOST=""

EXEC_HOST_LIST_RM=""

REMOVE_RC="true"

WINDOWS_SUPPORT="false"

WIN_ADMIN_NAME="Administrator"

WIN_DOMAIN_ACCESS="false"

CSP_RECREATE="true"

CSP_COPY_CERTS="false"

CSP_COUNTRY_CODE="KR"

CSP_STATE="Daejeon"

CSP_LOCATION="YUSEONG-GU"

CSP_ORGA="KRIBB"

CSP_ORGA_UNIT="KOBIC"

CSP_MAIL_ADDRESS=isbyeon@kribb.re.kr


compute01# ./inst_sge -x -auto ./compute.conf

compute01# cp /BiO/gridengine/default/common/settings.sh /etc/profile.d/

compute01# source /etc/profile

 

5. Removing an execution host

master# cd /BiO/gridengine

master# cp config.conf remove.conf

master# sed -i -e 's/EXEC_HOST_LIST_RM=\"\"/EXEC_HOST_LIST_RM=\"compute01.local\"/g' remove.conf

master# cat remove.conf | grep EXEC_HOST_LIST_RM

EXEC_HOST_LIST_RM="compute01.local"


master# ./inst_sge -ux -auto ./remove.conf

 

반응형

'HPC > Sun Grid Engine' 카테고리의 다른 글

[SGE] qlogin X11 forwarding  (0) 2016.10.13
[SGE] SGE 설치  (0) 2016.10.10
[SGE] GPU 사용 등록  (0) 2015.10.22
[SGE] Submitting jobs - Simple submission  (0) 2015.10.16
[SGE] Managing Resource Quotas  (0) 2013.07.16
  • 네이버 블로그 공유하기
  • 네이버 밴드에 공유하기
  • 페이스북 공유하기
  • 카카오스토리 공유하기