728x90
반응형
패키지 설치
# apt install -y vim ssh git build-essential libhwloc-dev libssl-dev libtirpc-dev \
libmotif-dev libxext-dev libncurses-dev libdb5.3-dev libpam0g-dev pkgconf \
libsystemd-dev cmake gcc default-jdk qtchooser make gcc default-jdk qtchooser \
make gcc default-jdk qtchooser csh
# gcc --version
# make --version
사전 준비
# groupadd -g 490 sgeadmin
# useradd -u 495 -g 490 -r -m -d /home/sgeadmin -s /bin/bash -c "SGE Admin" sgeadmin
# visudo
# Members of the admin group may gain root privileges
%admin ALL=(ALL) ALL
%sgeadmin ALL=(ALL) NOPASSWD:ALL //추가
ctrl + x 로 나가기
# vim /etc/hosts
192.168.207.30 master-ubuntu-sge
192.168.207.31 node01-ubuntu-sge
...
빌드
# wget https://github.com/daimh/sge/archive/refs/tags/8.1.9.tar.gz
# tar zvxf 8.1.9.tar.gz
# export SGE_ROOT=/opt/sge
# export SGE_CELL=default
# mkdir -p $SGE_ROOT
# cd /APP/enhpc/sge-8.1.9/source
!! 주석 처리
# vim 3rdparty/qtcsh/sh.proc.c
51 //# define BSDWAIT
# sh scripts/bootstrap.sh -no-java -no-jni
# ./aimk -no-java -no-jni -no-secure
# echo Y | ./scripts/distinst -local -allall -libs -noexit
# ln -s /usr/bin/qmake /opt/sge/bin/lx-amd64/qmake
# chown -R sgeadmin: $SGE_ROOT
설치
# cd $SGE_ROOT
# chmod -t /tmp
# ./install_qmaster
- Cluster Name 설징 외에는 전부 default 값으로 설정(Enter)
Unique cluster name
-------------------
The cluster name uniquely identifies a specific Sun Grid Engine cluster.
The cluster name must be unique throughout your organization. The name
is not related to the SGE cell.
The cluster name must start with a letter ([A-Za-z]), followed by letters,
digits ([0-9]), dashes (-) or underscores (_).
Enter new cluster name or hit <RETURN>
to use default [p6444] >> estar987
./install_execd
chmod +t /tmp
cd ~
source /opt/sge/default/common/settings.sh
# qconf -mconf
수정
...
min_uid 0
min_gid 0
# qconf -as $HOSTNAME
master-ubuntu-sge added to submit host list
# echo “sleep 20” | qsub
# qstat -f
queuename qtype resv/used/tot. load_avg arch states
---------------------------------------------------------------------------------
all.q@master-ubuntu-sge BIP 0/0/12 2.33 lx-amd64
SGE 를 기본 스케줄러로 사용하기(.bashrc 등록)
# vi .bashrc
source /opt/sge/default/common/settings.sh //추가
# source .bashrc
# vi /etc/exports
/opt/sge *(rw,no_root_squash) // 추가
systemctl restart nfs-server.service
systemctl restart sgemaster.service
systemctl restart sgemaster.service
# qconf -ah node01-ubuntu-sge
node01-ubuntu-sge added to administrative host list
증설 노드에서 작업
# apt install -y libhwloc-dev nfs-client qtchooser
# vim /etc/hosts
192.168.207.30 master-ubuntu-sge
192.168.207.31 node01-ubuntu-sge
# groupadd -g 490 sgeadmin
# useradd -u 495 -g 490 -r -m -d /home/sgeadmin -s /bin/bash -c "SGE Admin" sgeadmin
# systemctl restart nfs-utils.service
# mkdir -p /opt/sge
# export SGE_ROOT=/opt/sge
# export SGE_CELL=default
# mkdir $SGE_ROOT
# mount -t nfs master-ubuntu-sge:/opt/sge /opt/sge
# df (확인)
# vim /etc/fstab
master-ubuntu-sge:/opt/sge /opt/sge nfs rw,soft,bg,vers=3 0 0 // 추가
# cd $SGE_ROOT
# ./install_execd
모두 default
마스터에서 확인
# qstat -f
queuename qtype resv/used/tot. load_avg arch states
---------------------------------------------------------------------------------
all.q@master-ubuntu-sge BIP 0/0/12 1.17 lx-amd64
---------------------------------------------------------------------------------
all.q@node01-ubuntu-sge BIP 0/0/12 3.12 lx-amd64
반응형
'HPC' 카테고리의 다른 글
[SLURM] SBATCH(1) (0) | 2024.09.06 |
---|---|
[SLURM] SRUN 명령어 (1) | 2024.09.05 |
Slurm 수동 설치 (0) | 2024.06.17 |
[Ubuntu]Munge Install (0) | 2024.06.16 |
HPE (Hewlett Packard Enterprise): 고성능 컴퓨팅의 선두 주자 (0) | 2024.06.11 |