Operating system: CentOS 7.3
Torque PBS: torque-6.1.2.tar.gz
hostname: node1
user name: ding
显示当前主机名:
hostname
localhost.localdomain
修改主机名
hostnamectl set-hostname node1
如果是静态ip还需要修改/etc/hosts,在第一行指定ip和主机名
vim /etc/hosts
192.168.101.11 node1
cd /opt
mkdir torque
cd torque
wget http://wpfilebase.s3.amazonaws.com/torque/torque-6.1.2.tar.gz
tar -zxvf torque-6.1.2.tar.gz
cd torque-6.1.2
#安装关联的库
yum install libxml2-devel openssl-devel gcc gcc-c++ boost-devel libtool -y
./configure --prefix=/usr/local/torque --with-libxml2=/home/apps/software/torque/libxml2/bin/xml2-config --with-scp --with-default-server=node1
make -j
make install
make packages
libtool --finish /usr/local/torque/lib
如果 ./configure 报错找不到 libxml2,需要先单独编译安装 libxml2(以下步骤需在上面 torque 的 ./configure 之前完成,安装后回到 torque-6.1.2 目录重新执行 configure):
yum -y install python-devel
wget http://xmlsoft.org/sources/libxml2-2.9.12.tar.gz
tar xvf libxml2-2.9.12.tar.gz
cd libxml2-2.9.12
./configure --prefix=/home/apps/software/torque/libxml2
make -j
make install
vim ~/.bashrc
export PATH=/home/apps/software/torque/libxml2/bin:${PATH}
source ~/.bashrc
cp contrib/init.d/{pbs_{server,sched,mom},trqauthd} /etc/init.d/
for i in pbs_server pbs_sched pbs_mom trqauthd; do chkconfig --add $i; chkconfig $i on; done # 遇见y/n选择y回车继续
TORQUE=/usr/local/torque
echo "TORQUE=$TORQUE" >> /etc/profile
echo "export PATH=\$PATH:$TORQUE/bin:$TORQUE/sbin" >> /etc/profile
source /etc/profile
echo '/usr/local/torque/lib' > /etc/ld.so.conf.d/torque.conf
ldconfig
./torque.setup root
qterm #关闭服务
for i in pbs_server pbs_sched pbs_mom trqauthd; do service $i start; done
vi /var/spool/torque/server_priv/nodes
添加下面一行(node1 是主机名,注意等号前后不要有空格):
node1 np=64
vi /var/spool/torque/mom_priv/config
添加下面两行(node1 是主机名,参数名前需要带 $):
$pbsserver node1
$logevent 255
ps -e | grep pbs
11188 ? 00:00:00 pbs_sched
11215 ? 00:00:00 pbs_mom
29683 ? 00:00:00 pbs_server
for i in pbs_server pbs_sched pbs_mom trqauthd; do service $i restart; done
Restarting pbs_server (via systemctl): [ OK ]
Restarting pbs_sched (via systemctl): [ OK ]
Restarting pbs_mom (via systemctl): [ OK ]
Restarting trqauthd (via systemctl): [ OK ]
qmgr -c 'create queue node1'
qmgr -c 'set queue node1 queue_type= execution'
qmgr -c 'set queue node1 started= true'
qmgr -c 'set queue node1 enabled= true'
qmgr -c 'set queue node1 resources_default.walltime= 100000:00:00'
qmgr -c 'set queue node1 resources_default.nodes= 1'
qmgr -c 'set server default_queue= node1'
qnodes
node1
state = free
np = 64
ntype = cluster
status = rectime=1666147680,varattr=,jobs=,state=free,netload=2309658168,gres=,loadave=0.19,ncpus=64,physmem=263341876kb,availmem=319715372kb,totmem=327340848kb,idletime=67536,nusers=3,nsessions=15,sessions=5008 9869 9880 10108 10239 10914 14121 30121 42021 165356 110275 121818 121827 126549 127128,uname=Linux node1 3.10.0-1160.76.1.el7.x86_64 #1 SMP Wed Aug 10 16:21:17 UTC 2022 x86_64,opsys=linux
mom_service_port = 15002
mom_manager_port = 15003
su ding
echo sleep 2m | qsub
0.node1
qstat
Job ID Name User Time Use S Queue
------------------------- ---------------- --------------- -------- - -----
0.node1 STDIN ding 0 R node1