- 論壇徽章:
- 0
|
本帖最后由 嗜血的豬 于 2010-04-13 10:51 編輯
1
硬件:集群節點:12臺hs21 xm刀片,交換機,控制臺,管理節點IBM System x3650
軟件:系統rhel5.4 xcat2.3.3 下載地址 http://xcat.sourceforge.net/#download
2網絡ip設置:
管理節點IBM System x3650 eth1 192.168.1.111 eth0 10.10.10.1 hostname ibm_hs
刀片ip eth0 10.10.10.80------10.10.10.92
刀片中心ip 10.10.10.254
3管理節點IBM System x3650安裝
操作系統rhel5.4(系統安裝不再介紹)最好完全安裝防止后期麻煩。
4管理節點操作系統修改
4.1檢查你的操作系統,如果selinux為 enabled 需要執行下面例子程序。
[root@ibm_hs ~]# vi /etc/selinux/config
# This file controls the state of SELinux on the system.
# SELINUX= can take one of these three values:
# enforcing - SELinux security policy is enforced.
# permissive - SELinux prints warnings instead of enforcing.
# disabled - SELinux is fully disabled.
SELINUX=disabled
# SELINUXTYPE= type of policy in use. Possible values are:
# targeted - Only targeted network daemons are protected.
# strict - Full SELinux protection.
SELINUXTYPE=targeted
4.2刪除系統安裝包 tftp-server,OpenIPMI-tools
[root@ibm_hs ~]# rpm -qa | grep tftp-server
tftp-server-0.42-3.1
[root@ibm_hs ~]# rpm -qa | grep OpenIPMI-tools
OpenIPMI-tools-2.0.6-5.el5.4
[root@ibm_hs ~]# rpm -e tftp-server; rpm -e OpenIPMI-tools
5刀片中心設置
5.1找臺筆記本或其他機器連接到刀片中心。一般默認ip為192.168.70.125,用戶為USERID,密碼為PASSW0RD
Blade Tasks-->Configuration
這里修改blade名字為node1------node12
MM Control-->General Settings
下修改刀片中心名字為blademm
MM Control-->Network Interfaces
設置刀片中心ip為10.10.10.254
MM Control-->Security下激活ssh server
設置完成重啟BLADECENTER
5.2測試
通過管理節點執行下面命令,如果ssh配通會看到下面信息。(如果有錯誤比如ssh不能登錄可能需要升級mm的firmware。到ibm官網下載就好。)
[root@ibm_hs ~]# ssh USERID@10.10.10.254
password:
Hostname: blademm
Static IP address: 10.10.10.254
Burned-in MAC address: 00:14:5E:DF:84:F0
DHCP: Disabled - Use static IP configuration.
Last login: Wednesday March 18 2009 0:06 from 10.10.10.1 (Web)
system>
6xcat2.3部署
mkdir -p /root/xcat2
解壓所下載的文件
tar jxvf xcat-dep-2.4-200912091450.tar.bz2
tar jxvf xcat-core-2.3.3.tar.bz2
yum repository
掛載rhel5.4的DVD光盤到/root/xcat2/rhel5.4/,并在/etc/yum.repos.d/下創建文件:rhels5.4.repo,內容如下:
[rhels5.4]
name=Rhel Server 5.4
baseurl=file:///root/xcat2/rhel5.4/Server
enabled=1
gpgcheck=0
xCAT的repository文件:
cd /root/xcat2/xcat-dep/rh5/x86_64
./mklocalrepo.sh
cd /root/xcat2/xcat-core
./mklocalrepo.sh
yum install xCAT (根據提示y就行了)
安裝完成測試
[root@big ibm_hs]# /etc/init.d/xcatd status
xCAT service is running
修改/etc/hosts
10.10.10.254 blademm.hs21.com blademm
10.10.10.80 node1.hs21.com node1
10.10.10.81 node2.hs21.com node2
10.10.10.82 node3.hs21.com node3
10.10.10.83 node4.hs21.com node4
10.10.10.84 node5.hs21.com node5
10.10.10.85 node6.hs21.com node6
10.10.10.86 node7.hs21.com node7
10.10.10.87 node8.hs21.com node8
10.10.10.88 node9.hs21.com node9
10.10.10.89 node10.hs21.com node10
10.10.10.90 node11.hs21.com node11
10.10.10.91 node12.hs21.com node12
..................................待續
..................................繼續
設定root用戶profile
cd /etc/profile.d/
source ./xcat.sh
這個操作目的是設定xcat環境變量
[root@ibm_hs ~]# less /etc/profile.d/xcat.sh
XCATROOT=/opt/xcat
PATH=$PATH:$XCATROOT/bin:$XCATROOT/sbin
MANPATH=$MANPATH:$XCATROOT/share/man:
export XCATROOT PATH MANPATH
export PERL_BADLANG
驗證安裝
[root@ibm_hs~]# tabdump site
#key,value,comments,disable
"blademaxp","64",,
"fsptimeout","0",,
"installdir","/install",,
"ipmimaxp","64",,
"ipmiretries","3",,
"ipmitimeout","2",,
"consoleondemand","no",,
"master","10.10.10.1",,
"maxssh","8",,
"ppcmaxp","64",,
"ppcretry","3",,
"ppctimeout","0",,
"sharedtftp","1",,
"SNsyncfiledir","/var/xcat/syncfiles",,
"tftpdir","/tftpboot",,
"xcatdport","3001",,
"xcatiport","3002",,
"xcatconfdir","/etc/xcat",,
"timezone","Asia/Shanghai",,
"useNmapfromMN","no",,
"domain","hs21.com",,
"nameservers","10.10.10.1",,
"dhcpinterfaces","eth0",,
如果發現某些選項不對可以用tabedit site修改
用copycds命令拷貝鏡像到管理節點
例。
[root@ibm_hs iso]# ls
rhel-server-5.4-x86_64-dvd.iso
[root@ibm_hs iso]# pwd
/root/iso
[root@ibm_hs iso]# copycds -n rhels5.4 -a x86_64 /root/iso/rhel-server-5.4-x86_64-dvd.iso
Restoring the predefined xcat table
cd /opt/xcat/share/xcat/templates/e1350
for i in *csv; do tabrestore $i; done
對網絡配置表配置
[root@ibm_hs e1350]# chtab net=10.10.10.0 networks.nameservers=10.10.10.1
[root@ibm_hs e1350]# chtab net=10.10.10.0 networks.dynamicrange=10.10.10.80-10.10.10.92
[root@ibm_hs e1350]#tabdump networks (檢查你的設置)
dns設置
[root@ibm_hs iso]# less /etc/resolv.conf
search clusters.com
nameserver 127.0.0.1
#nameserver 10.10.10.1
[root@ibm_hs iso]#makedns
[root@ibm_hs iso]#service named restart
dns測試正確情況下會看到下面輸出
[root@ibm_hs iso]# host node1
node1.hs21.com has address 10.10.10.80
node1.hs21.com mail is handled by 10 node1.hs21.com.
[root@ibm_hs iso]# host node2
node2.hs21.com has address 10.10.10.81
node2.hs21.com mail is handled by 10 node2.hs21.com.
dhcp設置
[root@ibm_hs iso]# chtab net=10.10.10.0 networks.dhcpserver=10.10.10.1
[root@ibm_hs iso]# makedhcp -n
[root@ibm_hs iso]#service dhcpd start
TFTP設置
默認tftp文件在/tftpboot下
......................待續
[root@ibm_hs iso]# mknb x86_64
[root@ibm_hs iso]# service tftpd restart
定義bladecenter管理模塊
[root@ibm_hs iso]# nodeadd blademm groups=mm nodehm.mgt=blade mp.mpa=10.10.10.254
激活刀片管理模塊遠程控制 snmp和ssh
[root@ibm_hs iso]# ssh USERID@blademm users -T mm[1] -1 -at set
system> users -T mm[1] -1 -at set
如果返回ok證明你沒有問題。
[root@ibm_hs iso]# rspconfig mm snmpcfg=enable sshcfg=enable
blademm: SNMP enable: OK
blademm: SSH enable: OK
[root@ibm_hs iso]# rspconfig blademm pd1=redwoperf pd2=redwoperf
blademm: pd2: redwoperf
blademm: pd1: redwoperf
[root@ibm_hs iso]# rpower blademm reset
setup ssh key for Management Module
[root@ibm_hs iso]# rspconfig blademm snmpcfg=enable sshcfg=enable
blademm: SNMP enable: OK
blademm: SSH enable: OK
增加計算節點
[root@ibm_hs iso]#nodeadd node1-node12 groups=blade,compute mp.mpa=10.10.10.254 nodehm.power=blade nodehm.mgt=blade nodetype.os=rhels5.4 nodetype.arch=x86_64 nodetype.profile=compute nodetype.nodetype=osi noderes.nfsserver=ibm_hs.hs21.com noderes.netboot=pxe noderes.primarynic=eth0
通過rscan命令可以獲取刀片位置信息。例如
[root@ibm_hs ~]# rscan blademm
type name id type-model serial-number address
mm blademm 0 8852-4XC 99A8988 10.10.10.254
blade node1 1 7995-I3B 99A9226
blade node2 2 7995-I3B 99A9233
blade node3 3 7995-I3B 99A9232
blade node4 4 7995-I3B 99A9235
blade node5 5 7995-I3B 99A9227
blade node6 6 7995-I3B 99A9236
blade node7 7 7995-I3B 99A9228
blade node8 8 7995-I3B 99A9234
blade node9 9 7995-I3B 99A9229
blade node10 10 7995-I3B 99A9230
blade node11 11 7995-I3B 99A9231
blade node12 12 7995-I3B 99A9225
如果需要修改id值可以用nodech nodexx mp.id=xx
測試管理模塊
[root@ibm_hs ~]# rpower node1 stat
node1: off
[root@ibm_hs ~]# rpower node1 on
node1: on
[root@ibm_hs ~]# rpower node1 stat
node1: on
獲取mac地址
[root@ibm_hs ~]#getmacs node1-node12
[root@ibm_hs ~]#makedhcp -n (注意有些文檔用makedhcp --macs,請在這個版本xcat不要用這個方法)
[root@ibm_hs ~]#service dhcpd restart
[root@ibm_hs~]# tabdump mac
#node,interface,mac,comments,disable
"node1",,"00:1A:64:58:1A:72",,
"node10",,"00:1A:64:58:51:98",,
"node11",,"00:1A:64:58:5A:FE",,
"node12",,"00:1A:64:58:1E:A4",,
"node2",,"00:1A:64:58:55:2E",,
"node3",,"00:1A:64:58:60:56",,
"node4",,"00:1A:64:58:5A:98",,
"node5",,"00:1A:64:58:16:0A",,
"node6",,"00:1A:64:58:55:34",,
"node7",,"00:1A:64:58:1A:BA",,
"node8",,"00:1A:64:58:5C:84",,
"node9",,"00:1A:64:58:51:9E",,
準備安裝計算節點
調整刀片啟動順序
[root@ibm_hs~]# rbootseq node1-node12 list
node1: cdrom,hd0,floppy,net
.......
[root@ibm_hs~]# rbootseq node1-node12 n,h,c,f
node1: net,hd0,cdrom,floppy
......................
創建kickstart文件
[root@ibm_hs~]# nodeset node1-node12 install
node1: install rhels5.4-x86_64-compute
.....
開始安裝
[root@ibm_hs~]# rinstall node1
監控安裝
[root@ibm_hs~]# nodestat node1
node1: installing prep
[root@ibm_hs~]# tail -f /var/log/messages
到這里為止xcat集群就建立完成
(參照ibm官方文檔)如果對其他參數有興趣可以去ibm網站下載。
下面介紹torque maui在xcat中應用
待續。。。。。。。。。
torque安裝 |
|