XCAT_pLinux_Clusters

 xCAT Linux on IBM System P Clusters

11/12/2010, 10:35:04 AM

Introduction

This cookbook describes how to use xCAT 2 to install Linux on IBM Power Systems machines.

Power Systems machines have the following characteristics:

  • May have multiple LPARs (an LPAR will be the target machine to install an operating system image on, i.e. the LPAR will be the compute node).
  • The Ethernet card and SCSI disk can be virtual devices.
  • An HMC or IVM is used for the HCP (hardware control point).

xCAT supports two types of installation for compute nodes: diskful (stateful) and diskless (stateless). xCAT also supports hierarchical management clusters, where one or more service nodes handle the installation and management of compute nodes. Please refer to xCAT2SetupHierarchy.pdf for hierarchical usage.

Based on the two types of installation, the following installation scenarios will be described in this document:

  • Install a stateful compute node
  • Install a stateless compute node

To provide an easier understanding of the installation steps, this cookbook provides an example.

  • The management node:

    Arch: an LPAR on a p5/p6/p7 machine
    OS: Red Hat Enterprise Linux 5.2
    Hostname: pmanagenode
    IP: 192.168.0.1
    HCP: HMC

  • The management Network:

    Net: 192.168.0.0
    NetMask: 255.255.255.0
    Gateway: 192.168.0.1
    Cluster-face-IF: eth1
    dhcpserver: 192.168.0.1
    tftpserver: 192.168.0.1
    nameservers: 192.168.0.1

  • The compute nodes:

    Arch: an LPAR on a p5/p6/p7 machine
    OS: Red Hat Enterprise Linux 5.2
    HCP: HMC
    Hostname: pnode1 - this node will be installed stateful
    IP: 192.168.0.10
    Cluster-face-IF: eth0
    Hostname: pnode2 - this node will be installed stateless
    IP: 192.168.0.20
    Cluster-face-IF: eth0

  • The Hardware Control Point:

    Name: hmc1
    IP: 192.168.0.100

Install xCAT 2 on the Management node

Before proceeding to set up your pLinux cluster, you should first read the following for information on downloading and installing xCAT on your management node:

https://sourceforge.net/apps/mediawiki/xcat/index.php?title=Setting_Up_a_Linux_xCAT_Mgmt_Node

Some xCAT database tables will be used in the following chapters; for more details on the xCAT database tables, see the xcatdb man page.

Setup for P7 IH Cluster on xCAT MN

This section is an overview of the P7 IH support working with the xCAT EMS. The detailed implementation is described in the P7 IH cluster guide.

[P7_IH_Cluster_on_Linux_MN]

Setup the management node

[Power 5] Workaround the atftpd issue

The tftp client in the Open Firmware of Power5 machines is only compatible with tftp-server, not with the atftpd package required by xCAT 2. So remove atftpd first and then install tftp-server. This is not required for Power6 or later.

Remove atftp

Check which atftp rpms are installed (you could find one or both of atftp-xcat-* and atftp-*):

rpm -qa | grep atftp

Stop the tftp service and remove the rpms:

service tftpd stop
rpm --nodeps -e atftp-xcat atftp

Install the tftp server needed by xCAT, and restart it

[RH]:

yum install tftp-server.ppc

[SLES]:

zypper install tftp

Restart the tftp server

Note: make sure the entry "disable = no" is set in /etc/xinetd.d/tftp.

service xinetd restart
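For reference, a typical /etc/xinetd.d/tftp on a Red Hat system looks roughly like the following; the exact server_args and paths may differ on your distribution, and the key line for xCAT is "disable = no":

service tftp
{
        socket_type     = dgram
        protocol        = udp
        wait            = yes
        user            = root
        server          = /usr/sbin/in.tftpd
        server_args     = -s /tftpboot
        disable         = no
}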

Setup common attributes for xCAT in the database

The xCAT database table passwd contains the default userids and passwords that xCAT uses to access cluster components. This section describes how to set the default userids and passwords for the system and hmc keys in that table.

Add the default account for system

chtab key=system passwd.username=root passwd.password=cluster

Add the default account for hmc

chtab key=hmc passwd.username=hscroot passwd.password=abc123
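To verify the entries, you can dump the passwd table; the output should contain lines similar to the following (the exact column set may vary by xCAT release):

tabdump passwd
#key,username,password,cryptmethod,comments,disable
"system","root","cluster",,,
"hmc","hscroot","abc123",,,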

Note: The username and password that xCAT uses to access the HMCs can also be specified through the mkdef or chdef command; this is useful when specific HMCs use a different username and password from the defaults. For example:

mkdef -t node -o hmc1 groups=hmc,all nodetype=hmc mgt=hmc username=hscroot password=abc1234
chdef -t node -o hmc1 username=hscroot password=abc1234

Define the compute nodes

The definition of a node is stored in several tables of the xCAT database.

You can use the rscan command to discover the HCP and get the nodes managed by it. The discovered nodes can be stored in a stanza file. Edit the stanza file to keep the nodes you want to create, then use the mkdef command to create the node definitions.

Define the hardware control point for the nodes.

The following command will create an xCAT node definition for an HMC with a host name of hmc1. The groups, nodetype, mgt, username, and password attributes will be set.

mkdef -t node -o hmc1 groups=hmc,all nodetype=hmc mgt=hmc username=hscroot password=abc123

To change or add groups:

chdef -t node -o hmc1 groups=hmc,rack1,all

To verify your data:

lsdef -l hmc1
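The output should look roughly like the following (attribute order may vary):

Object name: hmc1
    groups=hmc,all
    mgt=hmc
    nodetype=hmc
    password=abc123
    username=hscroot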

If the xCAT management node is on the same service network as the HMC, you can discover the HMC and create an xCAT node definition for it automatically:

lsslp -w -s HMC

To check that the HMC name was added to the nodelist table:

tabdump nodelist

The lsslp command above discovers the HMCs and writes them into the xCAT database, but you still need to set each HMC's username and password:

chdef -t node -o <hmcname from lsslp> username=hscroot password=abc123

For more details on the hardware discovery feature in xCAT, please refer to:

http://xcat.svn.sourceforge.net/viewvc/xcat/xcat-core/trunk/xCAT-client/share/doc/xCAT2pHWManagement.pdf

Discover the LPARs managed by HMC using rscan

Run the rscan command to gather the LPAR information. This command can be used to display the LPAR information in several formats and can also write the LPAR information directly to the xCAT database. In this example we will use the "-z" option to create a stanza file that contains the information gathered by rscan as well as some default values that could be used for the node definitions.

To write the stanza format output of rscan to a file called "node.stanza", run the following command. For our example we assume the HMC name returned by lsslp was hmc1.

rscan -z hmc1 > node.stanza

This file can then be checked and modified as needed. For example you may need to add a different name for the node definition or add additional attributes and values.

Note: The stanza file will contain stanzas for things other than the LPARs. This information must also be defined in the xCAT database. The stanza file will repeat the same BPA information for multiple FSPs. It is not necessary to modify the non-LPAR stanzas in any way.

The stanza file will look something like the following.

Server-9117-MMA-SN10F6F3D:
objtype=node
nodetype=fsp
id=5
model=9118-575
serial=02013EB
hcp=hmc01
pprofile=
parent=Server-9458-10099201WM_A
groups=fsp,all
mgt=hmc
pnode1:
objtype=node
nodetype=lpar,osi
id=9
hcp=hmc1
pprofile=lpar9
parent=Server-9117-MMA-SN10F6F3D
groups=lpar,all
mgt=hmc
cons=hmc
pnode2:
objtype=node
nodetype=lpar,osi
id=7
hcp=hmc1
pprofile=lpar6
parent=Server-9117-MMA-SN10F6F3D
groups=lpar,all
mgt=hmc
cons=hmc

Note: The rscan command supports a "-w" option to automatically create node definitions in the xCAT database. In that case the LPAR name gathered by rscan is used as the node name and the command sets several default values. If you use the "-w" option, make sure the LPAR name is the name you want used as your node name.

For a node that was already defined correctly, you can use the "lsdef -z <nodename> > node.stanza" command to export the definition into node.stanza, edit the file as needed, and then use "cat node.stanza | chdef -z" to apply the updated definition.
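For example, using the node names from this cookbook, the round trip looks like this (a sketch; edit node.stanza between the two commands):

lsdef -z pnode1 > node.stanza
(edit node.stanza as needed)
cat node.stanza | chdef -z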

Define xCAT node using the stanza file

The information gathered by the rscan command can be used to create xCAT node definitions by running the following command:

cat node.stanza | mkdef -z

Verify the data:

lsdef -t node -l all

Define xCAT groups

See the section xCAT node group support in xCAT2top for more details on how to define xCAT groups. For the example below add the compute group to the nodes.

chdef -t node -o pnode1,pnode2 -p groups=compute

Update the attributes of the node

chdef -t node -o pnode1 netboot=yaboot tftpserver=192.168.0.1 nfsserver=192.168.0.1 monserver=192.168.0.1 xcatmaster=192.168.0.1 installnic="eth0" primarynic="eth0"

Note: Please make sure the "installnic" and "primarynic" attributes are set to the correct Ethernet interface of the compute node; otherwise the compute node installation may hang requesting information on an incorrect interface. The "installnic" and "primarynic" attributes can also be set to a MAC address if you are not sure about the Ethernet interface name; the MAC address can be obtained with the getmacs command. They can also be set to the keyword "mac", which means the network interface specified by the MAC address in the mac table will be used.

Make sure that the address used above ( 192.168.0.1) is the address of the Management Node as known by the node. Also make sure site.master has this address.

Check the site.master value

Make sure site.master is the address or name of the management node as known by the nodes.

To change site.master to this address:

chtab key=master site.value=192.168.0.1
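To verify the setting, dump the site table and check the master entry; the output should contain a line similar to:

tabdump site | grep master
"master","192.168.0.1",,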

Set the type attributes of the node

chdef -t node -o pnode1 os=<os> arch=ppc64 profile=compute

For valid options:

 tabdump -d nodetype

Set up customization scripts (optional)

xCAT supports the running of customization scripts on the nodes when they are installed. You can see what scripts xCAT will run by default by looking at the xcatdefaults entry in the xCAT postscripts database table. The postscripts attribute of the node definition can be used to specify the comma separated list of the scripts that you want to be executed on the nodes. The order of the scripts in the list determines the order in which they will be run.

For example, if you want to have your two scripts called foo and bar run on node node01 you could add them to the postscripts table:

chdef -t node -o node01 -p postscripts=foo,bar

(The -p flag means to add these to whatever is already set.)

For more information on creating and setting up postscripts, see:
[Postscripts_and_Prescripts]
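As a minimal sketch of a custom postscript, the hypothetical foo script below only writes a message to the node's syslog so you can confirm that it ran (NODE is one of the environment variables xCAT exports to postscripts):

vi /install/postscripts/foo
#!/bin/bash
# example only: record that this postscript ran on the node
logger -t xcat "postscript foo ran on $NODE"
chmod 755 /install/postscripts/foo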

Add NTP setup script (optional)

To enable the NTP services on the cluster, first configure NTP on the management node and start ntpd.

service ntpd start

Next set the ntpservers attribute in the site table. Whatever time servers are listed in this attribute will be used by all the nodes that boot directly from the management node. In our example, the Management Node will be used as the ntp server.

chdef -t site ntpservers=pmanagenode

To have xCAT automatically set up ntp on the cluster nodes you must add the setupntp script to the list of postscripts that are run on the nodes.

To do this you can either modify the postscripts attribute for each node individually or you can just modify the definition of a group that all the nodes belong to.

For example, if all your nodes belong to the group compute, then you could add setupntp to the group definition by running the following command.

 chdef -p -t group -o compute postscripts=setupntp

Setup Basic Services

A basic networks table was created for you during the xCAT install. Review that table and add additional networks based on your hardware configuration.

Setup the networks table

Create the networks that are used for cluster management:

mkdef -t network -o net1 net=192.168.0.0 mask=255.255.255.0 gateway=192.168.0.1 mgtifname=eth1 dhcpserver=192.168.0.1 tftpserver=192.168.0.1 nameservers=192.168.0.1
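To verify the network definition:

lsdef -t network -l net1
tabdump networks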

Setup Name Resolution

Set up /etc/hosts with entries for all your nodes, HMCs, FSPs, etc.

vi /etc/hosts
127.0.0.1  localhost
192.168.0.1 pmanagenode
192.168.0.10 pnode1
192.168.0.20 pnode2
192.168.0.100 hmc1
       .
       .
       .

Setup the nameserver

Add the following lines to /etc/resolv.conf:

vi /etc/resolv.conf
search cluster.net
nameserver 192.168.0.1

Setup the DNS attributes in the Site table

Setup the nameserver:

chdef -t site nameservers=192.168.0.1

Setup the external nameserver:

chdef -t site forwarders=9.112.4.1

Setup the local domain name:

chdef -t site domain=cluster.net

Setup DNS configuration

makedns
service named start
chkconfig --level 345 named on

Updating the DNS configuration

If you add nodes or update the networks table at a later time, then rerun makedns:

makedns
service named restart

Configure conserver

The xCAT rcons command uses the conserver package to provide support for multiple read-only consoles on a single node and for console logging. For example, if a user has a read-write console session open on node node1, other users can also log in to that console session on node1 as read-only users. This allows a console session to be shared between multiple users for diagnostic or other collaborative purposes. The console logging function logs the console output and activity for any node with remote console attributes set to the following file, which can be replayed for debugging or other purposes:

/var/log/consoles/<node name>

Note: conserver=<management node> is the default, so setting it explicitly is optional.

Update conserver configuration

Each xCAT node with remote console attributes set must be added to the conserver configuration file for rcons to work. The xCAT command makeconservercf puts all such nodes into the conserver configuration file /etc/conserver.cf. The makeconservercf command must be rerun whenever a node definition change affects conserver, such as adding new nodes, removing nodes, or changing a node's remote console settings.

To add or remove new nodes for conserver support:

makeconservercf
service conserver stop
service conserver start

Check rcons (rnetboot and getmacs depend on it)

The rnetboot and getmacs commands depend on conserver functions, so check that it is working:

rcons pnode1

If it works, you will get into the console of pnode1. If it does not work, review your rcons setup as documented in the previous steps.

Check hardware control setup to the nodes

To see if your setup is correct at this point, run rpower to check the node status:

rpower pnode1 stat
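If the hardware control path is working, rpower returns the power state of the LPAR; the output should look something like:

pnode1: Running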

Update the mac table with the address of the node(s)

Before running getmacs, make sure the node is powered off. The HMC has an issue where it cannot shut down Linux nodes that are in the running state.

Check the power state and, if the node is on, force the LPAR off:

rpower pnode1 stat
rpower pnode1 off

If there is only one Ethernet adapter on the node, or you have specified the installnic or primarynic attribute of the node, the following command will get the correct MAC address.

Check the *nic settings by running:

lsdef pnode1

To set installnic or primarynic:

chdef -t node -o pnode1 installnic=eth0 primarynic=eth0

Get mac addresses:

getmacs pnode1

However, if there is more than one Ethernet adapter on the node and you don't know which one has been configured for the installation process, or the LPAR was just created and has no active profile, or the LPAR is on a P5 system and has no LHEA/SEA Ethernet adapters, you have to specify additional parameters so that getmacs can find an available interface with a ping test:

getmacs pnode1 -D -S 192.168.0.1 -G 192.168.0.10

The output looks like the following:

pnode1:
Type Location Code MAC Address Full Path Name Ping Result Device Type
ent U9133.55A.10E093F-V4-C5-T1 f2:60:f0:00:40:05 /vdevice/l-lan@30000005 virtual

The MAC address will be written into the xCAT mac table. To verify, run:

tabdump mac
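The mac table should now contain a line similar to the following (using the MAC address from the getmacs example above):

#node,interface,mac,comments,disable
"pnode1",,"f2:60:f0:00:40:05",,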

Setup dhcp service

Setup the dhcp listen interfaces in site table

 chdef -t site dhcpinterfaces='pmanagenode|eth1'

[SLES] Check the installation of dhcp-server

On the SLES management node, the dhcp-server rpm may not have been automatically installed. Use the following command to check whether it is installed:

 rpm -qa | grep -E "^dhcp-server"

If it is not installed, install it manually:

 zypper install dhcp-server

Configure the DHCP

Add the relevant networks into the DHCP configuration:

 makedhcp -n

Add the defined nodes into the DHCP configuration:

 makedhcp -a

Restart the dhcp service:

 service dhcpd restart

Note: Please make sure there is only one dhcpd server serving these compute nodes.
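As a quick sanity check (the paths shown are Red Hat defaults and may differ on your distribution), confirm that dhcpd is running and that the node's entry was recorded; makedhcp normally adds the host entry to the dhcpd leases file:

service dhcpd status
grep pnode1 /var/lib/dhcpd/dhcpd.leases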

Install a Compute Node

Prepare the installation source

You can use the ISO file of the OS to extract the installation files. For example, if you have the ISO file /iso/RHEL5.2-Server-20080430.0-ppc-DVD.iso:

copycds /iso/RHEL5.2-Server-20080430.0-ppc-DVD.iso

Note: If the ISO cannot be mounted by the copycds command, make sure SELinux is disabled.
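When copycds completes, the installation files should be under /install/<os>/<arch>; for the example ISO above you can verify with:

ls /install/rhels5.2/ppc64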

Stateful Node installation

OS versus Platform

Before following the next installation steps, you need to understand the relationship between <os> and <platform>. <os> is the name of a specific operating system release, while <platform> is the family or platform that contains many operating systems; in other words, <platform> contains <os>.

For example, for Red Hat Enterprise Linux 6.0, rhels6 is the <os> and rh is the <platform>. For SuSE Linux Enterprise Server 11 SP1, sles11.1 is the <os> and sles is the <platform>.

Note: This naming convention is suitable for the installation of the Stateful/Stateless/Statelite Compute/Service nodes.

Customize the install profile

xCAT uses KickStart or AutoYaST installation templates and related installation scripts to complete the installation and configuration of the compute node.

You can find sample templates for common profiles in the following directory:

/opt/xcat/share/xcat/install/<platform>/

If you customize a template, copy it to the following directory:

/install/custom/install/<platform>/

Search order for installation templates

The profile, os, and arch of the node were set up in "Set the type attributes of the node" above.

To check your node's profile, os, and arch settings, run:

lsdef pnode1
Object name: pnode1
.
.
.
arch=ppc64
os=rhels5.5
profile=compute

For this example, the search order for the template file is as follows:

The directory /install/custom/install/<platform> will be searched first, and then /opt/xcat/share/xcat/install/<platform>.

Within the directory, the following order will be honored:

compute.rhels5.5.ppc64.tmpl
compute.rhels5.ppc64.tmpl
compute.rhels.ppc64.tmpl
compute.rhels5.5.tmpl
compute.rhels5.tmpl
compute.rhels.tmpl
compute.ppc64.tmpl
compute.tmpl

Customizing templates

If you want to customize a template for a node, copy the template to the /install/custom/install/<platform>/ directory and make your modifications there (or rename your copy). You need to copy it to the custom directory so that the next xCAT update will not wipe out your modifications, because updates refresh the /opt/xcat/share directory. Keep the search order above in mind to make sure your template is picked up.
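For example, for the Red Hat compute profile used in this cookbook (a sketch; pick whichever shipped template file from the search order above matches your node):

mkdir -p /install/custom/install/rh
cp /opt/xcat/share/xcat/install/rh/compute.tmpl /install/custom/install/rh/
vi /install/custom/install/rh/compute.tmpl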

Note: Sometimes the directory /opt/xcat/share/xcat/install/scripts also needs to be copied to /install/custom/install/ to make the customized profile work, because the customized profiles need to include the files in the scripts directory as prescripts and postscripts.

For example, if you need to install other packages, put the <profile>.otherpkgs.pkglist file into the /install/custom/install/<platform>/ directory.

Install other specific packages

If you want to install additional specific packages (rpms) onto the compute node, copy the rpms into the following directory:

/install/post/otherpkgs/<os>/<arch>

You MUST also create repodata for this directory. You can use the "createrepo" command to do this.

On RHEL5.x, the "createrepo" rpm package can be found in the install ISO; on SLES11, it can be found in SLE-11-SDK-DVD Media 1 ISO.

After "createrepo" is installed, you need to create one text file which contains the complete list of files to include in the repository. For example, the name of the text file is rpms.list in /install/post/otherpkgs/<os>/<arch> directory. Create rpms.list:

cd /install/post/otherpkgs/<os>/<arch>
ls *.rpm > rpms.list

Then, please run the following command to create the repodata for the newly-added packages:

createrepo -i rpms.list /install/post/otherpkgs/<os>/<arch>

The createrepo command with the -i rpms.list option creates the repository for the rpm packages listed in the rpms.list file. It will not destroy or affect rpm packages in the same directory that are already included in another repository.

Alternatively, if you create a subdirectory to contain the rpm packages, for example one named other under /install/post/otherpkgs/<os>/<arch>, run the following command to create the repodata for that directory:

createrepo /install/post/otherpkgs/<os>/<arch>/other

Note: Please replace other with your real directory name.
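Putting these steps together for the example cluster in this cookbook (Red Hat 5.2 on ppc64; the rpm names below are placeholders for whatever extra packages you want to install):

mkdir -p /install/post/otherpkgs/rhels5.2/ppc64
cp /tmp/myextra-*.rpm /install/post/otherpkgs/rhels5.2/ppc64
cd /install/post/otherpkgs/rhels5.2/ppc64
ls *.rpm > rpms.list
createrepo -i rpms.list /install/post/otherpkgs/rhels5.2/ppc64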

Set the node status to ready for installation

nodeset pnode1 install

Use network boot to start the installation

rnetboot pnode1

Check the installation results

After the node installation completes successfully, the node's status will change to booted. Use the following command to check the node's status:

lsdef pnode1 -i status

When the node's status has changed to booted, you can also check that the ssh service on the node is working and that you can log in without a password. Note: Do not run ssh or xdsh against the node until the node installation has completed successfully; doing so earlier may result in ssh host key issues.

If ssh is working but you cannot log in without a password, force an exchange of the ssh keys to the compute node using xdsh:

xdsh pnode1 -K

After exchanging the ssh keys, the following command should work without prompting for a password:

xdsh pnode1 date

Install a new Kernel on the nodes

Using a postinstall script (you could also use the updatenode method):

mkdir /install/postscripts/data
cp <kernel> /install/postscripts/data

Create the postscript updatekernel:

vi /install/postscripts/updatekernel
#!/bin/bash
rpm -Uvh data/kernel-*rpm
chmod 755 /install/postscripts/updatekernel

Add the script to the postscripts table and run the install:

chdef -p -t group -o compute postscripts=updatekernel
rinstall compute

Stateless node installation

Generate the stateless image for compute node

Typically, you build your stateless compute node image on the management node, if it has the same OS and architecture as the node. If you need an image for a different OS or architecture than the management node, you will need a machine that matches the OS and architecture you want for the image, and you must create the image on that node.

Make the compute node add/exclude packaging list

The default lists of rpms to add to or exclude from the diskless images are shipped in the following directory:

/opt/xcat/share/xcat/netboot/<platform>

If you want to modify the current defaults for *.pkglist, *.exlist, or *.postinstall, copy the shipped default files to the following directory, so your modifications will not be removed on the next xCAT rpm update. xCAT will look in the custom directory for these files before going to the share directory.

/install/custom/netboot/<platform>

If you want to exclude more packages, add them into the following exlist file:

/install/custom/netboot/<platform>/<profile>.exlist

Add more package names that need to be installed on the stateless node into the pkglist file:

/install/custom/netboot/<platform>/<profile>.pkglist
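For example, for the Red Hat stateless compute image in this cookbook (a sketch; the shipped file names may differ slightly between xCAT releases):

mkdir -p /install/custom/netboot/rh
cp /opt/xcat/share/xcat/netboot/rh/compute.pkglist /install/custom/netboot/rh/
cp /opt/xcat/share/xcat/netboot/rh/compute.exlist /install/custom/netboot/rh/
vi /install/custom/netboot/rh/compute.pkglist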

Setting up postinstall files

There are rules (release 2.4 or later) for which *.postinstall files will be selected to be used by genimage.

If you are going to make modifications, copy the appropriate /opt/xcat/share/xcat/netboot/<platform>/*postinstall file to the

/install/custom/netboot/<platform> directory:

cp /opt/xcat/share/xcat/netboot/<platform>/*postinstall /install/custom/netboot/<platform>/.

Use these basic rules to edit the correct file in the /install/custom/netboot/<platform> directory. The rules allow you to customize your image down to the profile, os, and architecture level, if needed.

You will find postinstall files of the following formats, and genimage will process them in this order:

<profile>.<os>.<arch>.postinstall
<profile>.<arch>.postinstall
<profile>.<os>.postinstall
<profile>.postinstall

This means, if "<profile>.<os>.<arch>.postinstall" is there, it will be used first.

  • If there is no such a file, then the "<profile>.<arch>.postinstall" file will be used.
  • If there's no such a file , then the "<profile>.<os>.postinstall" file will be used.
  • If there is no such file, then it will use "<profile>.postinstall".

Make sure you have the basic postinstall script set up in the directory for genimage to run. The shipped script sets up fstab and rcons to work properly and is required.

You can add more postinstall processing if you want. The basic postinstall script (2.4) is named <profile>.<arch>.postinstall (e.g. compute.ppc64.postinstall). You can create one for a specific os by copying the shipped one to, for example, compute.rhels5.4.ppc64.postinstall.

Note: you can use the sample here: /opt/xcat/share/xcat/netboot/<platform>/

[RH]:

Add the following package names to the <profile>.pkglist:

bash
nfs-utils
stunnel
dhclient
kernel
openssh-server
openssh-clients
busybox-anaconda
wget
vim-minimal
ntp

You can add any other packages that you want to install on your compute node. For example, if you want to have userids with passwords you should add the following:

cracklib
libuser
passwd

[SLES11]:

Add the following package names to the <profile>.pkglist:

aaa_base
bash
nfs-utils
dhcpcd
kernel
openssh
psmisc
wget
sysconfig
syslog-ng
klogd
vim

Run image generation

[RHEL]:

cd /opt/xcat/share/xcat/netboot/rh
./genimage -i eth0 -n ibmveth -o rhels5.2 -p compute

[SLES11]:

cd /opt/xcat/share/xcat/netboot/sles
./genimage -i eth0 -n ibmveth -o sles11 -p compute

Pack the image

[RHEL]:

packimage -o rhels5.2 -p compute -a ppc64

[SLES]:

packimage -o sles11 -p compute -a ppc64

Set the node status ready for network boot

nodeset pnode2 netboot

Use network boot to start the installation

rnetboot pnode2

Check the installation result

After the node installation completes successfully, the node's status will change to booted. Use the following command to check the node's status:

lsdef pnode2 -i status

When the node's status has changed to booted, you can also check that the ssh service on the node is working and that you can log in without a password.

Note: Do not run ssh or xdsh against the node until the node installation has completed successfully; doing so earlier may result in ssh host key issues.

If ssh is working but you cannot log in without a password, force an exchange of the ssh keys to the compute node using xdsh:

xdsh pnode2 -K

After exchanging the ssh keys, the following command should work without prompting for a password:

xdsh pnode2 date

Installing a new Kernel in the stateless image

Put your new kernel and kernel modules on the MN. If the new kernel is already installed on the MN, you can go directly to the genimage command below. More likely, the new kernel is not installed on the MN; in that case, copy the kernel into /boot and the modules into /lib/modules/<new kernel directory>, and genimage will pick them up from there. Assuming you have the kernel in RPM format in /tmp:

cd /tmp
rpm2cpio kernel-2.6.32.10-0.5.ppc64.rpm | cpio -idv ./boot/vmlinux-2.6.32.10-0.5-ppc64
cp ./boot/vmlinux-2.6.32.10-0.5-ppc64 /boot
rpm2cpio kernel-2.6.32.10-0.5.ppc64.rpm | cpio -idv './lib/modules/2.6.32.10-0.5-ppc64/*'
cp -r ./lib/modules/2.6.32.10-0.5-ppc64 /lib/modules

Run genimage/packimage to update the image with the new kernel:

genimage -i eth0 -n ibmveth -o sles11.1 -p compute -k 2.6.32.10-0.5-ppc64
packimage -o sles11.1 -p compute -a ppc64

Reboot the node with the new image:

nodeset pnode2 netboot
rnetboot pnode2

To show the new kernel, run:

xdsh pnode2 uname -a

Remove an image

If you want to remove an image, use rmimage to remove the Linux stateless or statelite image from the file system. It is better to use this command than to remove the file system yourself, because it also removes the associated links to real file systems that could otherwise be destroyed on your management node if you just used rm -rf.

You can specify the <os>, <arch>, and <profile> values to the rmimage command:

rmimage -o <os> -a <arch> -p <profile>

Or, you can specify an image name to the command:

rmimage <imagename>

Statelite Node installation

Please refer to the [XCAT_Linux_Statelite] documentation.

Firmware upgrade

Prepare for Firmware upgrade

Enable the HMC to allow remote ssh connections (only for P5/P6 with HMC).

[AIX]

Ensure that ssh is installed on the AIX xCAT management node. If you are using an AIX management node, make sure the value of "useSSHonAIX" is "yes" in the site table.

chtab key="useSSHonAIX" site.value=yes

Define the necessary attributes

The LPAR, CEC, or BPA must already be defined in the nodelist, nodehm, nodetype, vpd, and ppc tables.

Define the HMC as a node (only for P5/P6 with HMC)

Define the HMC as a node on the management node. For example,

chdef hmc01.clusters.com nodetype=hmc mgt=hmc groups=hmc username=hscroot password=abc123

Setup SSH connection to the HMC (only for P5/P6 with HMC)

Run the rspconfig command to set up and generate the ssh keys on the xCAT management node and transfer the public key to the HMC. You must also manually configure the HMC to allow remote ssh connections. For example:

rspconfig hmc01.clusters.com sshcfg=enable

Get the Microcode update package and associated XML file

Download the Microcode update package and associated XML file from the IBM Web site:

http://www14.software.ibm.com/webapp/set2/firmware/gjsn

Perform Firmware upgrade for CEC on P5/P6/P7

Define the CEC as a node on the management node

For P5/P6 (with HMC) and P7 (without HMC) node definitions, please refer to XCAT_System_p_Hardware_Management.

Check firmware level

rinv Server-m_tmp-SNs_tmp firm

Update the firmware

Download the Microcode update package and associated XML file from the IBM Web site:

http://www14.software.ibm.com/webapp/set2/firmware/gjsn

Create the /tmp/fw directory, if necessary, and copy the downloaded files to the /tmp/fw directory.

Run the rflash command with the --activate flag to specify the update mode and perform the updates. Please see the rflash man page for more information.

rflash Server-m_tmp-SNs_tmp -p /tmp/fw --activate disruptive

NOTE: You need to check whether your update is concurrent or disruptive here. Concurrent update is only supported for P5/P6 with HMC. Another command sample:

rflash Server-m_tmp-SNs_tmp -p /tmp/fw --activate concurrent

Notes:

1) If the noderange is the lpar group, the upgrade steps are the same as for the CEC.

2) System p5, p6, and p7 updates can take time to complete, and there is no visual indication that the command is proceeding.

Perform Firmware upgrades for BPA on P5/P6/P7

Define the BPA as a node on the Management Node

For P5/P6 (with HMC) and P7 (without HMC) node definitions, please refer to XCAT_System_p_Hardware_Management.

Use rinv to check the firmware level

rinv Server-m_tmps_tmp firm

See rinv manpage for more options.

Update the firmware

Download the Microcode update package and associated XML file from the IBM Web site:

http://www14.software.ibm.com/webapp/set2/firmware/gjsn

Create the /tmp/fw directory, if necessary, and copy the downloaded files to the /tmp/fw directory.

Run the rflash command with the --activate flag to specify the update mode to perform the updates.

rflash Server-m_tmps_tmp -p /tmp/fw --activate disruptive

NOTE: You need to check whether your update is concurrent or disruptive here. Concurrent update is only supported for P5/P6 with HMC. Another command sample:

rflash Server-m_tmps_tmp -p /tmp/fw --activate concurrent

Commit the currently activated LIC update (copy T to P) for a CEC/BPA on P5/P6/P7

Check firmware level

Refer to the environment setup in the section 'Perform Firmware upgrade for CEC on P5/P6/P7' to make sure the firmware version is correct.

Commit the firmware LIC

Run the rflash command with the --commit flag.

rflash Server-m_tmp-SNs_tmp --commit

Notes:

(1) If the noderange is an LPAR, the commit steps are the same as for the CEC.

(2) When the --commit or --recover flag is used, the noderange cannot be a BPA. It can only be a CEC or LPAR for P5/P6, and will take effect for both managed systems and power subsystems. It can be a frame or BPA for P7, and will take effect for power subsystems only.

Advanced features

Use the driver update disk:

Refer to [Using_Linux_Driver_Update_Disk].

Setup Kdump Service over Ethernet/HFI on diskless Linux (for xCAT 2.6 and higher)

Overview

Kdump is a kexec-based kernel crash dumping mechanism for Linux. Currently i386, x86_64, and ppc64 ports of kdump are available, and the mainstream distributions, including Fedora, Red Hat Enterprise Linux, and SuSE Linux Enterprise Server, ship the kdump rpm packages.

Update the .pkglist file

For RHELS6 and other Linux OSes, there are two rpm packages for kdump:

 kexec-tools, crash

Before creating the stateless/statelite Linux root images with kdump enabled, please add these two rpm packages into the <profile>.<os>.<arch>.pkglist file.

Update the "dump" attribute for the image

For Linux images, there is an attribute called dump, which defines the remote NFS path where the crash information is dumped.

The Format of the "dump" attribute

The dump attribute follows the standard URI format. Since currently only the NFS protocol is supported, its value should be set to:

 nfs://<nfs_server_ip>/<kdump_path>

If you intend to use the node's service node, or the management node if no service node is available, as the NFS server, you can omit the <nfs_server_ip> field and set the dump attribute like:

 nfs:///<kdump_path>

which treats the node's SN/MN as the NFS server for the kdump service.

Update the "dump" attribute

Based on <profile>, <os>, and <arch>, there should be definitions for two Linux images, one for diskless and one for statelite:

 <os>-<arch>-netboot-<profile>
 <os>-<arch>-statelite-<profile>

For the diskless image, set the dump attribute with the following command:

 chdef -t osimage <os>-<arch>-netboot-<profile> dump=nfs://<nfs_server_ip>/<kdump_path>

For example, if the image name is rhels6-ppc64-netboot-compute, the NFS server used for kdump is 10.1.0.1, and the path on the NFS server is /install/kdump, you can set the value with:

 chdef -t osimage rhels6-ppc64-netboot-compute dump=nfs://10.1.0.1/install/kdump
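You can verify the setting afterwards with:

 lsdef -t osimage rhels6-ppc64-netboot-compute -i dump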

For the statelite image, set the dump attribute with the following command:

 chdef -t osimage <os>-<arch>-statelite-<profile> dump=nfs://<nfs_server_ip>/<kdump_path>

Note: If there are no osimages called <os>-<arch>-netboot-<profile> or <os>-<arch>-statelite-<profile> in the linuximage table yet, update the dump attribute after the genimage command has been run.

Notes

Please make sure the NFS path (nfs://<nfs_server_ip>/<kdump_path>) specified for the dump attribute is writable. Once a kernel panic is triggered, the node will reboot into the capture kernel, and a kernel dump (vmcore) will automatically be saved to the <kdump_path>/var/crash/<node_ip>-<time>/ directory on the specified NFS server (<nfs_server_ip>). You do not need to create the /var/crash/ directory under the NFS path; it will be created by the kdump service when saving the crash information.

Edit litefile table (for statelite only)

This step is for statelite only.

For the statelite image, the /boot/ directory and the /etc/kdump.conf file should be added into the litefile table.

You can use the "tabedit litefile" command to update the litefile table. After they are added, there should be two new entries like the following:

 "ALL","/etc/kdump.conf",,,
 "ALL","/boot/",,,

Edit the .exlist file (for diskless only)

The <profile>.exlist file is located in the /opt/xcat/share/xcat/netboot/<platform>/ directory. Copy it to the /install/custom/netboot/<platform> directory, then edit the copy there. kdump needs to create a new initrd file in the /boot/ directory of the rootimg, so the line that contains "/boot*" should be removed from the <profile>.exlist file.

Add the "enablekdump" postscript for the node

To enable the kdump service for the specified node or node group, add the "enablekdump" postscript with the following command:

 chdef <noderange> -p postscripts=enablekdump

Generate rootimage for diskless/statelite

Please follow Stateless_node_installation to generate the diskless rootimg; and please follow Create_Statelite_Image to generate the statelite image.

The Remaining Steps

Please follow the xCAT_pLinux_Clusters and xCAT_Linux_Statelite documents to set up the diskless/statelite image and to boot the specified noderange with it.
