As described in the network topology tables and diagrams, configure the communication adapter ports in pairs, so that the devices with the same device ID (for example, ib0) are on the same subnet.
Administrative access is required on all DB2 member and CF hosts.
compat-dapl-1.2.19-0.5.1
compat-dapl-32bit-1.2.19-0.5.1
dapl-32bit-2.0.30-0.5.1
dapl-doc-2.0.30-0.5.1
dapl-2.0.30-0.5.1
ibutils-32bit-1.5.4-0.3.3
ibutils-1.5.4-0.3.3
infiniband-diags-1.5.7-0.3.2
libcxgb3-rdmav2-32bit-1.2.5-0.3.1
libcxgb3-rdmav2-1.2.5-0.3.1
libibcm-1.0.5-0.3.1
libibcm-32bit-1.0.5-0.3.1
libibcommon1-1.1.2_20090314-0.1.1
libibcommon1-32bit-1.1.2_20090314-0.1.1
libibmad5-1.3.6-0.3.1
libibmad5-32bit-1.3.6-0.3.1
libibumad3-1.3.6-0.3.1
libibumad3-32bit-1.3.6-0.3.1
libibverbs-1.1.4-0.3.1
libibverbs-32bit-1.1.4-0.3.1
libipathverbs-1.2-0.3.1
libipathverbs-32bit-1.2-0.3.1
libmlx4-rdmav2-1.0-5.21.1
libmlx4-rdmav2-32bit-1.0-5.21.1
libmthca-rdmav2-1.0.5-5.18.1
libmthca-rdmav2-32bit-1.0.5-5.18.1
libnes-rdmav2-1.1.0-0.3.1
librdmacm-1.0.13-0.3.1
librdmacm-32bit-1.0.13-0.3.1
libsdp-32bit-1.1.103-0.3.1
libsdp-1.1.103-0.3.1
mpi-selector-1.0.3-0.3.1
mstflint-1.4-2.25.1
ofed-doc-1.5.2-0.7.1
ofed-kmp-default-1.5.2_2.6.32.29_0.3-0.7.1
ofed-1.5.2-0.7.1
ofed-doc-1.5.2-0.7.1
ofed-kmp-default-1.5.2_2.6.32.29_0.3-0.7.1
opensm-32bit-3.3.7-0.5.1
opensm-3.3.7-0.5.1
ibvexdmtools-0.0.1-75.16.1
qlvnictools-0.0.1-75.16.1
sdpnetstat-1.60-5.22.1
srptools-0.0.4-6.8.2
yum groupinstall "OpenFabrics Enterprise Distribution"
yum groupinstall "InfiniBand Support"
# cd /tmp/iso
# ls -rlt
total 3354472
-rw-r--r-- 1 root root 3431618560 Jan 10 20:13 RHEL5.7-20100922.1-Server-x86_64-DVD1.iso
mount -o loop /tmp/iso/RHEL5.7-20100922.1-Server-x86_64-DVD1.iso /mnt/iso/
# cd repodata/
# ls -rlt
total 76180
-rw-r--r-- 1 root root 8032315 Jan 17 12:59 primary.xml.gz
-rw-r--r-- 1 root root 51522840 Jan 17 12:59 other.xml.gz
-rw-r--r-- 1 root root 18346363 Jan 17 12:59 filelists.xml.gz
-rw-r--r-- 1 root root 951 Jan 17 12:59 repomd.xml
# cd ..
# cd repodata/
# cat my.repo
[my repo]
name=Redhat LTC
baseurl=file:///mnt/
gpgcheck=0
enabled=1
[root@coralxib42 ~]# yum groupinstall 'Infiniband Support'
Loaded plugins: product-id, refresh-packagekit, rhnplugin, subscription-manager
Updating Red Hat repositories.
4/4
Setting up Group Process
Resolving Dependencies
--> Running transaction check
---> Package dapl.x86_64 0:2.0.25-5.2.el6 will be installed
---> Package ibsim.x86_64 0:0.5-4.el6 will be installed
---> Package ibutils.x86_64 0:1.5.4-3.el6 will be installed
--> Processing Dependency: libosmcomp.so.3(OSMCOMP_2.3)(64bit) for package: ibutils-1.5.4-3.el6.x86_64
--> Processing Dependency: libosmvendor.so.3(OSMVENDOR_2.0)(64bit) for package: ibutils-1.5.4-3.el6.x86_64
--> Processing Dependency: libopensm.so.2(OPENSM_1.5)(64bit) for package: ibutils-1.5.4-3.el6.x86_64
--> Processing Dependency: tk for package: ibutils-1.5.4-3.el6.x86_64
--> Processing Dependency: libosmcomp.so.3()(64bit) for package: ibutils-1.5.4-3.el6.x86_64
--> Processing Dependency: libosmvendor.so.3()(64bit) for package: ibutils-1.5.4-3.el6.x86_64
--> Processing Dependency: libopensm.so.2()(64bit) for package: ibutils-1.5.4-3.el6.x86_64
--> Processing Dependency: libibdmcom.so.1()(64bit) for package: ibutils-1.5.4-3.el6.x86_64
---> Package libcxgb3.x86_64 0:1.3.0-1.el6 will be installed
---> Package libibcm.x86_64 0:1.0.5-2.el6 will be installed
---> Package libibmad.x86_64 0:1.3.4-1.el6 will be installed
---> Package libibumad.x86_64 0:1.3.4-1.el6 will be installed
---> Package libibverbs.x86_64 0:1.1.4-4.el6 will be installed
---> Package libibverbs-utils.x86_64 0:1.1.4-4.el6 will be installed
---> Package libipathverbs.x86_64 0:1.2-2.el6 will be installed
---> Package libmlx4.x86_64 0:1.0.1-8.el6 will be installed
---> Package libmthca.x86_64 0:1.0.5-7.el6 will be installed
---> Package libnes.x86_64 0:1.1.1-1.el6 will be installed
---> Package librdmacm.x86_64 0:1.0.10-2.el6 will be installed
---> Package librdmacm-utils.x86_64 0:1.0.10-2.el6 will be installed
---> Package rdma.noarch 0:1.0-9.el6 will be installed
---> Package rds-tools.x86_64 0:2.0.4-3.el6 will be installed
--> Running transaction check
---> Package ibutils-libs.x86_64 0:1.5.4-3.el6 will be installed
---> Package opensm-libs.x86_64 0:3.3.5-1.el6 will be installed
---> Package tk.x86_64 1:8.5.7-5.el6 will be installed
--> Finished Dependency Resolution
Dependencies Resolved
====================================================================================
Package Arch Version Repository Size
====================================================================================
Installing:
dapl x86_64 2.0.25-5.2.el6 rhel-x86_64-server-6 143 k
ibsim x86_64 0.5-4.el6 rhel-x86_64-server-6 55 k
ibutils x86_64 1.5.4-3.el6 rhel-x86_64-server-6 1.0 M
libcxgb3 x86_64 1.3.0-1.el6 rhel-x86_64-server-6 16 k
libibcm x86_64 1.0.5-2.el6 rhel-x86_64-server-6 19 k
libibmad x86_64 1.3.4-1.el6 rhel-x86_64-server-6 52 k
libibumad x86_64 1.3.4-1.el6 rhel-x86_64-server-6 55 k
libibverbs x86_64 1.1.4-4.el6 rhel-x86_64-server-6 44 k
libibverbs-utils x86_64 1.1.4-4.el6 rhel-x86_64-server-6 34 k
libipathverbs x86_64 1.2-2.el6 rhel-x86_64-server-6 13 k
libmlx4 x86_64 1.0.1-8.el6 rhel-x86_64-server-6 27 k
libmthca x86_64 1.0.5-7.el6 rhel-x86_64-server-6 33 k
libnes x86_64 1.1.1-1.el6 rhel-x86_64-server-6 15 k
librdmacm x86_64 1.0.10-2.el6 rhel-x86_64-server-6 22 k
librdmacm-utils x86_64 1.0.10-2.el6 rhel-x86_64-server-6 27 k
rdma noarch 1.0-9.el6 rhel-x86_64-server-6 16 k
rds-tools x86_64 2.0.4-3.el6 rhel-x86_64-server-6 55 k
Installing for dependencies:
ibutils-libs x86_64 1.5.4-3.el6 rhel-x86_64-server-6 924 k
opensm-libs x86_64 3.3.5-1.el6 rhel-x86_64-server-6 53 k
tk x86_64 1:8.5.7-5.el6 rhel-x86_64-server-6 1.4 M
Transaction Summary
=====================================================================================
Install 20 Package(s)
Total download size: 4.0 M
Installed size: 0
Is this ok [y/N]:
cat /etc/dat.conf
ofa-v2-ib0 u2.0 nonthreadsafe default libdaplofa.so.2 dapl.2.0 "ib0 0" ""
ofa-v2-ib1 u2.0 nonthreadsafe default libdaplofa.so.2 dapl.2.0 "ib1 0" ""
ofa-v2-ib2 u2.0 nonthreadsafe default libdaplofa.so.2 dapl.2.0 "ib2 0" ""
ofa-v2-ib3 u2.0 nonthreadsafe default libdaplofa.so.2 dapl.2.0 "ib3 0" ""
ssh cf1 cat /etc/sysconfig/network/ifcfg-ib0
DEVICE=ib0
BOOTPROTO='static'
IPADDR='10.222.0.1'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh cf1 cat /etc/sysconfig/network/ifcfg-ib1
DEVICE=ib1
BOOTPROTO='static'
IPADDR='10.222.1.1'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh cf1 cat /etc/sysconfig/network/ifcfg-ib2
DEVICE=ib2
BOOTPROTO='static'
IPADDR='10.222.2.1'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh cf1 cat /etc/sysconfig/network/ifcfg-ib3
DEVICE=ib3
BOOTPROTO='static'
IPADDR='10.222.3.1'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh cf2 cat /etc/sysconfig/network/ifcfg-ib0
DEVICE=ib0
BOOTPROTO='static'
IPADDR='10.222.0.2'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh cf2 cat /etc/sysconfig/network/ifcfg-ib1
DEVICE=ib1
BOOTPROTO='static'
IPADDR='10.222.1.2'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh cf2 cat /etc/sysconfig/network/ifcfg-ib2
DEVICE=ib2
BOOTPROTO='static'
IPADDR='10.222.2.2'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh cf2 cat /etc/sysconfig/network/ifcfg-ib3
DEVICE=ib3
BOOTPROTO='static'
IPADDR='10.222.3.2'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh member1 cat /etc/sysconfig/network/ifcfg-ib0
DEVICE=ib0
BOOTPROTO='static'
IPADDR='10.222.0.101'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh member2 cat /etc/sysconfig/network/ifcfg-ib0
DEVICE=ib0
BOOTPROTO='static'
IPADDR='10.222.0.102'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh member3 cat /etc/sysconfig/network/ifcfg-ib0
DEVICE=ib0
BOOTPROTO='static'
IPADDR='10.222.0.103'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
ssh member4 cat /etc/sysconfig/network/ifcfg-ib0
DEVICE=ib0
BOOTPROTO='static'
IPADDR='10.222.0.104'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
cat /etc/sysconfig/network/ifcfg-ib0
DEVICE=ib0
BOOTPROTO='static'
IPADDR='10.1.1.161'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
cat /etc/sysconfig/network/ifcfg-ib1
DEVICE=ib1
BOOTPROTO='static'
IPADDR='10.1.2.161'
NETMASK='255.255.255.0'
STARTMODE='onboot'
WIRELESS='no'
All members must be on an IP subnet used by the CF adapter interfaces. The resulting IP subnets are:
chkconfig opensmd on
service opensmd start
The /etc/hosts file must have this format: <IP_Address> <fully_qualified_name> <short_name>. All hosts in the cluster must have the same /etc/hosts format.
For example, in a planned DB2 pureScale environment with four members and multiple communication adapter ports on the CFs, the /etc/hosts configuration file might resemble the following file:
10.222.0.1 cf1-ib0.example.com cf1-ib0
10.222.1.1 cf1-ib1.example.com cf1-ib1
10.222.2.1 cf1-ib2.example.com cf1-ib2
10.222.3.1 cf1-ib3.example.com cf1-ib3
10.222.0.2 cf2-ib0.example.com cf2-ib0
10.222.1.2 cf2-ib1.example.com cf2-ib1
10.222.2.2 cf2-ib2.example.com cf2-ib2
10.222.3.2 cf2-ib3.example.com cf2-ib3
10.222.0.101 member1-ib0.example.com member1-ib0
10.222.1.101 member1-ib1.example.com member1-ib1
10.222.0.102 member2-ib0.example.com member2-ib0
10.222.1.102 member2-ib1.example.com member2-ib1
10.222.0.103 member3-ib0.example.com member3-ib0
10.222.1.103 member3-ib1.example.com member3-ib1
10.222.0.104 member4-ib0.example.com member4-ib0
10.222.1.104 member4-ib1.example.com member4-ib1
service openibd restart
On RHEL 6.1:
service rdma restart
ibstatus
Infiniband device 'mlx4_0' port 1 status:
default gid: fe80:0000:0000:0000:0002:c903:0007:eafb
base lid: 0x2
sm lid: 0x1
state: 4: ACTIVE
phys state: 5: LinkUp
rate: 20 Gb/sec (4X DDR)
Infiniband device 'mlx4_0' port 2 status:
default gid: fe80:0000:0000:0000:0002:c903:0007:eafc
base lid: 0x3
sm lid: 0x1
state: 4: ACTIVE
phys state: 5: LinkUp
rate: 20 Gb/sec (4X DDR)
ofa-v2-ib0 u2.0 nonthreadsafe default libdaplofa.so.2 dapl.2.0 "ib0 0" ""
# ip -resolve neigh
coralxib44-ib3 dev ib3 lladdr 80:00:00:49:fe:80:00:00:00:00:00:00:00:02:c9:03:00:0e:9d:5e REACHABLE
coralxib42.torolab.ibm.com dev bond0 lladdr 00:1a:64:c9:d1:e8 REACHABLE
coralxib42-ib0 dev ib0 lladdr 80:00:00:48:fe:80:00:00:00:00:00:00:00:02:c9:03:00:07:ea:5f REACHABLE
coralxib44-ib0 dev ib0 lladdr 80:00:00:48:fe:80:00:00:00:00:00:00:00:02:c9:03:00:07:eb:13 REACHABLE
9.26.120.1 dev bond0 lladdr 00:00:0c:07:ac:01 REACHABLE
coralxib43.torolab.ibm.com dev bond0 lladdr 00:1a:64:c9:cc:d4 REACHABLE
coralxib44-ib2 dev ib2 lladdr 80:00:00:48:fe:80:00:00:00:00:00:00:00:02:c9:03:00:0e:9d:5d REACHABLE
coralxib44.torolab.ibm.com dev bond0 lladdr 00:1a:64:c9:d5:24 REACHABLE
coralxib44-ib1 dev ib1 lladdr 80:00:00:49:fe:80:00:00:00:00:00:00:00:02:c9:03:00:07:eb:14 REACHABLE
coralxib43-ib0 dev ib0 lladdr 80:14:00:48:fe:80:00:00:00:00:00:00:00:02:c9:03:00:07:ea:07 REACHABLE
# arp -an
? (10.1.4.144) at 80:00:00:49:fe:80:00:00:00 [infiniband] on ib3
? (9.26.120.241) at 00:1a:64:c9:d1:e8 [ether] on bond0
? (10.1.1.142) at 80:00:00:48:fe:80:00:00:00 [infiniband] on ib0
? (10.1.1.144) at 80:00:00:48:fe:80:00:00:00 [infiniband] on ib0
? (9.26.120.1) at 00:00:0c:07:ac:01 [ether] on bond0
? (9.26.120.103) at 00:1a:64:c9:cc:d4 [ether] on bond0
? (10.1.2.144) at 80:00:00:48:fe:80:00:00:00 [infiniband] on ib2
? (9.26.120.104) at 00:1a:64:c9:d5:24 [ether] on bond0
? (10.1.3.144) at 80:00:00:49:fe:80:00:00:00 [infiniband] on ib1
? (10.1.1.143) at 80:14:00:48:fe:80:00:00:00 [infiniband] on ib0
Modify the kernel parameters of hosts that you plan to include in the DB2 pureScale environment.