Difference between revisions of "OpenHPC: Setup Intel Cluster Checker in OpenHPC"
Jump to navigation
Jump to search
| (15 intermediate revisions by 3 users not shown) | |||
| Line 1: | Line 1: | ||
* Packages used to be installable from the repo but Intel removed it - gah! Instructions below are for manual setup | * Packages used to be installable from the repo but Intel removed it - gah! Instructions below are for manual setup | ||
| + | * Updated License Key: CMD9-H9684BWD (July 19) | ||
| + | * CMD9-H9684BWD | ||
== Download/Install latest clck == | == Download/Install latest clck == | ||
* Check the intel registration centre for the latest version: https://registrationcenter.intel.com/ | * Check the intel registration centre for the latest version: https://registrationcenter.intel.com/ | ||
| + | * copies of the software also available on /home/david/software/intel_cluster_checker on the Boston headnode | ||
<syntaxhighlight> | <syntaxhighlight> | ||
wget http://registrationcenter-download.intel.com/akdlm/irc_nas/tec/9701/l_clck_p_2017.0.014.tgz | wget http://registrationcenter-download.intel.com/akdlm/irc_nas/tec/9701/l_clck_p_2017.0.014.tgz | ||
cd l_clck_p_2017.0.014 | cd l_clck_p_2017.0.014 | ||
| − | ./install.sh | + | ./install.sh 18 sept 2019 |
# step 1 serial number: enter CSKW-56T6M5ZD (valid to feb 2017) | # step 1 serial number: enter CSKW-56T6M5ZD (valid to feb 2017) | ||
# select components and installation params, default is fine. | # select components and installation params, default is fine. | ||
| + | # Or install in /opt/ohpc/pub/intel as an NFS install - then ignore below | ||
| + | |||
| + | # serial CMD9-R7B52SJR obtained | ||
# lets add rpms for the compute image | # lets add rpms for the compute image | ||
| Line 23: | Line 29: | ||
rmdir 2017.0.014/ | rmdir 2017.0.014/ | ||
ln -s 2017.0/ 2017.0.014 | ln -s 2017.0/ 2017.0.014 | ||
| + | |||
| + | # open up ports so the collect works | ||
| + | firewall-cmd --permanent --zone=internal --add-port=49152/tcp | ||
# and finally recreate the VNFS | # and finally recreate the VNFS | ||
| Line 51: | Line 60: | ||
# check memory bandwidth (-I is include_only) | # check memory bandwidth (-I is include_only) | ||
clck -f ./nodefile -I stream -v 5 | clck -f ./nodefile -I stream -v 5 | ||
| + | </syntaxhighlight> | ||
| + | |||
| + | == Using version 2.2 == | ||
| + | * This version provides us with the output we can use for acceptance test reporting | ||
| + | |||
| + | <syntaxhighlight> | ||
| + | # URL may change, check registration centre: | ||
| + | wget http://registrationcenter-download.intel.com/akdlm/irc_nas/tec/7754/l_clck_p_2.2.2.004.tgz | ||
| + | tar zxvf l_clck_p_2.2.2.004.tgz | ||
| + | cd l_clck_p_2.2.2.004 | ||
| + | ./install | ||
| + | # change the install dir to /opt/ohpc/pub/intel/clck/2.2.2.004 | ||
| + | |||
| + | # now lets add the runtimes: | ||
| + | wget http://registrationcenter-download.intel.com/akdlm/irc_nas/tec/3506/intel_cluster_runtimes_3.6-1.tgz | ||
| + | yum install lsb libstdc++.i686 | ||
| + | tar zxvf intel_cluster_runtimes_3.6-1.tgz | ||
| + | cd intel_cluster_runtimes_3.6-1 | ||
| + | ./install | ||
| + | |||
| + | # and again in the chroot | ||
| + | cp intel_cluster_runtimes_3.6-1.tgz /opt/ohpc/admin/images/centos7.2/root/scratch/ | ||
| + | chroot $CHROOT | ||
| + | cd root/scratch | ||
| + | yum install lsb libstdc++.i686 | ||
| + | tar zxvf intel_cluster_runtimes_3.6-1.tgz | ||
| + | cd intel_cluster_runtimes_3.6-1 | ||
| + | ./install | ||
| + | </syntaxhighlight> | ||
| + | |||
| + | * Then we need to setup the environment | ||
| + | <syntaxhighlight> | ||
| + | mkdir /etc/intel | ||
| + | mkdir /opt/ohpc/admin/images/centos7.2/etc/intel | ||
| + | echo "CLUSTER_READY_VERSION=1.3.1" > /etc/intel/icr | ||
| + | echo "CLUSTER_READY_VERSION=1.3.1" > /opt/ohpc/admin/images/centos7.2/etc/intel/icr | ||
| + | </syntaxhighlight> | ||
| + | |||
| + | * At this stage: <b>reboot / reinstall</b> nodes | ||
| + | |||
| + | == Create a hosts file == | ||
| + | You need to add a headnode to the hostsfile | ||
| + | <syntaxhighlight> | ||
| + | [biosit@fotres bin]$ cat nodefile | ||
| + | fotres #type: head | ||
| + | node01 | ||
| + | node02 | ||
| + | node03 | ||
| + | node04 | ||
| + | </syntaxhighlight> | ||
| + | |||
| + | == Create a hosts file and configuration file == | ||
| + | Add libraries location if you use different location | ||
| + | |||
| + | <syntaxhighlight> | ||
| + | export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/home/biosit/cluster_checker2.2/compiler/lib/intel64/ | ||
| + | |||
| + | # From OpenHPC, put in the ~/.bashrc of a standard user | ||
| + | export LD_LIBRARY_PATH=/opt/intel/composer_xe_2013_sp1.0.080/compiler/lib/intel64/:$LD_LIBRARY_PATH | ||
| + | source /opt/intel/clck/2.2.2.004/bin/clckvars.sh | ||
| + | source /opt/intel/impi/4.1.1.036/bin64/mpivars.sh | ||
| + | |||
| + | # Copy the default configuration file: | ||
| + | cp /opt/intel/clck/2.2.2.004/share/doc/intel-clck/defaults.xml ./cluster-conf.xml | ||
| + | </syntaxhighlight> | ||
| + | |||
| + | == Run Perf Checks for Version 2.2 == | ||
| + | <syntaxhighlight> | ||
| + | # Network / IMB | ||
| + | /opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only imb_pingpong --verbose 5 --debug | ||
| + | |||
| + | # Linpack CPU Floating | ||
| + | /opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only dgemm --verbose 5 --debug | ||
| + | |||
| + | # Stream | ||
| + | /opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only stream --verbose 5 --debug | ||
| + | |||
| + | # Disk Bandwidth | ||
| + | /opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only disk_bandwidth --verbose 5 --debug | ||
</syntaxhighlight> | </syntaxhighlight> | ||
Latest revision as of 14:18, 18 September 2019
- Packages used to be installable from the repo but Intel removed it - gah! Instructions below are for manual setup
- Updated License Key: CMD9-H9684BWD (July 19)
- CMD9-H9684BWD
Download/Install latest clck
- Check the intel registration centre for the latest version: https://registrationcenter.intel.com/
- Copies of the software are also available in /home/david/software/intel_cluster_checker on the Boston headnode
wget http://registrationcenter-download.intel.com/akdlm/irc_nas/tec/9701/l_clck_p_2017.0.014.tgz
cd l_clck_p_2017.0.014
./install.sh   # (note dated 18 Sept 2019)
# step 1 serial number: enter CSKW-56T6M5ZD (valid to feb 2017)
# select components and installation params, default is fine.
# Or install in /opt/ohpc/pub/intel as an NFS install - then ignore below
# serial CMD9-R7B52SJR obtained
# lets add rpms for the compute image
pwd
/root/scratch/l_clck_p_2017.0.014
rpm --root $CHROOT -ivh rpm/*rpm
# hack - need to make the dirs similar on compute / head. Must be something done by the install script rather than just the RPMs
chroot $CHROOT
cd /opt/intel/clck
mv 2017.0.014/* 2017.0/
rmdir 2017.0.014/
ln -s 2017.0/ 2017.0.014
# open up ports so the collect works
firewall-cmd --permanent --zone=internal --add-port=49152/tcp
# and finally recreate the VNFS
wwvnfs -y --chroot $CHROOT
Run the cluster checker tool
- Setup the environment
# source the vars
[boston@head1 clck_sanger]$ grep clck ~/.bashrc
source /opt/intel/clck_latest/bin/clckvars.sh
# create the nodefile
for i in {01..20}; do echo node${i} >> nodefile ; done
- Run for the first time
clck-collect -a -f nodefile # this takes a very long time!
clck-analyze -f nodefile
Run quick perf test
# check memory bandwidth (-I is include_only)
clck -f ./nodefile -I stream -v 5
Using version 2.2
- This version provides us with the output we can use for acceptance test reporting
# URL may change, check registration centre:
wget http://registrationcenter-download.intel.com/akdlm/irc_nas/tec/7754/l_clck_p_2.2.2.004.tgz
tar zxvf l_clck_p_2.2.2.004.tgz
cd l_clck_p_2.2.2.004
./install
# change the install dir to /opt/ohpc/pub/intel/clck/2.2.2.004
# now lets add the runtimes:
wget http://registrationcenter-download.intel.com/akdlm/irc_nas/tec/3506/intel_cluster_runtimes_3.6-1.tgz
yum install lsb libstdc++.i686
tar zxvf intel_cluster_runtimes_3.6-1.tgz
cd intel_cluster_runtimes_3.6-1
./install
# and again in the chroot
cp intel_cluster_runtimes_3.6-1.tgz /opt/ohpc/admin/images/centos7.2/root/scratch/
chroot $CHROOT
cd root/scratch
yum install lsb libstdc++.i686
tar zxvf intel_cluster_runtimes_3.6-1.tgz
cd intel_cluster_runtimes_3.6-1
./install
- Then we need to set up the environment
mkdir /etc/intel
mkdir /opt/ohpc/admin/images/centos7.2/etc/intel
echo "CLUSTER_READY_VERSION=1.3.1" > /etc/intel/icr
echo "CLUSTER_READY_VERSION=1.3.1" > /opt/ohpc/admin/images/centos7.2/etc/intel/icr
- At this stage: reboot / reinstall nodes
Create a hosts file
You need to add the head node to the hosts file (nodefile), marked with "#type: head":
[biosit@fotres bin]$ cat nodefile
fotres #type: head
node01
node02
node03
node04
Create a hosts file and configuration file
Add the library location to LD_LIBRARY_PATH if you installed to a different location
export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/home/biosit/cluster_checker2.2/compiler/lib/intel64/
# From OpenHPC, put in the ~/.bashrc of a standard user
export LD_LIBRARY_PATH=/opt/intel/composer_xe_2013_sp1.0.080/compiler/lib/intel64/:$LD_LIBRARY_PATH
source /opt/intel/clck/2.2.2.004/bin/clckvars.sh
source /opt/intel/impi/4.1.1.036/bin64/mpivars.sh
# Copy the default configuration file:
cp /opt/intel/clck/2.2.2.004/share/doc/intel-clck/defaults.xml ./cluster-conf.xml
Run Perf Checks for Version 2.2
# Network / IMB
/opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only imb_pingpong --verbose 5 --debug
# Linpack CPU Floating
/opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only dgemm --verbose 5 --debug
# Stream
/opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only stream --verbose 5 --debug
# Disk Bandwidth
/opt/ohpc/pub/intel/clck/2.2.2.004/clck/2.2.2.004/bin/clck -c ./cluster-conf.xml --include_only disk_bandwidth --verbose 5 --debug