Monday, 25 July 2016

PBS PRO Scheduler Configuration:

PBS PRO Scheduler application Configuration:

How to add new application on nodes


Below is the command to change the existing configuration, see here on node1.example.com (compute node1) only two applications are allowed to run jobs that is Abaqus & Dyna_MPP.

Now the requirement is user wants to run Pamcrash application on node1.autoliv.int, For enabling that please follow the below steps

BEFORE ADDING APPLICATION

#pbsnode -a
node1.example.com
     Mom = node1.example.com
     Port = 15002
     pbs_version = PBSPro_13.1.0.160576
     ntype = PBS
     state = free
     pcpus = 32
     resources_available.arch = linux
     resources_available.host = node1
     resources_available.mem = 132279240kb
     resources_available.ncpus = 32
     resources_available.pas_applications_enabled = Abaqus,Dyna_Mpp
     resources_available.vnode = node1.example.com
     resources_assigned.accelerator_memory = 0kb
     resources_assigned.mem = 0kb
     resources_assigned.naccelerators = 0
     resources_assigned.ncpus = 0
     resources_assigned.netwins = 0
     resources_assigned.ngpus = 0
     resources_assigned.vmem = 0kb
     resv_enable = True
     sharing = default_shared

ADDING NEW APPLICATION ON NODE (node1.example.com is a hostname of that node)

 # qmgr
Max open servers: 49
Qmgr: set node node1.example.com resources_available.pas_applications_enabled+=Pamcrash
AFTER ADDING APPLICATION
#pbsnode –a
node1.example.com
     Mom = node1.example.com
     Port = 15002
     pbs_version = PBSPro_13.1.0.160576
     ntype = PBS
     state = free
     pcpus = 32
     resources_available.arch = linux
     resources_available.host = node1
     resources_available.mem = 132279240kb
     resources_available.ncpus = 32
     resources_available.pas_applications_enabled = Abaqus,Dyna_Mpp,Pamcrash
     resources_available.vnode = node1.example.com
     resources_assigned.accelerator_memory = 0kb
     resources_assigned.mem = 0kb
     resources_assigned.naccelerators = 0
     resources_assigned.ncpus = 0
     resources_assigned.netwins = 0
     resources_assigned.ngpus = 0
     resources_assigned.vmem = 0kb
     resv_enable = True

     sharing = default_shared

Tuesday, 12 July 2016

-bash: fork: Cannot allocate memory in RHEL 6/CentOS 6

-bash: fork: Cannot allocate memory in Red Hat Enterprise Linux 6 (or) CentOS 6

Solution:-
This problem is caused because of Process Identifiers Limit, Increasing the value will help on large Linux system or clusters to ease process identification and process management, So that we can avoid this kind error “-bash: fork: Cannot allocate memory”

If you want to check current value execute this command

# cat /proc/sys/kernel/pid_max
32768

(OR)

# sysctl kernel.pid_max
kernel.pid_max = 32768

So I am going to increase this value to 65534.

# echo kernel.pid_max = 65534 >> /etc/sysctl.conf

To configure kernel parameters at runtime use sysctl command

# sysctl –p

{Note: p option is used to load sysctl setting from the file      /etc/sysctl.conf }



Wednesday, 29 June 2016

Domain Name System (DNS) Configuration in Centos 6/RHEL 6

See in this post we are going to see how to configure DNS 

First we should know what is DNS ...??

DNS is also called as Domain Name Service (DNS) , DNS is the Application layer protocol in internet protocol suite.
DNS is used for naming services also it resolves Forward and Reverse Lookup.
Forward Lookup = Domain Name to find an IP Address
Reverse Lookup = IP Address to find a Domain Name
An Internet facility that lets you do either forward or reverse DNS lookup yourself is called nslookup.
DNS PORT NO = 53
Domain name= example.org
Server IP Address = 192.168.40.120/24
Server Hostname = server.tn.example.org
Client IP Address = 192.168.40.125/24
Client Hostname = client.tn.example.org

Server Side Configuration:-

Install BIND Package 


[root@server ~]# yum install bind bind-utils –y

[root@server ~]# vim /etc/named.conf
//
// named.conf
//
// Provided by Red Hat bind package to configure the ISC BIND named(8) DNS
// server as a caching only nameserver (as a localhost DNS resolver only).
//
// See /usr/share/doc/bind*/sample/ for example named configuration files.
//

options {
listen-on port 53 { 127.0.0.1; 192.168.40.120; };
listen-on-v6 port 53 { ::1; };
directory "/var/named";
dump-file "/var/named/data/cache_dump.db";
        statistics-file "/var/named/data/named_stats.txt";
        memstatistics-file "/var/named/data/named_mem_stats.txt";
allow-query     { localhost; 192.168.40.0/24; };
allow-transfer{ localhost; 192.168.40.0/24; };
recursion yes;
dnssec-enable yes;
dnssec-validation yes;
dnssec-lookaside auto;
/* Path to ISC DLV key */
bindkeys-file "/etc/named.iscdlv.key";
managed-keys-directory "/var/named/dynamic";
};
logging {
        channel default_debug {
                file "data/named.run";
                severity dynamic;
        };
};
zone "." IN {
type hint;
file "named.ca";
};
zone"example.org" IN {
type master;
file "forward.example";
allow-update { none; };
};
zone"40.168.192.in-addr.arpa" IN {
type master;
file "reverse.example";
allow-update { none; };
};
include "/etc/named.rfc1912.zones";
include "/etc/named.root.key";

Create forward.example & reverse.example files under the directory /var/named

[root@server ~]# vim /var/named/forward.example
$TTL 86400
@   IN  SOA     server.tn.example.org. root.example.org. (
        2011071001  ;Serial
        3600        ;Refresh
        1800        ;Retry
        604800      ;Expire
        86400       ;Minimum TTL
)
@       IN  NS          server.tn.example.org.
@       IN  A           192.168.40.120
@       IN  A           192.168.40.125
server.tn       IN  A   192.168.40.120
client.tn       IN  A   192.168.40.125

[root@server ~]# vim /var/named/reverse.example
$TTL 86400
@   IN  SOA     server.tn.example.org. root.example.org. (
        2011071001  ;Serial
        3600        ;Refresh
        1800        ;Retry
        604800      ;Expire
        86400       ;Minimum TTL
)
@       IN  NS          server.tn.example.org.
@       IN  PTR         example.org.
server.tn       IN  A   192.168.40.120
client.tn       IN  A   192.168.40.125
120     IN  PTR         server.tn.example.org.
125     IN  PTR         client.tn.example.org.
[root@server ~]# /etc/init.d/named start
Starting named:                                            [  OK  ]
[root@server ~]# /etc/init.d/named status
version: 9.8.2rc1-RedHat-9.8.2-0.37.rc1.el6
CPUs found: 1
worker threads: 1
number of zones: 21
debug level: 0
xfers running: 0
xfers deferred: 0
soa queries in progress: 0
query logging is OFF
recursive clients: 0/0/1000
tcp clients: 0/100
server is up and running
named (pid  3834) is running...

[root@server ~]# chkconfig named on

Add iptables rule for allowing dns port
[root@server ~]# iptables -A INPUT -p tcp --dport 53 -s 0.0.0.0/0.0.0.0 -j ACCEPT
[root@server ~]# iptables -A INPUT -p udp --dport 53 -s 0.0.0.0/0.0.0.0 -j ACCEPT
[root@server ~]# service iptables save
iptables: Saving firewall rules to /etc/sysconfig/iptables:[  OK  ]
[root@server ~]# service iptables restart
iptables: Setting chains to policy ACCEPT: filter          [  OK  ]
iptables: Flushing firewall rules:                         [  OK  ]
iptables: Unloading modules:                               [  OK  ]
iptables: Applying firewall rules:                         [  OK  ]

you can test DNS server using dig and nslookup commands

[root@server ~]# dig server.tn.example.org

; <<>> DiG 9.8.2rc1-RedHat-9.8.2-0.37.rc1.el6 <<>> server.tn.example.org
;; global options: +cmd
;; Got answer:
;; ->>HEADER<<- opcode: QUERY, status: NOERROR, id: 7617
;; flags: qr aa rd ra; QUERY: 1, ANSWER: 1, AUTHORITY: 1, ADDITIONAL: 0

;; QUESTION SECTION:
;server.tn.example.org.         IN      A

;; ANSWER SECTION:
server.tn.example.org.  86400   IN      A       192.168.40.120

;; AUTHORITY SECTION:
example.org.            86400   IN      NS      server.tn.example.org.

;; Query time: 0 msec
;; SERVER: 127.0.0.1#53(127.0.0.1)
;; WHEN: Wed Jun 29 16:07:55 2016
;; MSG SIZE  rcvd: 69

nslookup is a command is used to query name servers

[root@server ~]# nslookup example.org
Server:         127.0.0.1
Address:        127.0.0.1#53

Name:   example.org
Address: 192.168.40.125
Name:   example.org
Address: 192.168.40.120


Client Side Configuration:-

Add DNS server details in resolv.conf in client machine.
[root@client ~]# vim /etc/resolv.conf
; generated by /sbin/dhclient-script
search example.org
nameserver 192.168.40.120
[root@client ~]# dig server.tn.example.org

; <<>> DiG 9.8.2rc1-RedHat-9.8.2-0.37.rc1.el6 <<>> server.tn.example.org
;; global options: +cmd
;; Got answer:
;; ->>HEADER<<- opcode: QUERY, status: NOERROR, id: 27640
;; flags: qr aa rd ra; QUERY: 1, ANSWER: 1, AUTHORITY: 1, ADDITIONAL: 0

;; QUESTION SECTION:
;server.tn.example.org.         IN      A

;; ANSWER SECTION:
server.tn.example.org.  86400   IN      A       192.168.40.120

;; AUTHORITY SECTION:
example.org.            86400   IN      NS      server.tn.example.org.

;; Query time: 2 msec
;; SERVER: 192.168.40.120#53(192.168.40.120)
;; WHEN: Wed Jun 29 22:23:52 2016
;; MSG SIZE  rcvd: 69

[root@client ~]# dig client.tn.example.org

; <<>> DiG 9.8.2rc1-RedHat-9.8.2-0.37.rc1.el6 <<>> client.tn.example.org
;; global options: +cmd
;; Got answer:
;; ->>HEADER<<- opcode: QUERY, status: NOERROR, id: 2456
;; flags: qr aa rd ra; QUERY: 1, ANSWER: 1, AUTHORITY: 1, ADDITIONAL: 1

;; QUESTION SECTION:
;client.tn.example.org.         IN      A

;; ANSWER SECTION:
client.tn.example.org.  86400   IN      A       192.168.40.125

;; AUTHORITY SECTION:
example.org.            86400   IN      NS      server.tn.example.org.

;; ADDITIONAL SECTION:
server.tn.example.org.  86400   IN      A       192.168.40.120

;; Query time: 1 msec
;; SERVER: 192.168.40.120#53(192.168.40.120)
;; WHEN: Wed Jun 29 22:24:22 2016
;; MSG SIZE  rcvd: 92




Thursday, 23 June 2016

User and Group Management in CentOS 6/RHEL 6

User and Group Management

In linux operating system root is the administrator user who is having all the privileges, root user is also called superuser, root can access all files and commands on linux.
root user id is 0
If you want to check system user related information in /etc/passwd file

{In RHEL 6 by default UID assigned to users would start from 500 but in RHEL 7 change in UID allocation, any new users would get UIDs starts assigned from 1000. If you don't want  UID starts from 1000 you can change this in /etc/login.defs }

By default users home directory is created under /home

To create new user
[root@server ~]# useradd arun

Set password for newly created user
[root@server ~]# passwd --stdin arun
Changing password for user arun.
arun123
passwd: all authentication tokens updated successfully.

Check the details of new user account added in /etc/passwd

[root@server ~]# tail -n 1 /etc/passwd
arun:x:500:500::/home/arun:/bin/bash

Check the group account information in /etc/group
[root@server ~]# tail -n 1 /etc/group
arun:x:500:

To delete user account
#userdel arun

To delete user with home directory
#userdel -r arun

To create new group called mango
#groupadd mango

To create a group with particular group ID
#groupadd –g 555 mango

To modify existing user home directory
#usermod –d /home/apps arun
{above command will change the existing user arun home directory from /home/arun to /home/apps }

To change the user’s home directory with content
#usermod –m –d /home/newapps arun

To change user’s default shell using two command usermod & chsh
#usermod –s /bin/sh arun

(OR)

# chsh -s /bin/sh arun
Changing shell for arun.
Shell changed.

To view the available shell
#chsh –l

How to change default user home directory while adding a new user
[root@server ~]# cat /etc/default/useradd 
# useradd defaults file
GROUP=100
HOME=/home
INACTIVE=-1
EXPIRE=
SHELL=/bin/bash
SKEL=/etc/skel
CREATE_MAIL_SPOOL=yes












Wednesday, 13 January 2016

pdsh (Parallel Distributed Shell) installation in CentOS/RHEL 6

#yum groupinstall "Development tools" -y
#tar -xjf pdsh-2.29.tar.bz2
# ./configure
Note:- /configure --with-ssh
# make
# make install
[root@server ~]# which pdsh
/usr/local/bin/pdsh
[root@server pdsh-2.29]# vim /etc/profile.d/pdsh.sh
[root@server pdsh-2.29]# cat /etc/profile.d/pdsh.sh
# setup pdsh for cluster users
export PDSH_RCMD_TYPE='ssh'

export WCOLL='/etc/pdsh/machines'

Monday, 4 January 2016

How to configure HA-LVM in Red Hat Cluster Suite

High Availability LVM :-
How to configure HA-LVM in RedHat Cluster

Prerequisites:-
Actually we are going to configure active-standby linux cluster so minimum two nodes are required for configuring RHCS:-
Operating System :- Red Hat Enterprise Linux Server release 6.7 (Santiago)
Hostname and IP of node1:- server1.example.com; 10.0.0.101/24
Hostname and IP of node2:- server2.example.com; 10.0.0.102/24
Third node will be used for management purpose of cluster so luci is installed & shared iscsi storage server is also configured on the same node.
Hostname and IP of node3:- storage.example.com; 10.0.0.140/24

{ Note:- SELINUX is disabled }

Install Necessary Packages:-
On server1 & server2 install these packages:-
#yum groupinstall "High Availability" "Resilient Storage" -y
#yum -y install iscsi-initiator-utils
On storage node already iscsi server is configured now install luci package on this node:-
#yum install luci –y

[root@server1 ~]# iscsiadm -m discovery -t sendtargets -p storage.example.com
Starting iscsid:                                           [  OK  ]
10.0.0.140:3260,1 iqn.2015-12.com.example:share1
[root@server1 ~]# iscsiadm -m node --targetname "iqn.2015-12.com.example:share1" --portal "storage.example.com:3260" --login
Logging in to [iface: default, target: iqn.2015-12.com.example:share1, portal: 10.0.0.140,3260] (multiple)
Login to [iface: default, target: iqn.2015-12.com.example:share1, portal: 10.0.0.140,3260] successful.
[root@server1 ~]# service iscsi restart
Stopping iscsi:                                            [  OK  ]
Starting iscsi:                                            [  OK  ]
[root@server1 ~]# chkconfig iscsi on
Please confirm the iscsi disk is attached or not
[root@server1 ~]# dmesg | tail
sd 34:0:0:1: [sdb] Mode Sense: 49 00 00 08
sd 34:0:0:1: [sdb] Write cache: enabled, read cache: enabled, doesn't support DPO or FUA
 sdb: unknown partition table
sd 34:0:0:1: [sdb] Attached SCSI disk

Please do the same steps on server2 :-
[root@server2 ~]# iscsiadm -m discovery -t sendtargets -p storage.example.com
Starting iscsid:                                           [  OK  ]
10.0.0.140:3260,1 iqn.2015-12.com.example:share1

[root@server2 ~]# iscsiadm -m node --targetname "iqn.2015-12.com.example:share1" --portal "storage.example.com:3260" --login
Logging in to [iface: default, target: iqn.2015-12.com.example:share1, portal: 10.0.0.140,3260] (multiple)
Login to [iface: default, target: iqn.2015-12.com.example:share1, portal: 10.0.0.140,3260] successful.
[root@server2 ~]# service iscsi restart
Stopping iscsi:                                            [  OK  ]
Starting iscsi:                                            [  OK  ]
[root@server2 ~]# chkconfig iscsi on
[root@server2 ~]# dmesg | tail
sd 34:0:0:1: [sdb] Write Protect is off
sd 34:0:0:1: [sdb] Mode Sense: 49 00 00 08
sd 34:0:0:1: [sdb] Write cache: enabled, read cache: enabled, doesn't support DPO or FUA
 sdb: unknown partition table
sd 34:0:0:1: [sdb] Attached SCSI disk

You have to assing the password for ricci user on both the nodes:-
[root@server1 ~]# passwd --stdin ricci
Changing password for user ricci.
redhat
passwd: all authentication tokens updated successfully.
Start the ricci service:-
[root@server1 ~]# /etc/init.d/ricci start
Starting oddjobd:                                          [  OK  ]
generating SSL certificates...  done
Generating NSS database...  done
Starting ricci:                                            [  OK  ]
[root@server1 ~]# chkconfig ricci on
[root@server2 ~]# passwd --stdin ricci
Changing password for user ricci.
redhat
passwd: all authentication tokens updated successfully.
[root@server2 ~]# /etc/init.d/ricci start
Starting oddjobd:                                          [  OK  ]
generating SSL certificates...  done
Generating NSS database...  done
Starting ricci:                                            [  OK  ]
[root@server2 ~]# chkconfig ricci on
Iptables Rules needs to add on both the nodes:-
#iptables -I INPUT -m state --state NEW -m multiport -p udp -s 10.0.0.0/24 -d 10.0.0.0/24 --dports 5404,5405 -j ACCEPTiptables -I INPUT -m addrtype --dst-type MULTICAST -m state --state NEW -m multiport -p udp -s 10.0.0.0/24 --dports 5404,5405 -j ACCEPT
#iptables -I INPUT -m state --state NEW -p tcp -s 10.0.0.0/24 -d 10.0.0.0/24 --dport 21064 -j ACCEPT
#iptables -I INPUT -m state --state NEW -p tcp -s 10.0.0.0/24 -d 10.0.0.0/24 --dport 11111 -j ACCEPT
#iptables -I INPUT -m state --state NEW -p tcp -s 10.0.0.0/24 -d 10.0.0.0/24 --dport 16851 -j ACCEPT
#iptables -I INPUT -m state --state NEW -p tcp -s 10.0.0.0/24 -d 10.0.0.0/24 --dport 8084 -j ACCEPT
#iptables -I INPUT -p igmp -j ACCEPT
#service iptables save ; service iptables restart
Access Luci Console:-
Point your web browser to https://storage.example.com:8084
Please enter username and password
Username:- root
Password:- our luci machine root user password

After login Navigate the windows to "Manage Clusters" then click on Create


New pop-up will come here you need to provide Cluster Name, Node’s hostname and ricci password


Here I have given mycluster as a ClusterName,
Node Name:- server1.example.com & server2.example.com password we already created for ricci user please give that password, after that please check Enabled Shared Storage Support and Use Locally Installed Packages

If everthing goes fine it will show you below popup otherwise it will throw error



Now both the nodes has been added successfully


Please make sure these services should run on both the nodes:-
Cluster Daemons
Status
cman
Running
rgmanager
Running
Ricci
Running
Modclusterd
Running
Clvmd
Running


Now configure the HA-LVM with CLVM:-
Note:- locking_type parameter in the global section of the /etc/lvm/lvm.conf file is set to the value '3'.
[root@server1 ~]# fdisk -cu /dev/sdb
Device contains neither a valid DOS partition table, nor Sun, SGI or OSF disklabel
Building a new DOS disklabel with disk identifier 0xb10ea483.
Changes will remain in memory only, until you decide to write them.
After that, of course, the previous content won't be recoverable.

Warning: invalid flag 0x0000 of partition table 4 will be corrected by w(rite)

Command (m for help): p

Disk /dev/sdb: 8589 MB, 8589934592 bytes
64 heads, 32 sectors/track, 8192 cylinders, total 16777216 sectors
Units = sectors of 1 * 512 = 512 bytes
Sector size (logical/physical): 512 bytes / 512 bytes
I/O size (minimum/optimal): 512 bytes / 512 bytes
Disk identifier: 0xb10ea483

   Device Boot      Start         End      Blocks   Id  System

Command (m for help): n
Command action
   e   extended
   p   primary partition (1-4)
p
Partition number (1-4): 1
First sector (2048-16777215, default 2048):
Using default value 2048
Last sector, +sectors or +size{K,M,G} (2048-16777215, default 16777215):
Using default value 16777215

Command (m for help): t
Selected partition 1
Hex code (type L to list codes): 8e
Changed system type of partition 1 to 8e (Linux LVM)

Command (m for help): p

Disk /dev/sdb: 8589 MB, 8589934592 bytes
64 heads, 32 sectors/track, 8192 cylinders, total 16777216 sectors
Units = sectors of 1 * 512 = 512 bytes
Sector size (logical/physical): 512 bytes / 512 bytes
I/O size (minimum/optimal): 512 bytes / 512 bytes
Disk identifier: 0xb10ea483

   Device Boot      Start         End      Blocks   Id  System
/dev/sdb1            2048    16777215     8387584   8e  Linux LVM

Command (m for help): w
The partition table has been altered!

Calling ioctl() to re-read partition table.
Syncing disks.
[root@server1 ~]# pvcreate /dev/sdb1
  Physical volume "/dev/sdb1" successfully created
[root@server1 ~]# vgcreate -cy cluster_vg /dev/sdb1
  Clustered volume group "cluster_vg" successfully created

During the lvcreation you may get below error:-

[root@server1 ~]# lvcreate -L 7G -n cluster_lv cluster_vg
  Error locking on node server2.example.com: Volume group for uuid not found: LWfm85PirK3ujvcShsSfOgP3PhFH4AU6KF8m0BcSfwU4dWD9DS19CMDh0aBJaagD
  Failed to activate new LV
Solution:-
1) Make sure clvmd service is running  on all the cluster nodes, if not start clvmd service using below command
# service clvmd start
2) Make sure the partition /dev/sdb1 is detected by the kernel and mapped on all the node
# partprobe ---> run this command on both the nodes server1 & server2


[root@server1 ~]# lvcreate -L 7G -n cluster_lv cluster_vg
  Logical volume "cluster_lv" created.
[root@server1 ~]# mkfs.ext4 /dev/mapper/cluster_vg-cluster_lv
mke2fs 1.41.12 (17-May-2010)
Filesystem label=
OS type: Linux
Block size=4096 (log=2)
Fragment size=4096 (log=2)
Stride=0 blocks, Stripe width=0 blocks
458752 inodes, 1835008 blocks
91750 blocks (5.00%) reserved for the super user
First data block=0
Maximum filesystem blocks=1879048192
56 block groups
32768 blocks per group, 32768 fragments per group
8192 inodes per group
Superblock backups stored on blocks:
        32768, 98304, 163840, 229376, 294912, 819200, 884736, 1605632

Writing inode tables: done
Creating journal (32768 blocks): done
Writing superblocks and filesystem accounting information: done

This filesystem will be automatically checked every 39 mounts or
180 days, whichever comes first.  Use tune2fs -c or -i to override.

Add fencing to Cluster Select Fence Devices,
{Note: Fencing is the disconnection of a node from shared storage}
There are different types of fencing devices available. Here I am using VMWARE virtual machine to build a cluster, So I am selecting the option called VMware Fencing {SOAP Interface}







After selecting Vmware Fencing(SOAP Interface)
Give desired name whatever you want, I have given myfence as a Name, Address give your base machine IP Address {not virtual machine ok}
Login :- login user of your base machine
Password:- password of that user

 fence device created successfully


Step 1 – To get the UUID of your two nodes please run the below command in terminal

[root@server1 ~]# fence_vmware_soap --ip 192.168.58.1 --username "arun m" --password  impel123 -z --action list | grep server1
server1,564d246b-949e-03fe-e3fc-14fc35ce9cb6

[root@server1 ~]# fence_vmware_soap --ip 192.168.58.1 --username "arun m" --password  impel123 -z --action list | grep server2
server2,564d8d2a-2054-1e05-22ce-b733e3f491d5

Step2:- Go back to the luci Manage Clusters and click on select the firtnode server1.example.com


Then select Add Fence Method

Give any name here I have give vmware_fence as a name, then click “Submit” your changes

Now select “Add Fence Instance


In this section we are going to add your fencing device instance, select the option called myfence(VMware Fencing SOAP Interface)
[NOTE:- we have already configured this vmware fencing soap interface in Fence Devices tab ]
Next Give Vm name or any name {name does not matter}
Next Give the UUID of server1
Next check the Use SSL option, then click submit



Please do the same step for server2 also:-
Failover Domain Configuration:-


There are different types of failover domains are there
Nodes in the ordered domain are assigned a priority level from 1-100. Priority 1 being highest and 100 being the lowest. A node with the highest priority will run the resource group. The resource if it was running on node 2, will migrate to node 1 when it becomes online.






























After creating the whole cluster setup, my cluster.conf file will look like the following
[root@server1 ~]# cat /etc/cluster/cluster.conf
<?xml version="1.0"?>
<cluster config_version="8" name="mycluster">
        <clusternodes>
                <clusternode name="server1.example.com" nodeid="1"/>
                <clusternode name="server2.example.com" nodeid="2"/>
        </clusternodes>
        <cman expected_votes="1" two_node="1"/>
        <rm>
                <failoverdomains>
                        <failoverdomain name="failoverdomain" nofailback="1" ordered="1">
                                <failoverdomainnode name="server1.example.com" priority="1"/>
                                <failoverdomainnode name="server2.example.com" priority="2"/>
                        </failoverdomain>
                </failoverdomains>
                <resources>
                        <fs device="/dev/cluster_vg/cluster_lv" force_unmount="1" fsid="19408" fstype="ext4" mountpoint="/cluster" name="myFS"/>
                        <lvm lv_name="cluster_lv" name="lvm" self_fence="1" vg_name="cluster_vg"/>
                </resources>
                <service domain="failoverdomain" name="myservice" recovery="relocate">
                        <lvm ref="lvm"/>
                        <fs ref="myFS"/>
                </service>
        </rm>
        <fencedevices>
                <fencedevice agent="fence_vmware_soap" ipaddr="192.168.58.1" login="arun m" name="myfence" passwd="impel123"/>
        </fencedevices>
</cluster>

[root@server1 ~]# df -h
Filesystem            Size  Used Avail Use% Mounted on
/dev/mapper/vg_server1-lv_root
                       18G  5.6G   11G  35% /
tmpfs                 1.9G   26M  1.9G   2% /dev/shm
/dev/sda1             477M   42M  411M  10% /boot
/dev/mapper/cluster_vg-cluster_lv
                      6.8G   16M  6.4G   1% /cluster
To test the cluster I am powering off the server1:-
[root@server1 ~]# poweroff
[root@server1 ~]#
Broadcast message from root@server1.example.com
        (/dev/pts/0) at 20:39 ...

The system is going down for power off NOW!
Verify server2 using df command LVM is mounted on /cluster directory
[root@server2 ~]# df -h
Filesystem            Size  Used Avail Use% Mounted on
/dev/mapper/vg_server2-lv_root
                       18G  5.6G   11G  35% /
tmpfs                 1.9G   26M  1.9G   2% /dev/shm
/dev/sda1             477M   42M  411M  10% /boot
[root@server2 ~]# df -h
Filesystem            Size  Used Avail Use% Mounted on
/dev/mapper/vg_server2-lv_root
                       18G  5.6G   11G  35% /
tmpfs                 1.9G   26M  1.9G   2% /dev/shm
/dev/sda1             477M   42M  411M  10% /boot
/dev/mapper/cluster_vg-cluster_lv
                      6.8G   16M  6.4G   1% /cluster