Node Type: WNsIntelS2600TP

Firewall requirements

local port open to reason


Regular Maintenance work

Emergency Measures

Installation

10Gbs net

The following 10 Gb/s cables are for the single-connected servers (t3wn5[1-9]):
13-18902, 13-18904, 13-18918 to 13-18924
VLAN 410

mdadm 1+0 on 4 disks

grub.conf as made by kickstart

# cat /boot/grub/grub.conf
default=0
timeout=5
serial --unit=0 --speed=115200
terminal --timeout=5 serial console
title Scientific Linux 6 (2.6.32-573.22.1.el6.x86_64)
	root (hd0,1)
	kernel /vmlinuz-2.6.32-573.22.1.el6.x86_64 ro root=UUID=878ca5a0-6e97-47b2-a6bb-e6cf6efdc293 rd_NO_LUKS rd_MD_UUID=4e09e669:a6f071fe:e33d3d95:7218d202 text elevator=noop LANG=en_US.UTF-8 rd_NO_LVM console=ttyS0,115200 crashkernel=auto rd_MD_UUID=290f8013:5a9c5296:0d75d175:05f47e24  KEYBOARDTYPE=pc KEYTABLE=us SYSFONT=latarcyrheb-sun16 rd_NO_DM
	initrd /initramfs-2.6.32-573.22.1.el6.x86_64.img

# file -s /dev/sda /dev/sdb /dev/sdc /dev/sdd
/dev/sda: x86 boot sector; GRand Unified Bootloader, stage1 version 0x3, boot drive 0x80, 1st sector stage2 0x13db808, GRUB version 0.94; partition 1: ID=0xfd, starthead 32, startsector 2048, 20480000 sectors; partition 2: ID=0xfd, active, starthead 254, startsector 20482048, 6144000 sectors; partition 3: ID=0xfd, starthead 254, startsector 26626048, 102400000 sectors; partition 4: ID=0x5, starthead 254, startsector 129026048, 1629148720 sectors, code offset 0x48
/dev/sdb: x86 boot sector; GRand Unified Bootloader, stage1 version 0x3, boot drive 0x80, 1st sector stage2 0x13db808, GRUB version 0.94; partition 1: ID=0xfd, starthead 32, startsector 2048, 20480000 sectors; partition 2: ID=0xfd, active, starthead 254, startsector 20482048, 6144000 sectors; partition 3: ID=0xfd, starthead 254, startsector 26626048, 102400000 sectors; partition 4: ID=0x5, starthead 254, startsector 129026048, 1629148720 sectors, code offset 0x48
/dev/sdc: x86 boot sector; partition 1: ID=0xfd, starthead 32, startsector 2048, 20480000 sectors; partition 2: ID=0xfd, active, starthead 254, startsector 20482048, 6144000 sectors; partition 3: ID=0xfd, starthead 254, startsector 26626048, 102400000 sectors; partition 4: ID=0x5, starthead 254, startsector 129026048, 1629148720 sectors, code offset 0xb8
/dev/sdd: x86 boot sector; partition 1: ID=0xfd, starthead 32, startsector 2048, 20480000 sectors; partition 2: ID=0xfd, active, starthead 254, startsector 20482048, 6144000 sectors; partition 3: ID=0xfd, starthead 254, startsector 26626048, 102400000 sectors; partition 4: ID=0x5, starthead 254, startsector 129026048, 1629148720 sectors, code offset 0xb8

grub.conf fallback boot

# cat /boot/grub/grub.conf
default=0
fallback=1
timeout=5
serial --unit=0 --speed=115200
terminal --timeout=5 serial console
title Scientific Linux 6 (2.6.32-573.22.1.el6.x86_64) - 1st disk
	root (hd0,1)
	kernel /vmlinuz-2.6.32-573.22.1.el6.x86_64 ro root=UUID=878ca5a0-6e97-47b2-a6bb-e6cf6efdc293 rd_NO_LUKS rd_MD_UUID=4e09e669:a6f071fe:e33d3d95:7218d202 text elevator=noop LANG=en_US.UTF-8 rd_NO_LVM console=ttyS0,115200 crashkernel=auto rd_MD_UUID=290f8013:5a9c5296:0d75d175:05f47e24  KEYBOARDTYPE=pc KEYTABLE=us SYSFONT=latarcyrheb-sun16 rd_NO_DM
	initrd /initramfs-2.6.32-573.22.1.el6.x86_64.img
title Scientific Linux 6 (2.6.32-573.22.1.el6.x86_64) - 2nd disk
	root (hd1,1)
	kernel /vmlinuz-2.6.32-573.22.1.el6.x86_64 ro root=UUID=878ca5a0-6e97-47b2-a6bb-e6cf6efdc293 rd_NO_LUKS rd_MD_UUID=4e09e669:a6f071fe:e33d3d95:7218d202 text elevator=noop LANG=en_US.UTF-8 rd_NO_LVM console=ttyS0,115200 crashkernel=auto rd_MD_UUID=290f8013:5a9c5296:0d75d175:05f47e24  KEYBOARDTYPE=pc KEYTABLE=us SYSFONT=latarcyrheb-sun16 rd_NO_DM
	initrd /initramfs-2.6.32-573.22.1.el6.x86_64.img

Intentionally failing a disk

# cat /proc/mdstat  | grep md | egrep --color 'md[0-9]+|sdc[0-9]+' -o | paste - - | sort  -n | awk '{ print "mdadm /dev/"$1" --fail /dev/"$2" --remove /dev/"$2 }'
mdadm /dev/md0 --fail /dev/sdc2 --remove /dev/sdc2
mdadm /dev/md10 --fail /dev/sdc3 --remove /dev/sdc3
mdadm /dev/md11 --fail /dev/sdc5 --remove /dev/sdc5
mdadm /dev/md1 --fail /dev/sdc1 --remove /dev/sdc1
mdadm /dev/md2 --fail /dev/sdc10 --remove /dev/sdc10
mdadm /dev/md3 --fail /dev/sdc11 --remove /dev/sdc11
mdadm /dev/md4 --fail /dev/sdc6 --remove /dev/sdc6
mdadm /dev/md5 --fail /dev/sdc8 --remove /dev/sdc8
mdadm /dev/md6 --fail /dev/sdc13 --remove /dev/sdc13
mdadm /dev/md7 --fail /dev/sdc9 --remove /dev/sdc9
mdadm /dev/md8 --fail /dev/sdc7 --remove /dev/sdc7
mdadm /dev/md9 --fail /dev/sdc12 --remove /dev/sdc12

# cat /proc/mdstat  | grep md | egrep --color 'md[0-9]+|sdc[0-9]+' -o | paste - - | sort  -n | awk '{ print "mdadm /dev/"$1" --fail /dev/"$2" --remove /dev/"$2 }' | bash -x
+ mdadm /dev/md0 --fail /dev/sdc2 --remove /dev/sdc2
mdadm: set /dev/sdc2 faulty in /dev/md0
mdadm: hot removed /dev/sdc2 from /dev/md0
+ mdadm /dev/md10 --fail /dev/sdc3 --remove /dev/sdc3
mdadm: set /dev/sdc3 faulty in /dev/md10
mdadm: hot removed /dev/sdc3 from /dev/md10
+ mdadm /dev/md11 --fail /dev/sdc5 --remove /dev/sdc5
mdadm: set /dev/sdc5 faulty in /dev/md11
mdadm: hot removed /dev/sdc5 from /dev/md11
+ mdadm /dev/md1 --fail /dev/sdc1 --remove /dev/sdc1
mdadm: set /dev/sdc1 faulty in /dev/md1
mdadm: hot removed /dev/sdc1 from /dev/md1
+ mdadm /dev/md2 --fail /dev/sdc10 --remove /dev/sdc10
mdadm: set /dev/sdc10 faulty in /dev/md2
mdadm: hot removed /dev/sdc10 from /dev/md2
+ mdadm /dev/md3 --fail /dev/sdc11 --remove /dev/sdc11
mdadm: set /dev/sdc11 faulty in /dev/md3
mdadm: hot removed /dev/sdc11 from /dev/md3
+ mdadm /dev/md4 --fail /dev/sdc6 --remove /dev/sdc6
mdadm: set /dev/sdc6 faulty in /dev/md4
mdadm: hot removed /dev/sdc6 from /dev/md4
+ mdadm /dev/md5 --fail /dev/sdc8 --remove /dev/sdc8
mdadm: set /dev/sdc8 faulty in /dev/md5
mdadm: hot removed /dev/sdc8 from /dev/md5
+ mdadm /dev/md6 --fail /dev/sdc13 --remove /dev/sdc13
mdadm: set /dev/sdc13 faulty in /dev/md6
mdadm: hot removed /dev/sdc13 from /dev/md6
+ mdadm /dev/md7 --fail /dev/sdc9 --remove /dev/sdc9
mdadm: set /dev/sdc9 faulty in /dev/md7
mdadm: hot removed /dev/sdc9 from /dev/md7
+ mdadm /dev/md8 --fail /dev/sdc7 --remove /dev/sdc7
mdadm: set /dev/sdc7 faulty in /dev/md8
mdadm: hot removed /dev/sdc7 from /dev/md8
+ mdadm /dev/md9 --fail /dev/sdc12 --remove /dev/sdc12
mdadm: set /dev/sdc12 faulty in /dev/md9
mdadm: hot removed /dev/sdc12 from /dev/md9

Replacing a broken disk

Making the same partitions - 1st way

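Easy! Clone the whole disk with ddrescue (source disk first, destination disk second):
ddrescue -d -f -v /dev/sdn  /dev/sdm rescue.log
Because the entire disk is copied, boot sector included, GRUB is installed in the same step.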

Making the same partitions - 2nd way

In this example we are going to replace sdd; change the following pipeline accordingly. If the disk you lost had GRUB installed, also install the GRUB boot loader on the replacement so that you again have 2 bootable disks:
# sfdisk -d /dev/sdc | sfdisk --force /dev/sdd

Making the partitions appear

partprobe /dev/sd_REPLACED_DISK 

Resyncing mdadm

Adapt this pipeline to your own case:
 
# awk '{ print $1,$5}' /proc/mdstat | grep md  |sort -V | cut -d[ -f1  |awk '{ print  " mdadm --add /dev/"$1" /dev/"$2 }'  | sed 's#sd[abc]#sdd#'  | bash -x 
+ mdadm --add /dev/md0 /dev/sdd2
mdadm: added /dev/sdd2
+ mdadm --add /dev/md1 /dev/sdd1
mdadm: added /dev/sdd1
+ mdadm --add /dev/md2 /dev/sdd10
mdadm: added /dev/sdd10
+ mdadm --add /dev/md3 /dev/sdd11
mdadm: added /dev/sdd11
+ mdadm --add /dev/md4 /dev/sdd6
mdadm: added /dev/sdd6
+ mdadm --add /dev/md5 /dev/sdd8
mdadm: added /dev/sdd8
+ mdadm --add /dev/md6 /dev/sdd13
mdadm: added /dev/sdd13
+ mdadm --add /dev/md7 /dev/sdd9
mdadm: added /dev/sdd9
+ mdadm --add /dev/md8 /dev/sdd7
mdadm: added /dev/sdd7
+ mdadm --add /dev/md9 /dev/sdd12
mdadm: added /dev/sdd12
+ mdadm --add /dev/md10 /dev/sdd3
mdadm: added /dev/sdd3
+ mdadm --add /dev/md11 /dev/sdd5
mdadm: added /dev/sdd5

Services

Backups

No backups

RailKit HowTo

t3wn51-59 rail kit howto doc
NodeTypeForm
Hostnames t3wn[51-59]
Services Sun Grid Engine 6.2u5 execution hosts
Hardware Dalco r2264i5t - Intel S2600TP
Install Profile wn
Guarantee/maintenance until 01-04-2019
Topic attachments
I Attachment History Action Size Date Who Comment
PDFpdf t3wn51-9-rail-kit-doc.pdf r1 manage 2339.7 K 2016-04-11 - 09:23 FabioMartinelli t3wn5[1-9] rail kit howto doc
Edit | Attach | Watch | Print version | History: r19 | r17 < r16 < r15 < r14 | Backlinks | Raw View | Raw edit | More topic actions...
Topic revision: r15 - 2016-11-07 - FabioMartinelli
 
  • Edit
  • Attach
This site is powered by the TWiki collaboration platform Powered by Perl This site is powered by the TWiki collaboration platformCopyright © 2008-2024 by the contributing authors. All material on this collaboration platform is the property of the contributing authors.
Ideas, requests, problems regarding TWiki? Send feedback