Салют трудягам!
Сервер стоит в стойке, старенький — ему ~6–7 лет.
[root@ftp /home/dmitry]# pciconf -l -cv
hostb0@pci0:0:0:0: class=0x060000 card=0x342f8086 chip=0x25788086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '82875P/E7210 DRAM Controller / Host-Hub Interface'
class = bridge
subclass = HOST-PCI
cap 09[e4] = vendor (length 6) Intel cap 3 version 1
pcib1@pci0:0:3:0: class=0x060400 card=0x00000000 chip=0x257b8086 rev=0x02 hdr=0x01
vendor = 'Intel Corporation'
device = '82875P/E7210 PCI to CSA Bridge'
class = bridge
subclass = PCI-PCI
pcib2@pci0:0:28:0: class=0x060400 card=0x00000000 chip=0x25ae8086 rev=0x02 hdr=0x01
vendor = 'Intel Corporation'
device = '6300ESB Hub Interface to PCI-X Bridge'
class = bridge
subclass = PCI-PCI
cap 07[50] = PCI-X 64-bit bridge supports
uhci0@pci0:0:29:0: class=0x0c0300 card=0x342f8086 chip=0x25a98086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB USB 1.1 UHCI Controller'
class = serial bus
subclass = USB
uhci1@pci0:0:29:1: class=0x0c0300 card=0x342f8086 chip=0x25aa8086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB USB 1.1 UHCI Controller'
class = serial bus
subclass = USB
none0@pci0:0:29:4: class=0x088000 card=0x342f8086 chip=0x25ab8086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB Watchdog Timer'
class = base peripheral
ioapic0@pci0:0:29:5: class=0x080020 card=0x342f8086 chip=0x25ac8086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB I/O Advanced Programmable Interrupt Controller'
class = base peripheral
subclass = interrupt controller
cap 07[50] = PCI-X 64-bit supports 512 burst read, 1 split transaction
ehci0@pci0:0:29:7: class=0x0c0320 card=0x342f8086 chip=0x25ad8086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB USB 2.0 EHCI Controller'
class = serial bus
subclass = USB
cap 01[50] = powerspec 2 supports D0 D3 current D0
cap 0a[58] = EHCI Debug Port at offset 0x80 in map 0x14
pcib3@pci0:0:30:0: class=0x060400 card=0x00000000 chip=0x244e8086 rev=0x0a hdr=0x01
vendor = 'Intel Corporation'
device = '82801 Family (ICH2/3/4/4/5/5/6/7/8/9,63xxESB) Hub Interface to PCI Bridge'
class = bridge
subclass = PCI-PCI
isab0@pci0:0:31:0: class=0x060100 card=0x00000000 chip=0x25a18086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB LPC Inteface Controller'
class = bridge
subclass = PCI-ISA
atapci0@pci0:0:31:1: class=0x01018a card=0x342f8086 chip=0x25a28086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB IDE Controller'
class = mass storage
subclass = ATA
atapci1@pci0:0:31:2: class=0x01018f card=0x342f8086 chip=0x25a38086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB Serial ATA Controller'
class = mass storage
subclass = ATA
none1@pci0:0:31:3: class=0x0c0500 card=0x342f8086 chip=0x25a48086 rev=0x02 hdr=0x00
vendor = 'Intel Corporation'
device = '6300ESB SMBus Controller'
class = serial bus
subclass = SMBus
em0@pci0:1:1:0: class=0x020000 card=0x342f8086 chip=0x10758086 rev=0x00 hdr=0x00
vendor = 'Intel Corporation'
device = '82547EI Gigabit Ethernet Controller'
class = network
subclass = ethernet
cap 01[dc] = powerspec 2 supports D0 D3 current D0
vgapci0@pci0:3:0:0: class=0x030000 card=0x342f8086 chip=0x47521002 rev=0x27 hdr=0x00
vendor = 'ATI Technologies Inc'
device = 'Rage XL PCI'
class = display
subclass = VGA
cap 01[5c] = powerspec 2 supports D0 D1 D2 D3 current D0
fxp0@pci0:3:1:0: class=0x020000 card=0x342f8086 chip=0x12298086 rev=0x10 hdr=0x00
vendor = 'Intel Corporation'
device = '82550/1/7/8/9 EtherExpress PRO/100(B) Ethernet Adapter'
class = network
subclass = ethernet
cap 01[dc] = powerspec 2 supports D0 D1 D2 D3 current D0
[root@ftp /home/dmitry]# dmesg |grep ad4
ad4: 953869MB <Seagate ST31000524NS SN11> at ata2-master SATA150
Trying to mount root from ufs:/dev/ad4s1a
ad4: TIMEOUT - READ_DMA retrying (1 retry left) LBA=9916535
ad4: TIMEOUT - READ_DMA retrying (1 retry left) LBA=8533759
ad4: TIMEOUT - READ_DMA48 retrying (1 retry left) LBA=295845648
ad4: TIMEOUT - READ_DMA48 retrying (0 retries left) LBA=295845648
ad4: FAILURE - READ_DMA48 timed out LBA=295845648
g_vfs_done():ad4s1f[READ(offset=136426192896, length=16384)]error = 5
ad4: TIMEOUT - READ_DMA48 retrying (1 retry left) LBA=322190288
ad4: TIMEOUT - READ_DMA48 retrying (0 retries left) LBA=322190288
ad4: FAILURE - READ_DMA48 timed out LBA=322190288
g_vfs_done():ad4s1f[READ(offset=149914648576, length=16384)]error = 5
ad4: TIMEOUT - READ_DMA48 retrying (1 retry left) LBA=344771408
ad4: TIMEOUT - READ_DMA48 retrying (0 retries left) LBA=344771408
ad4: FAILURE - READ_DMA48 timed out LBA=344771408
g_vfs_done():ad4s1f[READ(offset=161476182016, length=16384)]error = 5
ad4: TIMEOUT - READ_DMA48 retrying (1 retry left) LBA=1457267760
ad4: TIMEOUT - READ_DMA48 retrying (0 retries left) LBA=1457267760
ad4: FAILURE - READ_DMA48 timed out LBA=1457267760
g_vfs_done():ad4s1f[READ(offset=731074314240, length=16384)]error = 5
ad4: TIMEOUT - READ_DMA retrying (1 retry left) LBA=19830450
[root@ftp /home/dmitry]#
Стали сыпаться диски — за 2 недели это уже второй:
=== START OF READ SMART DATA SECTION ===
SMART Attributes Data Structure revision number: 10
Vendor Specific SMART Attributes with Thresholds:
ID# ATTRIBUTE_NAME FLAG VALUE WORST THRESH TYPE UPDATED WHEN_FAILED RAW_VALUE
1 Raw_Read_Error_Rate 0x000f 081 065 044 Pre-fail Always - 139991064
3 Spin_Up_Time 0x0003 100 100 000 Pre-fail Always - 0
4 Start_Stop_Count 0x0032 100 100 020 Old_age Always - 7
5 Reallocated_Sector_Ct 0x0033 009 009 036 Pre-fail Always FAILING_NOW 3729
7 Seek_Error_Rate 0x000f 064 060 030 Pre-fail Always - 2969006
9 Power_On_Hours 0x0032 100 100 000 Old_age Always - 268
10 Spin_Retry_Count 0x0013 100 100 097 Pre-fail Always - 0
12 Power_Cycle_Count 0x0032 100 100 020 Old_age Always - 7
184 Unknown_Attribute 0x0032 100 100 099 Old_age Always - 0
187 Reported_Uncorrect 0x0032 100 100 000 Old_age Always - 0
188 Unknown_Attribute 0x0032 099 081 000 Old_age Always - 38657196070
189 High_Fly_Writes 0x003a 100 100 000 Old_age Always - 0
190 Airflow_Temperature_Cel 0x0022 073 068 045 Old_age Always - 27 (Lifetime Min/Max 21/32)
191 G-Sense_Error_Rate 0x0032 100 100 000 Old_age Always - 0
192 Power-Off_Retract_Count 0x0032 100 100 000 Old_age Always - 6
193 Load_Cycle_Count 0x0032 100 100 000 Old_age Always - 7
194 Temperature_Celsius 0x0022 027 040 000 Old_age Always - 27 (0 20 0 0)
195 Hardware_ECC_Recovered 0x001a 030 029 000 Old_age Always - 139991064
197 Current_Pending_Sector 0x0012 100 100 000 Old_age Always - 0
198 Offline_Uncorrectable 0x0010 100 100 000 Old_age Offline - 0
199 UDMA_CRC_Error_Count 0x003e 200 200 000 Old_age Always - 0
Кабели менял. Подозреваю блок питания или контроллер — больше грешить не на что :/