All,
I'm resending to a somewhat larger audience in the hope of getting some
response.
I got the above for the first time yesterday when I rebooted my Lenovo T60p
running OpenSolaris with b93; e1000g was "gone", i.e., it wasn't plumbed
anymore. I've seen it go down more often recently during data transfers,
but haven't had time to pursue it so far.
I found Jeff Cheeney's blog entry
(http://blogs.sun.com/icedawn/entry/laptop_and_retired_i_o) and started
fmdump'ing - here's one example; I've attached the output of a few commands
for those interested in more details:
$ fmdump -v -u d0e07886-f997-edf3-91ff-b2e3c7017368
TIME UUID SUNW-MSG-ID
Aug 10 02:38:25.0576 d0e07886-f997-edf3-91ff-b2e3c7017368 PCIEX-8000-0A
100% fault.io.pciex.device-interr
Problem in:
hc://:product-id=8744C9U:chassis-id=L3CA377:server-id=paddy/motherboard=0/hostbridge=1/pciexrc=1/pciexbus=2/pciexdev=0/pciexfn=0
Affects: dev:////[EMAIL PROTECTED],0/pci8086,[EMAIL
PROTECTED]/pci17aa,[EMAIL PROTECTED]
FRU:
hc://:product-id=8744C9U:chassis-id=L3CA377:server-id=paddy/motherboard=0/hostbridge=1/pciexrc=1/pciexbus=2/pciexdev=0
Location: pcie2
I could probably try to follow Jeff's example and just "fmadm repair", but
I feel that would only delay the issue ...
so:
- from the attached data, is it possible to find out what the root cause
is? (if yes: what is it? ;-)
- if not, what do I need to do to help identify it?
TIA
Michael
--
Michael Schuster http://blogs.sun.com/recursion
Recursion, n.: see 'Recursion'
Script started on Mon Aug 11 20:42:30 2008
$ fmdump
TIME UUID SUNW-MSG-ID
Aug 10 02:38:25.0576 d0e07886-f997-edf3-91ff-b2e3c7017368 PCIEX-8000-0A
$ fmdump -e
TIME CLASS
Aug 10 02:37:54.4000 ereport.io.device.stall
Aug 10 02:37:54.8360 ereport.io.device.inval_state
Aug 10 02:37:54.8360 ereport.io.service.lost
Aug 10 02:37:54.8361 ereport.io.service.lost
$ fmdump -vV
TIME UUID SUNW-MSG-ID
Aug 10 02:38:25.0576 d0e07886-f997-edf3-91ff-b2e3c7017368 PCIEX-8000-0A
TIME CLASS ENA
Aug 10 02:37:54.8361 ereport.io.service.lost 0x4cb4dccf61600401
Aug 10 02:37:54.8360 ereport.io.service.lost 0x4cb4dcb61d800401
Aug 10 02:37:54.8360 ereport.io.device.inval_state 0x4cb4dcb16a100401
Aug 10 02:37:54.4000 ereport.io.device.stall 0x4cb33cda59700401
nvlist version: 0
version = 0x0
class = list.suspect
uuid = d0e07886-f997-edf3-91ff-b2e3c7017368
code = PCIEX-8000-0A
diag-time = 1218361104 775848
de = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = fmd
authority = (embedded nvlist)
nvlist version: 0
version = 0x0
product-id = 8744C9U
chassis-id = L3CA377
server-id = paddy
(end authority)
mod-name = eft
mod-version = 1.16
(end de)
fault-list-sz = 0x1
fault-list = (array of embedded nvlists)
(start fault-list[0])
nvlist version: 0
version = 0x0
class = fault.io.pciex.device-interr
certainty = 0x64
asru = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = dev
device-path = /[EMAIL PROTECTED],0/pci8086,[EMAIL
PROTECTED]/pci17aa,[EMAIL PROTECTED]
(end asru)
fru = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = hc
hc-root =
authority = (embedded nvlist)
nvlist version: 0
product-id = 8744C9U
chassis-id = L3CA377
server-id = paddy
(end authority)
hc-list-sz = 0x5
hc-list = (array of embedded nvlists)
(start hc-list[0])
nvlist version: 0
hc-name = motherboard
hc-id = 0
(end hc-list[0])
(start hc-list[1])
nvlist version: 0
hc-name = hostbridge
hc-id = 1
(end hc-list[1])
(start hc-list[2])
nvlist version: 0
hc-name = pciexrc
hc-id = 1
(end hc-list[2])
(start hc-list[3])
nvlist version: 0
hc-name = pciexbus
hc-id = 2
(end hc-list[3])
(start hc-list[4])
nvlist version: 0
hc-name = pciexdev
hc-id = 0
(end hc-list[4])
(end fru)
resource = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = hc
hc-root =
authority = (embedded nvlist)
nvlist version: 0
product-id = 8744C9U
chassis-id = L3CA377
server-id = paddy
(end authority)
hc-list-sz = 0x6
hc-list = (array of embedded nvlists)
(start hc-list[0])
nvlist version: 0
hc-name = motherboard
hc-id = 0
(end hc-list[0])
(start hc-list[1])
nvlist version: 0
hc-name = hostbridge
hc-id = 1
(end hc-list[1])
(start hc-list[2])
nvlist version: 0
hc-name = pciexrc
hc-id = 1
(end hc-list[2])
(start hc-list[3])
nvlist version: 0
hc-name = pciexbus
hc-id = 2
(end hc-list[3])
(start hc-list[4])
nvlist version: 0
hc-name = pciexdev
hc-id = 0
(end hc-list[4])
(start hc-list[5])
nvlist version: 0
hc-name = pciexfn
hc-id = 0
(end hc-list[5])
(end resource)
location = pcie2
(end fault-list[0])
fault-status = 0x3
__ttl = 0x1
__tod = 0x489eb711 0x36f6118
$ fmdump -evV
TIME CLASS
Aug 10 2008 02:37:54.400020757 ereport.io.device.stall
nvlist version: 0
class = ereport.io.device.stall
ena = 0x4cb33cda59700401
detector = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = dev
device-path = /[EMAIL PROTECTED],0/pci8086,[EMAIL
PROTECTED]/pci17aa,[EMAIL PROTECTED]
(end detector)
__ttl = 0x1
__tod = 0x489eb6f2 0x17d7d515
Aug 10 2008 02:37:54.836060516 ereport.io.device.inval_state
nvlist version: 0
class = ereport.io.device.inval_state
ena = 0x4cb4dcb16a100401
detector = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = dev
device-path = /[EMAIL PROTECTED],0/pci8086,[EMAIL
PROTECTED]/pci17aa,[EMAIL PROTECTED]
(end detector)
__ttl = 0x1
__tod = 0x489eb6f2 0x31d54564
Aug 10 2008 02:37:54.836080403 ereport.io.service.lost
nvlist version: 0
class = ereport.io.service.lost
ena = 0x4cb4dcb61d800401
detector = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = dev
device-path = /[EMAIL PROTECTED],0/pci8086,[EMAIL
PROTECTED]/pci17aa,[EMAIL PROTECTED]
(end detector)
__ttl = 0x1
__tod = 0x489eb6f2 0x31d59313
Aug 10 2008 02:37:54.836183187 ereport.io.service.lost
nvlist version: 0
class = ereport.io.service.lost
ena = 0x4cb4dccf61600401
detector = (embedded nvlist)
nvlist version: 0
version = 0x0
scheme = dev
device-path = /[EMAIL PROTECTED],0/pci8086,[EMAIL
PROTECTED]/pci17aa,[EMAIL PROTECTED]
(end detector)
__ttl = 0x1
__tod = 0x489eb6f2 0x31d72493
$ ls -las /devices/[EMAIL PROTECTED],0/pci8086,[EMAIL PROTECTED]/
/devices/[EMAIL PROTECTED],0/pci8086,[EMAIL PROTECTED]/pci17aa,[EMAIL
PROTECTED]:e1000g0: No such device or address
total 9
3 drwxr-xr-x 3 root sys 3 Aug 10 02:38 .
3 drwxr-xr-x 11 root sys 12 Jun 26 06:05 ..
3 drwxr-xr-x 2 root sys 2 Aug 10 02:38 pci17aa,[EMAIL
PROTECTED]
script done on Mon Aug 11 20:44:03 2008
$ fmdump -v -u d0e07886-f997-edf3-91ff-b2e3c7017368
TIME UUID SUNW-MSG-ID
Aug 10 02:38:25.0576 d0e07886-f997-edf3-91ff-b2e3c7017368 PCIEX-8000-0A
100% fault.io.pciex.device-interr
Problem in:
hc://:product-id=8744C9U:chassis-id=L3CA377:server-id=paddy/motherboard=0/hostbridge=1/pciexrc=1/pciexbus=2/pciexdev=0/pciexfn=0
Affects: dev:////[EMAIL PROTECTED],0/pci8086,[EMAIL
PROTECTED]/pci17aa,[EMAIL PROTECTED]
FRU:
hc://:product-id=8744C9U:chassis-id=L3CA377:server-id=paddy/motherboard=0/hostbridge=1/pciexrc=1/pciexbus=2/pciexdev=0
Location: pcie2
_______________________________________________
networking-discuss mailing list
[email protected]