[OmniOS-discuss] fmdump help?

Johan Kragsterman johan.kragsterman at capvert.se
Mon May 12 11:13:41 UTC 2014


Hi!

I have some fmdump issues here that I would appreciate some help diagnosing.


The system is, as you can see, a Dell T5500 workstation equipped with dual Xeon L5520 CPUs with HT enabled and 36 GB of RAM. The integrated bge NIC on the motherboard is disabled, and I use a quad-port GbE Intel NIC in the PCI-X slot.

The rpool is on an Intel SLC SSD attached to the motherboard's integrated SATA controller.

I have a Dell H200 flashed to IT firmware (LSI2008), which announces itself as a Dell 6 Gb HBA, connected to two Seagate ST4000VN000 drives and a Samsung 840 EVO SSD used as an L2ARC device.



root@omni:~# fmdump -p
TIME                 UUID                                 SUNW-MSG-ID EVENT
maj 01 13:16:25.9491 bf630a54-1d96-6b2b-e6e9-e3347c1ba7f3 ZFS-8000-D3 Diagnosed
maj 10 21:49:13.8088 431d3b05-328c-4ec2-d83a-f58a006ea156 SUNOS-8000-J0 Diagnosed
maj 10 21:49:14.0433 f0a4a159-daf5-41c9-b948-d68055fb5a48 SUNOS-8000-J0 Diagnosed
maj 10 21:49:14.6796 87a8a141-fa1f-6bed-f25d-b467e130c85d PCIEX-8000-43 Diagnosed




Of the fmdump entries, the last three from May 10 are the ones I'm interested in, and I chose to display two of them here. One has severity "Major", and the other is "Critical".




I see some "defect.sunos.eft.unexpected_telemetry", "class and path are incompatible" and "fault.io.pci.bus-linkerr".

Unfortunately, though, I can't tell what they mean.











root@omni:~# fmdump -V -u 431d3b05-328c-4ec2-d83a-f58a006ea156
TIME                           UUID                                 SUNW-MSG-ID
maj 10 2014 21:49:13.808892000 431d3b05-328c-4ec2-d83a-f58a006ea156 SUNOS-8000-J0

  TIME                 CLASS                                 ENA
  maj 10 21:47:03.1897 ereport.io.pcix.unex-spl              0x32b407bf59f01001

nvlist version: 0
        version = 0x0
        class = list.suspect
        uuid = 431d3b05-328c-4ec2-d83a-f58a006ea156
        code = SUNOS-8000-J0
        diag-time = 1399751353 665690
        de = (embedded nvlist)
        nvlist version: 0
                version = 0x0
                scheme = fmd
                authority = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        product-id = Precision-WorkStation-T5500
                        chassis-id = 17BPY4J
                        server-id = omni
                (end authority)

                mod-name = eft
                mod-version = 1.16
        (end de)

        fault-list-sz = 0x2
        fault-list = (array of embedded nvlists)
        (start fault-list[0])
        nvlist version: 0
                version = 0x0
                class = defect.sunos.eft.unexpected_telemetry
                certainty = 0x32
                resource = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        scheme = hc
                        hc-root = 
                        authority = (embedded nvlist)
                        nvlist version: 0
                                product-id = Precision-WorkStation-T5500
                                server-id = omni
                                chassis-id = 17BPY4J
                        (end authority)

                        hc-list-sz = 0x6
                        hc-list = (array of embedded nvlists)
                        (start hc-list[0])
                        nvlist version: 0
                                hc-name = motherboard
                                hc-id = 0
                        (end hc-list[0])
                        (start hc-list[1])
                        nvlist version: 0
                                hc-name = hostbridge
                                hc-id = 0
                        (end hc-list[1])
                        (start hc-list[2])
                        nvlist version: 0
                                hc-name = pciexrc
                                hc-id = 0
                        (end hc-list[2])
                        (start hc-list[3])
                        nvlist version: 0
                                hc-name = pciexbus
                                hc-id = 1
                        (end hc-list[3])
                        (start hc-list[4])
                        nvlist version: 0
                                hc-name = pciexdev
                                hc-id = 0
                        (end hc-list[4])
                        (start hc-list[5])
                        nvlist version: 0
                                hc-name = pciexfn
                                hc-id = 0
                        (end hc-list[5])

                (end resource)

                reason = ereport.io.pcix.unex-spl at motherboard0/hostbridge0/pciexrc0/pciexbus1/pciexdev0/pciexfn0 class and path are incompatible
                retire = 0
                response = 0
                asru = (embedded nvlist)
                nvlist version: 0
                        scheme = mod
                        version = 0x0
                        mod-id = 86
                        mod-name = pcieb
                        mod-desc = PCIe bridge/switch driver
                (end asru)

        (end fault-list[0])
        (start fault-list[1])
        nvlist version: 0
                version = 0x0
                class = fault.sunos.eft.unexpected_telemetry
                certainty = 0x32
                resource = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        scheme = hc
                        hc-root = 
                        authority = (embedded nvlist)
                        nvlist version: 0
                                product-id = Precision-WorkStation-T5500
                                server-id = omni
                                chassis-id = 17BPY4J
                        (end authority)

                        hc-list-sz = 0x6
                        hc-list = (array of embedded nvlists)
                        (start hc-list[0])
                        nvlist version: 0
                                hc-name = motherboard
                                hc-id = 0
                        (end hc-list[0])
                        (start hc-list[1])
                        nvlist version: 0
                                hc-name = hostbridge
                                hc-id = 0
                        (end hc-list[1])
                        (start hc-list[2])
                        nvlist version: 0
                                hc-name = pciexrc
                                hc-id = 0
                        (end hc-list[2])
                        (start hc-list[3])
                        nvlist version: 0
                                hc-name = pciexbus
                                hc-id = 1
                        (end hc-list[3])
                        (start hc-list[4])
                        nvlist version: 0
                                hc-name = pciexdev
                                hc-id = 0
                        (end hc-list[4])
                        (start hc-list[5])
                        nvlist version: 0
                                hc-name = pciexfn
                                hc-id = 0
                        (end hc-list[5])

                (end resource)

                reason = ereport.io.pcix.unex-spl at motherboard0/hostbridge0/pciexrc0/pciexbus1/pciexdev0/pciexfn0 class and path are incompatible
                retire = 0
                response = 0
                asru = (embedded nvlist)
                nvlist version: 0
                        scheme = dev
                        version = 0x0
                        device-path = /pci@0,0/pci8086,3408@1/pci12d8,e130@0
                (end asru)

                fru = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        scheme = hc
                        hc-root = 
                        authority = (embedded nvlist)
                        nvlist version: 0
                                product-id = Precision-WorkStation-T5500
                                server-id = omni
                                chassis-id = 17BPY4J
                        (end authority)

                        hc-list = (array of embedded nvlists)
                        (start hc-list[0])
                        nvlist version: 0
                                hc-name = motherboard
                                hc-id = 0
                        (end hc-list[0])

                (end fru)

                location = MB
        (end fault-list[1])

        fault-status = 0x1 0x1
        severity = Major
        __ttl = 0x1
        __tod = 0x536e82b9 0x3036b660

root@omni:~# fmdump -V -u 87a8a141-fa1f-6bed-f25d-b467e130c85d
TIME                           UUID                                 SUNW-MSG-ID
maj 10 2014 21:49:14.679652000 87a8a141-fa1f-6bed-f25d-b467e130c85d PCIEX-8000-43

  TIME                 CLASS                                 ENA
  maj 10 21:47:03.1897 ereport.io.pci.dpe                    0x32b407c3fd901001
  maj 10 21:47:03.1897 ereport.io.pci.sserr                  0x32b407c3fd901001
  maj 10 21:47:03.1897 ereport.io.pciex.bdg.sec-serr         0x32b407bf59f01001
  maj 10 21:47:03.1897 ereport.io.pci.sec-rserr              0x32b407bf59f01001
  maj 10 21:47:03.1897 ereport.io.pciex.rc.fe-msg            0x32b407bb51101001
  maj 10 21:47:03.1897 ereport.io.pci.sec-rserr              0x32b407bb51101001

nvlist version: 0
        version = 0x0
        class = list.suspect
        uuid = 87a8a141-fa1f-6bed-f25d-b467e130c85d
        code = PCIEX-8000-43
        diag-time = 1399751354 555330
        de = (embedded nvlist)
        nvlist version: 0
                version = 0x0
                scheme = fmd
                authority = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        product-id = Precision-WorkStation-T5500
                        chassis-id = 17BPY4J
                        server-id = omni
                (end authority)

                mod-name = eft
                mod-version = 1.16
        (end de)

        fault-list-sz = 0x2
        fault-list = (array of embedded nvlists)
        (start fault-list[0])
        nvlist version: 0
                version = 0x0
                class = fault.io.pciex.device-interr
                certainty = 0x43
                resource = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        scheme = hc
                        hc-root = 
                        authority = (embedded nvlist)
                        nvlist version: 0
                                product-id = Precision-WorkStation-T5500
                                server-id = omni
                                chassis-id = 17BPY4J
                        (end authority)

                        hc-list-sz = 0x6
                        hc-list = (array of embedded nvlists)
                        (start hc-list[0])
                        nvlist version: 0
                                hc-name = motherboard
                                hc-id = 0
                        (end hc-list[0])
                        (start hc-list[1])
                        nvlist version: 0
                                hc-name = hostbridge
                                hc-id = 0
                        (end hc-list[1])
                        (start hc-list[2])
                        nvlist version: 0
                                hc-name = pciexrc
                                hc-id = 0
                        (end hc-list[2])
                        (start hc-list[3])
                        nvlist version: 0
                                hc-name = pciexbus
                                hc-id = 1
                        (end hc-list[3])
                        (start hc-list[4])
                        nvlist version: 0
                                hc-name = pciexdev
                                hc-id = 0
                        (end hc-list[4])
                        (start hc-list[5])
                        nvlist version: 0
                                hc-name = pciexfn
                                hc-id = 0
                        (end hc-list[5])

                (end resource)

                asru = (embedded nvlist)
                nvlist version: 0
                        scheme = dev
                        version = 0x0
                        device-path = /pci@0,0/pci8086,3408@1/pci12d8,e130@0
                (end asru)

                fru = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        scheme = hc
                        hc-root = 
                        authority = (embedded nvlist)
                        nvlist version: 0
                                product-id = Precision-WorkStation-T5500
                                server-id = omni
                                chassis-id = 17BPY4J
                        (end authority)

                        hc-list = (array of embedded nvlists)
                        (start hc-list[0])
                        nvlist version: 0
                                hc-name = motherboard
                                hc-id = 0
                        (end hc-list[0])

                (end fru)

                location = MB
        (end fault-list[0])
        (start fault-list[1])
        nvlist version: 0
                version = 0x0
                class = fault.io.pci.bus-linkerr
                certainty = 0x21
                resource = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        scheme = hc
                        hc-root = 
                        authority = (embedded nvlist)
                        nvlist version: 0
                                product-id = Precision-WorkStation-T5500
                                server-id = omni
                                chassis-id = 17BPY4J
                        (end authority)

                        hc-list-sz = 0x7
                        hc-list = (array of embedded nvlists)
                        (start hc-list[0])
                        nvlist version: 0
                                hc-name = motherboard
                                hc-id = 0
                        (end hc-list[0])
                        (start hc-list[1])
                        nvlist version: 0
                                hc-name = hostbridge
                                hc-id = 0
                        (end hc-list[1])
                        (start hc-list[2])
                        nvlist version: 0
                                hc-name = pciexrc
                                hc-id = 0
                        (end hc-list[2])
                        (start hc-list[3])
                        nvlist version: 0
                                hc-name = pciexbus
                                hc-id = 1
                        (end hc-list[3])
                        (start hc-list[4])
                        nvlist version: 0
                                hc-name = pciexdev
                                hc-id = 0
                        (end hc-list[4])
                        (start hc-list[5])
                        nvlist version: 0
                                hc-name = pciexfn
                                hc-id = 0
                        (end hc-list[5])
                        (start hc-list[6])
                        nvlist version: 0
                                hc-name = pcibus
                                hc-id = 2
                        (end hc-list[6])

                (end resource)

                asru = (embedded nvlist)
                nvlist version: 0
                        scheme = dev
                        version = 0x0
                        device-path = /pci@0,0/pci8086,3408@1/pci12d8,e130@0
                (end asru)

                fru = (embedded nvlist)
                nvlist version: 0
                        version = 0x0
                        scheme = hc
                        hc-root = 
                        authority = (embedded nvlist)
                        nvlist version: 0
                                product-id = Precision-WorkStation-T5500
                                server-id = omni
                                chassis-id = 17BPY4J
                        (end authority)

                        hc-list = (array of embedded nvlists)
                        (start hc-list[0])
                        nvlist version: 0
                                hc-name = motherboard
                                hc-id = 0
                        (end hc-list[0])

                (end fru)

                location = MB
        (end fault-list[1])

        fault-status = 0x1 0x1
        severity = Critical
        __ttl = 0x1
        __tod = 0x536e82ba 0x2882aaa0

root at omni:~# 

Best regards from/Med vänliga hälsningar från

Johan Kragsterman

Capvert



More information about the OmniOS-discuss mailing list