Corrections for GA2 GPU naming
Correct the policy table by adding entries for the new way GPUs are
called out in GA2. GPU callouts change from gpu# with a custom callout to
/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card#
with a callout inventory path. The old entries remain in place to
support previously GA'd systems.
Signed-off-by: Justin Thaler <thalerj@us.ibm.com>
diff --git a/thalerj/policyTable.json b/thalerj/policyTable.json
index db0089b..8d3d025 100644
--- a/thalerj/policyTable.json
+++ b/thalerj/policyTable.json
@@ -3633,6 +3633,132 @@
"UserAction": null,
"VMMigrationFlag": null
},
+ "org.open_power.Witherspoon.Fault.Error.GPUOverTemp||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card0": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Cooling",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUOverTemp",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPCA0066M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 0 suffered an over-temperature fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card0",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Cooling",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUOverTemp||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card1": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Cooling",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUOverTemp",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPCA0066M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 1 suffered an over-temperature fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card1",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Cooling",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUOverTemp||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card2": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Cooling",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUOverTemp",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPCA0066M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 2 suffered an over-temperature fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card2",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Cooling",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUOverTemp||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card3": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Cooling",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUOverTemp",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPCA0066M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 3 suffered an over-temperature fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card3",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Cooling",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUOverTemp||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card4": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Cooling",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUOverTemp",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPCA0066M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 4 suffered an over-temperature fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card4",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Cooling",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUOverTemp||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card5": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Cooling",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUOverTemp",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPCA0066M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 5 suffered an over-temperature fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card5",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Cooling",
+ "VMMigrationFlag": null
+ },
"org.open_power.Witherspoon.Fault.Error.GPUPowerFault||/xyz/openbmc_project/inventory/system/chassis/motherboard/gpu0": {
"AffectedLEDs": null,
"AffectedSubsystem": "Power",
@@ -3759,6 +3885,132 @@
"UserAction": null,
"VMMigrationFlag": null
},
+ "org.open_power.Witherspoon.Fault.Error.GPUPowerFault||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card0": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Power",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUPowerFault",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPPW0038M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 0 suffered a power fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card0",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Power",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUPowerFault||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card1": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Power",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUPowerFault",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPPW0038M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 1 suffered a power fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card1",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Power",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUPowerFault||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card2": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Power",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUPowerFault",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPPW0038M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 2 suffered a power fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card2",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Power",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUPowerFault||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card3": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Power",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUPowerFault",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPPW0038M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 3 suffered a power fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card3",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Power",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUPowerFault||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card4": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Power",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUPowerFault",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPPW0038M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 4 suffered a power fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card4",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Power",
+ "VMMigrationFlag": null
+ },
+ "org.open_power.Witherspoon.Fault.Error.GPUPowerFault||/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card5": {
+ "AffectedLEDs": null,
+ "AffectedSubsystem": "Power",
+ "BMCMessageID": "org.open_power.Witherspoon.Fault.Error.GPUPowerFault",
+ "CallHomeCandidate": false,
+ "CommonEventID": "FQPSPPW0038M",
+ "ComponentInstance": null,
+ "DateAdded": null,
+ "DateReviewed": null,
+ "EventType": "Environmental",
+ "Internal": false,
+ "LengthyDescription": null,
+ "LogSource": "BMC",
+ "Message": "GPU 5 suffered a power fault",
+ "ReferencedInventory": "/xyz/openbmc_project/inventory/system/chassis/motherboard/gv100card5",
+ "RelatedEventIDs": {},
+ "Serviceable": true,
+ "Severity": "Critical",
+ "UserAction": "Power",
+ "VMMigrationFlag": null
+ },
"org.open_power.Witherspoon.Fault.Error.PowerOnFailure": {
"AffectedLEDs": null,
"AffectedSubsystem": "Power",
@@ -16383,7 +16635,7 @@
},
"fileInfo": {
"Entity": "IBM OpenBMC",
- "Version": 1.5,
+ "Version": 1.55,
"language": "English"
}
}
\ No newline at end of file