blob: 0952cb9eef131f52a3af2191ebcafc0ecfb407ce [file] [log] [blame]
Brandon Wyman24e422f2017-07-25 19:40:14 -05001/**
2 * Copyright © 2017 IBM Corporation
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
Brandon Wyman442035f2017-08-08 15:58:45 -050016#include <phosphor-logging/log.hpp>
17#include <phosphor-logging/elog.hpp>
Brandon Wymane0eb45c2017-10-06 12:58:42 -050018#include <org/open_power/Witherspoon/Fault/error.hpp>
Matt Spinlerceacf942017-10-05 13:55:02 -050019#include <xyz/openbmc_project/Common/Device/error.hpp>
Brandon Wyman442035f2017-08-08 15:58:45 -050020#include "elog-errors.hpp"
Brandon Wyman10295542017-08-09 18:20:44 -050021#include "names_values.hpp"
Brandon Wyman24e422f2017-07-25 19:40:14 -050022#include "power_supply.hpp"
Brandon Wyman442035f2017-08-08 15:58:45 -050023#include "pmbus.hpp"
24#include "utility.hpp"
25
26using namespace phosphor::logging;
Brandon Wymane0eb45c2017-10-06 12:58:42 -050027using namespace sdbusplus::org::open_power::Witherspoon::Fault::Error;
Matt Spinlerceacf942017-10-05 13:55:02 -050028using namespace sdbusplus::xyz::openbmc_project::Common::Device::Error;
Brandon Wyman24e422f2017-07-25 19:40:14 -050029
Brandon Wyman1db9a9e2017-07-26 18:50:22 -050030namespace witherspoon
Brandon Wyman24e422f2017-07-25 19:40:14 -050031{
32namespace power
33{
34namespace psu
35{
36
// Inventory side: root that each supply's inventory path is appended to, and
// the interface/property pair used to track whether the supply is present.
constexpr const char* INVENTORY_OBJ_PATH = "/xyz/openbmc_project/inventory";
constexpr const char* INVENTORY_INTERFACE =
    "xyz.openbmc_project.Inventory.Item";
constexpr const char* PRESENT_PROP = "Present";

// Power control side: object and interface whose "state" property is
// monitored for power on/off transitions.
constexpr const char* POWER_OBJ_PATH = "/org/openbmc/control/power0";
constexpr const char* POWER_INTERFACE = "org.openbmc.control.Power";
Brandon Wyman10295542017-08-09 18:20:44 -050042
43PowerSupply::PowerSupply(const std::string& name, size_t inst,
Brandon Wyman431fbe42017-08-18 16:22:09 -050044 const std::string& objpath,
45 const std::string& invpath,
46 sdbusplus::bus::bus& bus,
47 event::Event& e,
48 std::chrono::seconds& t)
49 : Device(name, inst), monitorPath(objpath), pmbusIntf(objpath),
50 inventoryPath(invpath), bus(bus), event(e), powerOnInterval(t),
51 powerOnTimer(e, [this]()
52 {
53 this->powerOn = true;
54 })
Brandon Wyman10295542017-08-09 18:20:44 -050055{
Brandon Wyman10295542017-08-09 18:20:44 -050056 using namespace sdbusplus::bus;
57 auto present_obj_path = INVENTORY_OBJ_PATH + inventoryPath;
58 presentMatch = std::make_unique<match_t>(bus,
59 match::rules::propertiesChanged(
60 present_obj_path,
61 INVENTORY_INTERFACE),
62 [this](auto& msg)
Brandon Wyman431fbe42017-08-18 16:22:09 -050063 {
64 this->inventoryChanged(msg);
65 });
66 // Get initial presence state.
Brandon Wyman253dc9b2017-08-12 13:45:52 -050067 updatePresence();
Brandon Wyman431fbe42017-08-18 16:22:09 -050068
69 // Subscribe to power state changes
70 powerOnMatch = std::make_unique<match_t>(bus,
71 match::rules::propertiesChanged(
72 POWER_OBJ_PATH,
73 POWER_INTERFACE),
74 [this](auto& msg)
75 {
76 this->powerStateChanged(msg);
77 });
78 // Get initial power state.
79 updatePowerState();
Brandon Wyman10295542017-08-09 18:20:44 -050080}
Brandon Wyman442035f2017-08-08 15:58:45 -050081
Brandon Wymana1e96342017-09-25 16:47:44 -050082void PowerSupply::captureCmd(util::NamesValues& nv, const std::string& cmd,
83 witherspoon::pmbus::Type type)
84{
85 if (pmbusIntf.exists(cmd, type))
86 {
87 try
88 {
89 auto val = pmbusIntf.read(cmd, type);
90 nv.add(cmd, val);
91 }
92 catch (std::exception& e)
93 {
94 log<level::INFO>("Unable to capture metadata", entry("CMD=%s",
95 cmd));
96 }
97 }
98}
Brandon Wyman431fbe42017-08-18 16:22:09 -050099
Brandon Wyman1db9a9e2017-07-26 18:50:22 -0500100void PowerSupply::analyze()
101{
Brandon Wyman442035f2017-08-08 15:58:45 -0500102 using namespace witherspoon::pmbus;
103
104 try
105 {
Brandon Wyman10295542017-08-09 18:20:44 -0500106 if (present)
Brandon Wyman442035f2017-08-08 15:58:45 -0500107 {
Brandon Wyman764c7972017-08-22 17:05:36 -0500108 std::uint16_t statusWord = 0;
Brandon Wyman764c7972017-08-22 17:05:36 -0500109
110 // Read the 2 byte STATUS_WORD value to check for faults.
111 statusWord = pmbusIntf.read(STATUS_WORD, Type::Debug);
112
Brandon Wyman10295542017-08-09 18:20:44 -0500113 //TODO: 3 consecutive reads should be performed.
114 // If 3 consecutive reads are seen, log the fault.
115 // Driver gives cached value, read once a second.
116 // increment for fault on, decrement for fault off, to deglitch.
117 // If count reaches 3, we have fault. If count reaches 0, fault is
118 // cleared.
119
Brandon Wyman603cc002017-08-28 18:17:58 -0500120 checkInputFault(statusWord);
Brandon Wyman764c7972017-08-22 17:05:36 -0500121
122 if (powerOn)
123 {
Brandon Wyman12661f12017-08-31 15:28:21 -0500124 checkFanFault(statusWord);
Brandon Wyman875b3632017-09-13 18:46:03 -0500125 checkTemperatureFault(statusWord);
Brandon Wymancfa032b2017-09-25 17:37:50 -0500126 checkOutputOvervoltageFault(statusWord);
127 checkCurrentOutOverCurrentFault(statusWord);
128 checkPGOrUnitOffFault(statusWord);
Brandon Wyman442035f2017-08-08 15:58:45 -0500129 }
130 }
131 }
132 catch (ReadFailure& e)
133 {
134 if (!readFailLogged)
135 {
136 commit<ReadFailure>();
137 readFailLogged = true;
Brandon Wyman442035f2017-08-08 15:58:45 -0500138 }
139 }
140
Brandon Wyman1db9a9e2017-07-26 18:50:22 -0500141 return;
142}
143
Brandon Wyman10295542017-08-09 18:20:44 -0500144void PowerSupply::inventoryChanged(sdbusplus::message::message& msg)
145{
146 std::string msgSensor;
147 std::map<std::string, sdbusplus::message::variant<uint32_t, bool>> msgData;
148 msg.read(msgSensor, msgData);
149
150 // Check if it was the Present property that changed.
151 auto valPropMap = msgData.find(PRESENT_PROP);
152 if (valPropMap != msgData.end())
153 {
154 present = sdbusplus::message::variant_ns::get<bool>(valPropMap->second);
155
156 if (present)
157 {
158 readFailLogged = false;
159 vinUVFault = false;
Brandon Wyman253dc9b2017-08-12 13:45:52 -0500160 inputFault = false;
Brandon Wymanb165c252017-08-25 18:59:54 -0500161 outputOCFault = false;
Brandon Wymanab05c072017-08-30 18:26:41 -0500162 outputOVFault = false;
Brandon Wyman12661f12017-08-31 15:28:21 -0500163 fanFault = false;
Brandon Wyman875b3632017-09-13 18:46:03 -0500164 temperatureFault = false;
Brandon Wyman10295542017-08-09 18:20:44 -0500165 }
166 }
167
168 return;
169}
170
171void PowerSupply::updatePresence()
172{
173 // Use getProperty utility function to get presence status.
174 std::string path = INVENTORY_OBJ_PATH + inventoryPath;
175 std::string service = "xyz.openbmc_project.Inventory.Manager";
Brandon Wyman8731a302017-08-16 16:15:34 -0500176
Brandon Wyman800e01b2017-10-02 17:30:37 -0500177 util::getProperty(INVENTORY_INTERFACE, PRESENT_PROP, path,service, bus,
178 this->present);
Brandon Wyman10295542017-08-09 18:20:44 -0500179}
180
Brandon Wyman431fbe42017-08-18 16:22:09 -0500181void PowerSupply::powerStateChanged(sdbusplus::message::message& msg)
182{
183 int32_t state = 0;
184 std::string msgSensor;
185 std::map<std::string, sdbusplus::message::variant<int32_t, int32_t>>
186 msgData;
187 msg.read(msgSensor, msgData);
188
189 // Check if it was the Present property that changed.
190 auto valPropMap = msgData.find("state");
191 if (valPropMap != msgData.end())
192 {
193 state = sdbusplus::message::variant_ns::get<int32_t>(valPropMap->second);
194
195 // Power is on when state=1. Set the fault logged variables to false
196 // and start the power on timer when the state changes to 1.
197 if (state)
198 {
199 readFailLogged = false;
200 vinUVFault = false;
201 inputFault = false;
Brandon Wyman593d24f2017-10-13 18:15:23 -0500202 powerOnFault = 0;
Brandon Wymanb165c252017-08-25 18:59:54 -0500203 outputOCFault = false;
Brandon Wymanab05c072017-08-30 18:26:41 -0500204 outputOVFault = false;
Brandon Wyman12661f12017-08-31 15:28:21 -0500205 fanFault = false;
Brandon Wyman875b3632017-09-13 18:46:03 -0500206 temperatureFault = false;
Brandon Wyman431fbe42017-08-18 16:22:09 -0500207 powerOnTimer.start(powerOnInterval, Timer::TimerType::oneshot);
208 }
209 else
210 {
211 powerOnTimer.stop();
212 powerOn = false;
213 }
214 }
215
216}
217
218void PowerSupply::updatePowerState()
219{
220 // When state = 1, system is powered on
221 int32_t state = 0;
222
223 try
224 {
225 auto service = util::getService(POWER_OBJ_PATH,
226 POWER_INTERFACE,
227 bus);
228
229 // Use getProperty utility function to get power state.
230 util::getProperty<int32_t>(POWER_INTERFACE,
231 "state",
232 POWER_OBJ_PATH,
233 service,
234 bus,
235 state);
236
237 if (state)
238 {
239 powerOn = true;
240 }
241 else
242 {
243 powerOn = false;
244 }
245 }
246 catch (std::exception& e)
247 {
248 log<level::INFO>("Failed to get power state. Assuming it is off.");
249 powerOn = false;
250 }
251
252}
253
Brandon Wyman603cc002017-08-28 18:17:58 -0500254void PowerSupply::checkInputFault(const uint16_t statusWord)
255{
256 using namespace witherspoon::pmbus;
257
258 std::uint8_t statusInput = 0;
259
260 if ((statusWord & status_word::VIN_UV_FAULT) && !vinUVFault)
261 {
262 vinUVFault = true;
263
264 util::NamesValues nv;
265 nv.add("STATUS_WORD", statusWord);
266
Brandon Wymane0eb45c2017-10-06 12:58:42 -0500267 using metadata = org::open_power::Witherspoon::Fault::
Brandon Wyman603cc002017-08-28 18:17:58 -0500268 PowerSupplyUnderVoltageFault;
269
270 report<PowerSupplyUnderVoltageFault>(metadata::RAW_STATUS(
271 nv.get().c_str()));
272 }
273 else
274 {
275 if (vinUVFault)
276 {
277 vinUVFault = false;
278 log<level::INFO>("VIN_UV_FAULT cleared",
279 entry("POWERSUPPLY=%s",
280 inventoryPath.c_str()));
281 }
282 }
283
284 if ((statusWord & status_word::INPUT_FAULT_WARN) && !inputFault)
285 {
286 inputFault = true;
287
Brandon Wyman603cc002017-08-28 18:17:58 -0500288 util::NamesValues nv;
289 nv.add("STATUS_WORD", statusWord);
Brandon Wymana1e96342017-09-25 16:47:44 -0500290 captureCmd(nv, STATUS_INPUT, Type::Debug);
Brandon Wyman603cc002017-08-28 18:17:58 -0500291
Brandon Wymane0eb45c2017-10-06 12:58:42 -0500292 using metadata = org::open_power::Witherspoon::Fault::
Brandon Wyman603cc002017-08-28 18:17:58 -0500293 PowerSupplyInputFault;
294
295 report<PowerSupplyInputFault>(
296 metadata::RAW_STATUS(nv.get().c_str()));
297 }
298 else
299 {
300 if ((inputFault) &&
301 !(statusWord & status_word::INPUT_FAULT_WARN))
302 {
303 inputFault = false;
304 statusInput = pmbusIntf.read(STATUS_INPUT, Type::Debug);
305
306 log<level::INFO>("INPUT_FAULT_WARN cleared",
307 entry("POWERSUPPLY=%s", inventoryPath.c_str()),
308 entry("STATUS_WORD=0x%04X", statusWord),
309 entry("STATUS_INPUT=0x%02X", statusInput));
310 }
311 }
312}
313
314void PowerSupply::checkPGOrUnitOffFault(const uint16_t statusWord)
315{
316 using namespace witherspoon::pmbus;
317
Brandon Wyman593d24f2017-10-13 18:15:23 -0500318 if (powerOnFault < FAULT_COUNT)
Brandon Wyman603cc002017-08-28 18:17:58 -0500319 {
Brandon Wyman593d24f2017-10-13 18:15:23 -0500320 // Check PG# and UNIT_IS_OFF
321 if ((statusWord & status_word::POWER_GOOD_NEGATED) ||
322 (statusWord & status_word::UNIT_IS_OFF))
323 {
324 log<level::INFO>("PGOOD or UNIT_IS_OFF bit bad",
325 entry("STATUS_WORD=0x%04X", statusWord));
326 powerOnFault++;
327 }
328 else
329 {
330 if (powerOnFault > 0)
331 {
332 log<level::INFO>("PGOOD and UNIT_IS_OFF bits good");
333 powerOnFault = 0;
334 }
335 }
Brandon Wyman603cc002017-08-28 18:17:58 -0500336
Brandon Wyman593d24f2017-10-13 18:15:23 -0500337 if (powerOnFault >= FAULT_COUNT)
338 {
339 util::NamesValues nv;
340 nv.add("STATUS_WORD", statusWord);
341 captureCmd(nv, STATUS_INPUT, Type::Debug);
342 auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0);
343 captureCmd(nv, status0Vout, Type::Debug);
344 captureCmd(nv, STATUS_IOUT, Type::Debug);
345 captureCmd(nv, STATUS_MFR, Type::Debug);
Brandon Wyman603cc002017-08-28 18:17:58 -0500346
Brandon Wyman593d24f2017-10-13 18:15:23 -0500347 using metadata = org::open_power::Witherspoon::Fault::
348 PowerSupplyShouldBeOn;
Brandon Wyman603cc002017-08-28 18:17:58 -0500349
Brandon Wyman593d24f2017-10-13 18:15:23 -0500350 // A power supply is OFF (or pgood low) but should be on.
351 report<PowerSupplyShouldBeOn>(
352 metadata::RAW_STATUS(nv.get().c_str()),
353 metadata::CALLOUT_INVENTORY_PATH(
354 inventoryPath.c_str()));
355 }
Brandon Wyman603cc002017-08-28 18:17:58 -0500356 }
357
358}
359
360void PowerSupply::checkCurrentOutOverCurrentFault(const uint16_t statusWord)
361{
362 using namespace witherspoon::pmbus;
363
Brandon Wyman603cc002017-08-28 18:17:58 -0500364 // Check for an output overcurrent fault.
365 if ((statusWord & status_word::IOUT_OC_FAULT) &&
366 !outputOCFault)
367 {
Brandon Wyman603cc002017-08-28 18:17:58 -0500368 util::NamesValues nv;
369 nv.add("STATUS_WORD", statusWord);
Brandon Wymana1e96342017-09-25 16:47:44 -0500370 captureCmd(nv, STATUS_INPUT, Type::Debug);
371 auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0);
372 captureCmd(nv, status0Vout, Type::Debug);
373 captureCmd(nv, STATUS_IOUT, Type::Debug);
374 captureCmd(nv, STATUS_MFR, Type::Debug);
Brandon Wyman603cc002017-08-28 18:17:58 -0500375
Brandon Wymane0eb45c2017-10-06 12:58:42 -0500376 using metadata = org::open_power::Witherspoon::Fault::
Brandon Wyman603cc002017-08-28 18:17:58 -0500377 PowerSupplyOutputOvercurrent;
378
379 report<PowerSupplyOutputOvercurrent>(metadata::RAW_STATUS(
380 nv.get().c_str()),
381 metadata::CALLOUT_INVENTORY_PATH(
382 inventoryPath.c_str()));
383
384 outputOCFault = true;
385 }
386}
387
Brandon Wymanab05c072017-08-30 18:26:41 -0500388void PowerSupply::checkOutputOvervoltageFault(const uint16_t statusWord)
389{
390 using namespace witherspoon::pmbus;
391
Brandon Wymanab05c072017-08-30 18:26:41 -0500392 // Check for an output overvoltage fault.
393 if ((statusWord & status_word::VOUT_OV_FAULT) &&
394 !outputOVFault)
395 {
Brandon Wymanab05c072017-08-30 18:26:41 -0500396 util::NamesValues nv;
397 nv.add("STATUS_WORD", statusWord);
Brandon Wymana1e96342017-09-25 16:47:44 -0500398 captureCmd(nv, STATUS_INPUT, Type::Debug);
399 auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0);
400 captureCmd(nv, status0Vout, Type::Debug);
401 captureCmd(nv, STATUS_IOUT, Type::Debug);
402 captureCmd(nv, STATUS_MFR, Type::Debug);
Brandon Wymanab05c072017-08-30 18:26:41 -0500403
Brandon Wymane0eb45c2017-10-06 12:58:42 -0500404 using metadata = org::open_power::Witherspoon::Fault::
Brandon Wymanab05c072017-08-30 18:26:41 -0500405 PowerSupplyOutputOvervoltage;
406
407 report<PowerSupplyOutputOvervoltage>(metadata::RAW_STATUS(
408 nv.get().c_str()),
409 metadata::CALLOUT_INVENTORY_PATH(
410 inventoryPath.c_str()));
411
412 outputOVFault = true;
413 }
414}
415
Brandon Wyman12661f12017-08-31 15:28:21 -0500416void PowerSupply::checkFanFault(const uint16_t statusWord)
417{
418 using namespace witherspoon::pmbus;
419
Brandon Wyman875b3632017-09-13 18:46:03 -0500420 // Check for a fan fault or warning condition
Brandon Wyman12661f12017-08-31 15:28:21 -0500421 if ((statusWord & status_word::FAN_FAULT) &&
422 !fanFault)
423 {
Brandon Wyman12661f12017-08-31 15:28:21 -0500424 util::NamesValues nv;
425 nv.add("STATUS_WORD", statusWord);
Brandon Wymana1e96342017-09-25 16:47:44 -0500426 captureCmd(nv, STATUS_MFR, Type::Debug);
427 captureCmd(nv, STATUS_TEMPERATURE, Type::Debug);
428 captureCmd(nv, STATUS_FANS_1_2, Type::Debug);
Brandon Wyman12661f12017-08-31 15:28:21 -0500429
Brandon Wymane0eb45c2017-10-06 12:58:42 -0500430 using metadata = org::open_power::Witherspoon::Fault::
Brandon Wyman12661f12017-08-31 15:28:21 -0500431 PowerSupplyFanFault;
432
433 report<PowerSupplyFanFault>(
434 metadata::RAW_STATUS(nv.get().c_str()),
435 metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str()));
436
437 fanFault = true;
438 }
439}
440
Brandon Wyman875b3632017-09-13 18:46:03 -0500441void PowerSupply::checkTemperatureFault(const uint16_t statusWord)
442{
443 using namespace witherspoon::pmbus;
444
445 // Due to how the PMBus core device driver sends a clear faults command
446 // the bit in STATUS_WORD will likely be cleared when we attempt to examine
447 // it for a Thermal Fault or Warning. So, check the STATUS_WORD and the
448 // STATUS_TEMPERATURE bits. If either indicates a fault, proceed with
449 // logging the over-temperature condition.
450 std::uint8_t statusTemperature = 0;
451 statusTemperature = pmbusIntf.read(STATUS_TEMPERATURE, Type::Debug);
452 if (((statusWord & status_word::TEMPERATURE_FAULT_WARN) ||
453 (statusTemperature & status_temperature::OT_FAULT)) &&
454 !temperatureFault)
455 {
456 // The power supply has had an over-temperature condition.
457 // This may not result in a shutdown if experienced for a short
458 // duration.
459 // This should not occur under normal conditions.
460 // The power supply may be faulty, or the paired supply may be putting
461 // out less current.
462 // Capture command responses with potentially relevant information,
463 // and call out the power supply reporting the condition.
Brandon Wyman875b3632017-09-13 18:46:03 -0500464 util::NamesValues nv;
465 nv.add("STATUS_WORD", statusWord);
Brandon Wymana1e96342017-09-25 16:47:44 -0500466 captureCmd(nv, STATUS_MFR, Type::Debug);
467 captureCmd(nv, STATUS_IOUT, Type::Debug);
Brandon Wyman875b3632017-09-13 18:46:03 -0500468 nv.add("STATUS_TEMPERATURE", statusTemperature);
Brandon Wymana1e96342017-09-25 16:47:44 -0500469 captureCmd(nv, STATUS_FANS_1_2, Type::Debug);
Brandon Wyman875b3632017-09-13 18:46:03 -0500470
Brandon Wymane0eb45c2017-10-06 12:58:42 -0500471 using metadata = org::open_power::Witherspoon::Fault::
Brandon Wyman875b3632017-09-13 18:46:03 -0500472 PowerSupplyTemperatureFault;
473
474 report<PowerSupplyTemperatureFault>(
475 metadata::RAW_STATUS(nv.get().c_str()),
476 metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str()));
477
478 temperatureFault = true;
479 }
480}
481
Brandon Wyman1db9a9e2017-07-26 18:50:22 -0500482void PowerSupply::clearFaults()
483{
Brandon Wyman10295542017-08-09 18:20:44 -0500484 //TODO - Clear faults at pre-poweron. openbmc/openbmc#1736
Brandon Wyman1db9a9e2017-07-26 18:50:22 -0500485 return;
486}
487
Brandon Wyman24e422f2017-07-25 19:40:14 -0500488}
489}
490}