blob: e41887931e3855a056fda8f838c63aab2984c663 [file] [log] [blame]
Josh D. Kingbdd9cb72016-12-19 11:13:43 -06001#include "bmc_state_manager.hpp"
Andrew Geisslere426b582020-05-28 12:40:55 -05002
Andrew Geissler98e64e62022-01-25 16:02:56 -06003#include "utils.hpp"
Andrew Geissler2f60aae2019-09-12 13:25:21 -05004#include "xyz/openbmc_project/Common/error.hpp"
Josh D. Kingbdd9cb72016-12-19 11:13:43 -06005
Andrew Geissler98e64e62022-01-25 16:02:56 -06006#include <gpiod.h>
Andrew Geisslere426b582020-05-28 12:40:55 -05007#include <sys/sysinfo.h>
8
9#include <phosphor-logging/elog-errors.hpp>
Andrew Geissler429100a2021-09-09 12:50:24 -050010#include <phosphor-logging/lg2.hpp>
Andrew Geisslere426b582020-05-28 12:40:55 -050011#include <sdbusplus/exception.hpp>
12
13#include <cassert>
Tim Lee2bfb1ef2021-03-17 09:50:35 +080014#include <filesystem>
15#include <fstream>
16#include <iostream>
Andrew Geisslere426b582020-05-28 12:40:55 -050017
Josh D. Kingbdd9cb72016-12-19 11:13:43 -060018namespace phosphor
19{
20namespace state
21{
22namespace manager
23{
24
Andrew Geissler429100a2021-09-09 12:50:24 -050025PHOSPHOR_LOG2_USING;
26
Josh D. King6db38222016-12-19 14:52:40 -060027// When you see server:: you know we're referencing our base class
28namespace server = sdbusplus::xyz::openbmc_project::State::server;
29
30using namespace phosphor::logging;
Andrew Geissler2f60aae2019-09-12 13:25:21 -050031using sdbusplus::xyz::openbmc_project::Common::Error::InternalFailure;
Josh D. King6db38222016-12-19 14:52:40 -060032
Andrew Geissler9eb0e442022-02-18 10:21:15 -060033constexpr auto obmcQuiesceTarget = "obmc-bmc-service-quiesce@0.target";
Anthony Wilsoneef31f82019-04-23 17:04:09 -050034constexpr auto obmcStandbyTarget = "multi-user.target";
Josh D. Kingd613b812016-12-19 16:47:45 -060035constexpr auto signalDone = "done";
Josh D. Kingd3e58472017-02-02 11:09:11 -060036constexpr auto activeState = "active";
Josh D. Kingd613b812016-12-19 16:47:45 -060037
Josh D. King5162a7b2016-12-19 16:15:00 -060038/* Map a transition to it's systemd target */
Andrew Geissler58a18012018-01-19 19:36:05 -080039const std::map<server::BMC::Transition, const char*> SYSTEMD_TABLE = {
40 {server::BMC::Transition::Reboot, "reboot.target"}};
Josh D. King5162a7b2016-12-19 16:15:00 -060041
Andrew Geissler58a18012018-01-19 19:36:05 -080042constexpr auto SYSTEMD_SERVICE = "org.freedesktop.systemd1";
43constexpr auto SYSTEMD_OBJ_PATH = "/org/freedesktop/systemd1";
44constexpr auto SYSTEMD_INTERFACE = "org.freedesktop.systemd1.Manager";
Josh D. Kingd3e58472017-02-02 11:09:11 -060045constexpr auto SYSTEMD_PRP_INTERFACE = "org.freedesktop.DBus.Properties";
Josh D. Kingd3e58472017-02-02 11:09:11 -060046
Andrew Geissler2774c782022-02-17 16:57:14 -060047std::string BMC::getUnitState(const std::string& unitToCheck)
Josh D. Kingd3e58472017-02-02 11:09:11 -060048{
Patrick Williams2975e262020-05-13 18:01:09 -050049 std::variant<std::string> currentState;
Josh D. King2b5d8872017-02-21 13:37:17 -060050 sdbusplus::message::object_path unitTargetPath;
Josh D. Kingd3e58472017-02-02 11:09:11 -060051
Andrew Geissler58a18012018-01-19 19:36:05 -080052 auto method = this->bus.new_method_call(SYSTEMD_SERVICE, SYSTEMD_OBJ_PATH,
53 SYSTEMD_INTERFACE, "GetUnit");
Josh D. King2b5d8872017-02-21 13:37:17 -060054
Andrew Geissler2774c782022-02-17 16:57:14 -060055 method.append(unitToCheck);
Josh D. King2b5d8872017-02-21 13:37:17 -060056
Anthony Wilson32c532e2018-10-25 21:56:07 -050057 try
Josh D. King2b5d8872017-02-21 13:37:17 -060058 {
Anthony Wilson32c532e2018-10-25 21:56:07 -050059 auto result = this->bus.call(method);
60 result.read(unitTargetPath);
61 }
Patrick Williamsf053e6f2022-07-22 19:26:54 -050062 catch (const sdbusplus::exception_t& e)
Anthony Wilson32c532e2018-10-25 21:56:07 -050063 {
Andrew Geissler37d36312022-03-09 16:24:45 -060064 // Not all input units will have been loaded yet so just return an
65 // empty string if an exception is caught in this path
66 info("Unit {UNIT} not found: {ERROR}", "UNIT", unitToCheck, "ERROR", e);
Andrew Geissler2774c782022-02-17 16:57:14 -060067 return std::string{};
Josh D. King2b5d8872017-02-21 13:37:17 -060068 }
69
Andrew Geissler58a18012018-01-19 19:36:05 -080070 method = this->bus.new_method_call(
71 SYSTEMD_SERVICE,
72 static_cast<const std::string&>(unitTargetPath).c_str(),
73 SYSTEMD_PRP_INTERFACE, "Get");
Josh D. Kingd3e58472017-02-02 11:09:11 -060074
75 method.append("org.freedesktop.systemd1.Unit", "ActiveState");
76
Anthony Wilson32c532e2018-10-25 21:56:07 -050077 try
Josh D. King2b5d8872017-02-21 13:37:17 -060078 {
Anthony Wilson32c532e2018-10-25 21:56:07 -050079 auto result = this->bus.call(method);
80
Andrew Geissler37d36312022-03-09 16:24:45 -060081 // Is input target active or inactive?
Anthony Wilson32c532e2018-10-25 21:56:07 -050082 result.read(currentState);
83 }
Patrick Williamsf053e6f2022-07-22 19:26:54 -050084 catch (const sdbusplus::exception_t& e)
Anthony Wilson32c532e2018-10-25 21:56:07 -050085 {
Andrew Geissler429100a2021-09-09 12:50:24 -050086 info("Error in ActiveState Get: {ERROR}", "ERROR", e);
Andrew Geissler2774c782022-02-17 16:57:14 -060087 return std::string{};
Josh D. King2b5d8872017-02-21 13:37:17 -060088 }
Andrew Geissler2774c782022-02-17 16:57:14 -060089 return (std::get<std::string>(currentState));
90}
Josh D. Kingd3e58472017-02-02 11:09:11 -060091
Andrew Geissler2774c782022-02-17 16:57:14 -060092void BMC::discoverInitialState()
93{
Andrew Geissler9eb0e442022-02-18 10:21:15 -060094 // First look to see if the BMC quiesce target is active
95 auto currentStateStr = getUnitState(obmcQuiesceTarget);
96 if (currentStateStr == activeState)
97 {
98 info("Setting the BMCState field to BMC_QUIESCED");
99 this->currentBMCState(BMCState::Quiesced);
100 return;
101 }
102
103 // If not quiesced, then check standby target
104 currentStateStr = getUnitState(obmcStandbyTarget);
Anthony Wilson32c532e2018-10-25 21:56:07 -0500105 if (currentStateStr == activeState)
Josh D. Kingd3e58472017-02-02 11:09:11 -0600106 {
Andrew Geissler429100a2021-09-09 12:50:24 -0500107 info("Setting the BMCState field to BMC_READY");
Josh D. Kingd3e58472017-02-02 11:09:11 -0600108 this->currentBMCState(BMCState::Ready);
Josh D. Kingd3e58472017-02-02 11:09:11 -0600109 }
110 else
111 {
Andrew Geissler429100a2021-09-09 12:50:24 -0500112 info("Setting the BMCState field to BMC_NOTREADY");
Josh D. Kingd3e58472017-02-02 11:09:11 -0600113 this->currentBMCState(BMCState::NotReady);
114 }
115
116 return;
117}
118
Josh D. King5162a7b2016-12-19 16:15:00 -0600119void BMC::executeTransition(const Transition tranReq)
120{
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000121 // HardReboot does not shutdown any services and immediately transitions
122 // into the reboot process
123 if (server::BMC::Transition::HardReboot == tranReq)
Anthony Wilson32c532e2018-10-25 21:56:07 -0500124 {
Andrew Geissler4ee59462022-04-28 16:58:26 -0400125 // Put BMC state not NotReady when issuing a BMC reboot
126 // and stop monitoring for state changes
127 this->currentBMCState(BMCState::NotReady);
128 this->stateSignal.reset();
129
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000130 auto method = this->bus.new_method_call(
131 SYSTEMD_SERVICE, SYSTEMD_OBJ_PATH, SYSTEMD_INTERFACE, "Reboot");
132 try
133 {
134 this->bus.call(method);
135 }
Patrick Williamsf053e6f2022-07-22 19:26:54 -0500136 catch (const sdbusplus::exception_t& e)
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000137 {
Andrew Geissler429100a2021-09-09 12:50:24 -0500138 info("Error in HardReboot: {ERROR}", "ERROR", e);
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000139 }
Anthony Wilson32c532e2018-10-25 21:56:07 -0500140 }
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000141 else
Anthony Wilson32c532e2018-10-25 21:56:07 -0500142 {
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000143 // Check to make sure it can be found
144 auto iter = SYSTEMD_TABLE.find(tranReq);
145 if (iter == SYSTEMD_TABLE.end())
146 return;
Anthony Wilson32c532e2018-10-25 21:56:07 -0500147
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000148 const auto& sysdUnit = iter->second;
149
150 auto method = this->bus.new_method_call(
151 SYSTEMD_SERVICE, SYSTEMD_OBJ_PATH, SYSTEMD_INTERFACE, "StartUnit");
152 // The only valid transition is reboot and that
153 // needs to be irreversible once started
154
155 method.append(sysdUnit, "replace-irreversibly");
156
Andrew Geissler4ee59462022-04-28 16:58:26 -0400157 // Put BMC state not NotReady when issuing a BMC reboot
158 // and stop monitoring for state changes
159 this->currentBMCState(BMCState::NotReady);
160 this->stateSignal.reset();
161
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000162 try
163 {
164 this->bus.call(method);
165 }
Patrick Williamsf053e6f2022-07-22 19:26:54 -0500166 catch (const sdbusplus::exception_t& e)
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000167 {
Andrew Geissler429100a2021-09-09 12:50:24 -0500168 info("Error in StartUnit - replace-irreversibly: {ERROR}", "ERROR",
169 e);
Jayaprakash Mutyala44c223c2020-08-14 00:08:03 +0000170 }
171 }
Josh D. King5162a7b2016-12-19 16:15:00 -0600172 return;
173}
174
Patrick Williamsf053e6f2022-07-22 19:26:54 -0500175int BMC::bmcStateChange(sdbusplus::message_t& msg)
Josh D. Kingd613b812016-12-19 16:47:45 -0600176{
Andrew Geissler58a18012018-01-19 19:36:05 -0800177 uint32_t newStateID{};
Josh D. Kingd613b812016-12-19 16:47:45 -0600178 sdbusplus::message::object_path newStateObjPath;
179 std::string newStateUnit{};
180 std::string newStateResult{};
181
Andrew Geissler58a18012018-01-19 19:36:05 -0800182 // Read the msg and populate each variable
Patrick Williamsd32f8182017-05-05 15:55:24 -0500183 msg.read(newStateID, newStateObjPath, newStateUnit, newStateResult);
Josh D. Kingd613b812016-12-19 16:47:45 -0600184
Andrew Geissler9eb0e442022-02-18 10:21:15 -0600185 if ((newStateUnit == obmcQuiesceTarget) && (newStateResult == signalDone))
Josh D. Kingd613b812016-12-19 16:47:45 -0600186 {
Andrew Geissler9eb0e442022-02-18 10:21:15 -0600187 error("BMC has entered BMC_QUIESCED state");
188 this->currentBMCState(BMCState::Quiesced);
Josh D. Kingd613b812016-12-19 16:47:45 -0600189
Andrew Geissler9eb0e442022-02-18 10:21:15 -0600190 // There is no getting out of Quiesced once entered (other then BMC
191 // reboot) so stop watching for signals
Andrew Geissler58a18012018-01-19 19:36:05 -0800192 auto method =
193 this->bus.new_method_call(SYSTEMD_SERVICE, SYSTEMD_OBJ_PATH,
194 SYSTEMD_INTERFACE, "Unsubscribe");
Anthony Wilson32c532e2018-10-25 21:56:07 -0500195
196 try
197 {
198 this->bus.call(method);
Anthony Wilson32c532e2018-10-25 21:56:07 -0500199 }
Patrick Williamsf053e6f2022-07-22 19:26:54 -0500200 catch (const sdbusplus::exception_t& e)
Anthony Wilson32c532e2018-10-25 21:56:07 -0500201 {
Andrew Geissler429100a2021-09-09 12:50:24 -0500202 info("Error in Unsubscribe: {ERROR}", "ERROR", e);
Anthony Wilson32c532e2018-10-25 21:56:07 -0500203 }
Andrew Geissler9eb0e442022-02-18 10:21:15 -0600204
Andrew Geissler71e538f2022-03-21 11:22:43 -0500205 // disable the system state change object as well
NodeMan978c26f0e2022-04-27 20:15:22 -0500206 this->stateSignal.reset();
Andrew Geissler71e538f2022-03-21 11:22:43 -0500207
Andrew Geissler9eb0e442022-02-18 10:21:15 -0600208 return 0;
209 }
210
211 // Caught the signal that indicates the BMC is now BMC_READY
212 if ((newStateUnit == obmcStandbyTarget) && (newStateResult == signalDone))
213 {
214 info("BMC_READY");
215 this->currentBMCState(BMCState::Ready);
Josh D. Kingd613b812016-12-19 16:47:45 -0600216 }
217
218 return 0;
219}
220
Josh D. King6db38222016-12-19 14:52:40 -0600221BMC::Transition BMC::requestedBMCTransition(Transition value)
222{
Andrew Geissler429100a2021-09-09 12:50:24 -0500223 info("Setting the RequestedBMCTransition field to "
224 "{REQUESTED_BMC_TRANSITION}",
225 "REQUESTED_BMC_TRANSITION", value);
Josh D. King6db38222016-12-19 14:52:40 -0600226
Josh D. King5162a7b2016-12-19 16:15:00 -0600227 executeTransition(value);
228 return server::BMC::requestedBMCTransition(value);
Josh D. King6db38222016-12-19 14:52:40 -0600229}
230
Josh D. Kingd613b812016-12-19 16:47:45 -0600231BMC::BMCState BMC::currentBMCState(BMCState value)
232{
Andrew Geissler429100a2021-09-09 12:50:24 -0500233 info("Setting the BMCState field to {CURRENT_BMC_STATE}",
234 "CURRENT_BMC_STATE", value);
Josh D. Kingd613b812016-12-19 16:47:45 -0600235
236 return server::BMC::currentBMCState(value);
237}
238
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800239BMC::RebootCause BMC::lastRebootCause(RebootCause value)
240{
Andrew Geissler8ffdb262021-09-20 15:25:19 -0500241 info("Setting the RebootCause field to {LAST_REBOOT_CAUSE}",
242 "LAST_REBOOT_CAUSE", value);
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800243
244 return server::BMC::lastRebootCause(value);
245}
246
Matt Spinlere6710b72018-07-12 16:05:55 -0500247uint64_t BMC::lastRebootTime() const
248{
249 using namespace std::chrono;
250 struct sysinfo info;
251
252 auto rc = sysinfo(&info);
253 assert(rc == 0);
254
255 // Since uptime is in seconds, also get the current time in seconds.
256 auto now = time_point_cast<seconds>(system_clock::now());
257 auto rebootTime = now - seconds(info.uptime);
258
259 return duration_cast<milliseconds>(rebootTime.time_since_epoch()).count();
260}
261
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800262void BMC::discoverLastRebootCause()
263{
264 uint64_t bootReason = 0;
265 std::ifstream file;
266 auto bootstatusPath = "/sys/class/watchdog/watchdog0/bootstatus";
267
268 file.exceptions(std::ifstream::failbit | std::ifstream::badbit |
269 std::ifstream::eofbit);
270
271 try
272 {
273 file.open(bootstatusPath);
274 file >> bootReason;
275 }
276 catch (const std::exception& e)
277 {
278 auto rc = errno;
Andrew Geissler8ffdb262021-09-20 15:25:19 -0500279 error("Failed to read sysfs file {FILE} with errno {ERRNO}", "FILE",
280 bootstatusPath, "ERRNO", rc);
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800281 }
282
283 switch (bootReason)
284 {
285 case WDIOF_EXTERN1:
286 this->lastRebootCause(RebootCause::Watchdog);
Andrew Geissler98e64e62022-01-25 16:02:56 -0600287 return;
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800288 case WDIOF_CARDRESET:
289 this->lastRebootCause(RebootCause::POR);
Andrew Geissler98e64e62022-01-25 16:02:56 -0600290 return;
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800291 default:
292 this->lastRebootCause(RebootCause::Unknown);
Andrew Geissler98e64e62022-01-25 16:02:56 -0600293 // Continue below to see if more details can be found
294 // on reason for reboot
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800295 break;
296 }
297
Andrew Geissler98e64e62022-01-25 16:02:56 -0600298 // If the above code could not detect a reason, look for a the
299 // reset-cause-pinhole gpio to see if it is the reason for the reboot
300 auto gpioval =
301 phosphor::state::manager::utils::getGpioValue("reset-cause-pinhole");
302
Andrew Geissler2e352a22022-03-02 11:31:40 -0600303 // A 0 indicates a pinhole reset occurred
304 if (0 == gpioval)
Andrew Geissler98e64e62022-01-25 16:02:56 -0600305 {
306 info("The BMC reset was caused by a pinhole reset");
307 this->lastRebootCause(RebootCause::PinholeReset);
Andrew Geisslera2a7e122022-01-26 13:30:18 -0600308
309 // Generate log telling user a pinhole reset has occurred
310 const std::string errorMsg = "xyz.openbmc_project.State.PinholeReset";
311 phosphor::state::manager::utils::createError(
312 this->bus, errorMsg,
313 sdbusplus::xyz::openbmc_project::Logging::server::Entry::Level::
314 Notice);
Andrew Geissler2038e492023-06-16 15:32:58 -0400315 return;
316 }
317
318 // If we still haven't found a reason, see if we lost AC power
319 // Note that a pinhole reset will remove AC power to the chassis
320 // on some systems so we always want to look for the pinhole reset
321 // first as that would be the main reason AC power was lost.
322 size_t chassisId = 0;
323 if (phosphor::state::manager::utils::checkACLoss(chassisId))
324 {
325 this->lastRebootCause(RebootCause::POR);
Andrew Geissler98e64e62022-01-25 16:02:56 -0600326 }
327
Tim Lee2bfb1ef2021-03-17 09:50:35 +0800328 return;
329}
330
Josh D. Kingbdd9cb72016-12-19 11:13:43 -0600331} // namespace manager
332} // namespace state
Andrew Geisslera965cf02018-08-31 08:37:05 -0700333} // namespace phosphor