| #include "config.h" |
| |
| #include "host_state_manager.hpp" |
| |
| #include "host_check.hpp" |
| |
| #include <fmt/format.h> |
| #include <stdio.h> |
| #include <systemd/sd-bus.h> |
| |
| #include <cereal/archives/json.hpp> |
| #include <cereal/cereal.hpp> |
| #include <cereal/types/string.hpp> |
| #include <cereal/types/tuple.hpp> |
| #include <cereal/types/vector.hpp> |
| #include <phosphor-logging/elog-errors.hpp> |
| #include <phosphor-logging/log.hpp> |
| #include <sdbusplus/exception.hpp> |
| #include <sdbusplus/server.hpp> |
| #include <xyz/openbmc_project/Common/error.hpp> |
| #include <xyz/openbmc_project/Control/Power/RestorePolicy/server.hpp> |
| |
| #include <filesystem> |
| #include <fstream> |
| #include <iostream> |
| #include <map> |
| #include <string> |
| |
| // Register class version with Cereal |
| CEREAL_CLASS_VERSION(phosphor::state::manager::Host, CLASS_VERSION) |
| |
| namespace phosphor |
| { |
| namespace state |
| { |
| namespace manager |
| { |
| |
| // When you see server:: or reboot:: you know we're referencing our base class |
| namespace server = sdbusplus::xyz::openbmc_project::State::server; |
| namespace reboot = sdbusplus::xyz::openbmc_project::Control::Boot::server; |
| namespace bootprogress = sdbusplus::xyz::openbmc_project::State::Boot::server; |
| namespace osstatus = |
| sdbusplus::xyz::openbmc_project::State::OperatingSystem::server; |
| using namespace phosphor::logging; |
| namespace fs = std::experimental::filesystem; |
| using sdbusplus::xyz::openbmc_project::Common::Error::InternalFailure; |
| |
| // host-shutdown notifies host of shutdown and that leads to host-stop being |
| // called so initiate a host shutdown with the -shutdown target and consider the |
| // host shut down when the -stop target is complete |
| constexpr auto HOST_STATE_SOFT_POWEROFF_TGT = "obmc-host-shutdown@0.target"; |
| constexpr auto HOST_STATE_POWEROFF_TGT = "obmc-host-stop@0.target"; |
| constexpr auto HOST_STATE_POWERON_TGT = "obmc-host-start@0.target"; |
| constexpr auto HOST_STATE_POWERON_MIN_TGT = "obmc-host-startmin@0.target"; |
| constexpr auto HOST_STATE_REBOOT_TGT = "obmc-host-reboot@0.target"; |
| constexpr auto HOST_STATE_WARM_REBOOT = "obmc-host-warm-reboot@0.target"; |
| constexpr auto HOST_STATE_FORCE_WARM_REBOOT = |
| "obmc-host-force-warm-reboot@0.target"; |
| constexpr auto HOST_STATE_DIAGNOSTIC_MODE = |
| "obmc-host-diagnostic-mode@0.target"; |
| |
| constexpr auto HOST_STATE_QUIESCE_TGT = "obmc-host-quiesce@0.target"; |
| |
| constexpr auto ACTIVE_STATE = "active"; |
| constexpr auto ACTIVATING_STATE = "activating"; |
| |
| /* Map a transition to it's systemd target */ |
| const std::map<server::Host::Transition, std::string> SYSTEMD_TARGET_TABLE = { |
| {server::Host::Transition::Off, HOST_STATE_SOFT_POWEROFF_TGT}, |
| {server::Host::Transition::On, HOST_STATE_POWERON_TGT}, |
| {server::Host::Transition::Reboot, HOST_STATE_REBOOT_TGT}, |
| // Some systems do not support a warm reboot so just map the reboot |
| // requests to our normal cold reboot in that case |
| #if ENABLE_WARM_REBOOT |
| {server::Host::Transition::GracefulWarmReboot, HOST_STATE_WARM_REBOOT}, |
| {server::Host::Transition::ForceWarmReboot, HOST_STATE_FORCE_WARM_REBOOT}}; |
| #else |
| {server::Host::Transition::GracefulWarmReboot, HOST_STATE_REBOOT_TGT}, |
| {server::Host::Transition::ForceWarmReboot, HOST_STATE_REBOOT_TGT}}; |
| #endif |
| |
| constexpr auto SYSTEMD_SERVICE = "org.freedesktop.systemd1"; |
| constexpr auto SYSTEMD_OBJ_PATH = "/org/freedesktop/systemd1"; |
| constexpr auto SYSTEMD_INTERFACE = "org.freedesktop.systemd1.Manager"; |
| |
| constexpr auto SYSTEMD_PROPERTY_IFACE = "org.freedesktop.DBus.Properties"; |
| constexpr auto SYSTEMD_INTERFACE_UNIT = "org.freedesktop.systemd1.Unit"; |
| |
| void Host::subscribeToSystemdSignals() |
| { |
| auto method = this->bus.new_method_call(SYSTEMD_SERVICE, SYSTEMD_OBJ_PATH, |
| SYSTEMD_INTERFACE, "Subscribe"); |
| try |
| { |
| this->bus.call_noreply(method); |
| } |
| catch (const sdbusplus::exception::exception& e) |
| { |
| log<level::ERR>("Failed to subscribe to systemd signals", |
| entry("ERR=%s", e.what())); |
| elog<InternalFailure>(); |
| } |
| return; |
| } |
| |
| void Host::determineInitialState() |
| { |
| |
| if (stateActive(HOST_STATE_POWERON_MIN_TGT) || isHostRunning()) |
| { |
| log<level::INFO>("Initial Host State will be Running", |
| entry("CURRENT_HOST_STATE=%s", |
| convertForMessage(HostState::Running).c_str())); |
| server::Host::currentHostState(HostState::Running); |
| server::Host::requestedHostTransition(Transition::On); |
| } |
| else |
| { |
| log<level::INFO>("Initial Host State will be Off", |
| entry("CURRENT_HOST_STATE=%s", |
| convertForMessage(HostState::Off).c_str())); |
| server::Host::currentHostState(HostState::Off); |
| server::Host::requestedHostTransition(Transition::Off); |
| } |
| |
| if (!deserialize(HOST_STATE_PERSIST_PATH)) |
| { |
| // set to default value. |
| server::Host::requestedHostTransition(Transition::Off); |
| } |
| |
| return; |
| } |
| |
| void Host::executeTransition(Transition tranReq) |
| { |
| auto sysdUnit = SYSTEMD_TARGET_TABLE.find(tranReq)->second; |
| |
| auto method = this->bus.new_method_call(SYSTEMD_SERVICE, SYSTEMD_OBJ_PATH, |
| SYSTEMD_INTERFACE, "StartUnit"); |
| |
| method.append(sysdUnit); |
| method.append("replace"); |
| |
| this->bus.call_noreply(method); |
| |
| return; |
| } |
| |
| bool Host::stateActive(const std::string& target) |
| { |
| std::variant<std::string> currentState; |
| sdbusplus::message::object_path unitTargetPath; |
| |
| auto method = this->bus.new_method_call(SYSTEMD_SERVICE, SYSTEMD_OBJ_PATH, |
| SYSTEMD_INTERFACE, "GetUnit"); |
| |
| method.append(target); |
| |
| try |
| { |
| auto result = this->bus.call(method); |
| result.read(unitTargetPath); |
| } |
| catch (const sdbusplus::exception::exception& e) |
| { |
| log<level::ERR>("Error in GetUnit call", entry("ERROR=%s", e.what())); |
| return false; |
| } |
| |
| method = this->bus.new_method_call( |
| SYSTEMD_SERVICE, |
| static_cast<const std::string&>(unitTargetPath).c_str(), |
| SYSTEMD_PROPERTY_IFACE, "Get"); |
| |
| method.append(SYSTEMD_INTERFACE_UNIT, "ActiveState"); |
| |
| try |
| { |
| auto result = this->bus.call(method); |
| result.read(currentState); |
| } |
| catch (const sdbusplus::exception::exception& e) |
| { |
| log<level::ERR>("Error in ActiveState Get", |
| entry("ERROR=%s", e.what())); |
| return false; |
| } |
| |
| const auto& currentStateStr = std::get<std::string>(currentState); |
| return currentStateStr == ACTIVE_STATE || |
| currentStateStr == ACTIVATING_STATE; |
| } |
| |
| bool Host::isAutoReboot() |
| { |
| using namespace settings; |
| |
| /* The logic here is to first check the one-time AutoReboot setting. |
| * If this property is true (the default) then look at the persistent |
| * user setting in the non one-time object, otherwise honor the one-time |
| * setting and do not auto reboot. |
| */ |
| auto methodOneTime = bus.new_method_call( |
| settings.service(settings.autoReboot, autoRebootIntf).c_str(), |
| settings.autoRebootOneTime.c_str(), SYSTEMD_PROPERTY_IFACE, "Get"); |
| methodOneTime.append(autoRebootIntf, "AutoReboot"); |
| |
| auto methodUserSetting = bus.new_method_call( |
| settings.service(settings.autoReboot, autoRebootIntf).c_str(), |
| settings.autoReboot.c_str(), SYSTEMD_PROPERTY_IFACE, "Get"); |
| methodUserSetting.append(autoRebootIntf, "AutoReboot"); |
| |
| try |
| { |
| auto reply = bus.call(methodOneTime); |
| std::variant<bool> result; |
| reply.read(result); |
| auto autoReboot = std::get<bool>(result); |
| |
| if (!autoReboot) |
| { |
| log<level::INFO>("Auto reboot (one-time) disabled"); |
| return false; |
| } |
| else |
| { |
| // one-time is true so read the user setting |
| reply = bus.call(methodUserSetting); |
| reply.read(result); |
| autoReboot = std::get<bool>(result); |
| } |
| |
| auto rebootCounterParam = reboot::RebootAttempts::attemptsLeft(); |
| |
| if (autoReboot) |
| { |
| if (rebootCounterParam > 0) |
| { |
| // Reduce BOOTCOUNT by 1 |
| log<level::INFO>("Auto reboot enabled, rebooting"); |
| return true; |
| } |
| else if (rebootCounterParam == 0) |
| { |
| // Reset reboot counter and go to quiesce state |
| log<level::INFO>("Auto reboot enabled. " |
| "HOST BOOTCOUNT already set to 0."); |
| attemptsLeft(BOOT_COUNT_MAX_ALLOWED); |
| return false; |
| } |
| else |
| { |
| log<level::INFO>("Auto reboot enabled. " |
| "HOST BOOTCOUNT has an invalid value."); |
| return false; |
| } |
| } |
| else |
| { |
| log<level::INFO>("Auto reboot disabled."); |
| return false; |
| } |
| } |
| catch (const sdbusplus::exception::exception& e) |
| { |
| log<level::ERR>("Error in AutoReboot Get", entry("ERROR=%s", e.what())); |
| return false; |
| } |
| } |
| |
| void Host::sysStateChangeJobRemoved(sdbusplus::message::message& msg) |
| { |
| uint32_t newStateID{}; |
| sdbusplus::message::object_path newStateObjPath; |
| std::string newStateUnit{}; |
| std::string newStateResult{}; |
| |
| // Read the msg and populate each variable |
| msg.read(newStateID, newStateObjPath, newStateUnit, newStateResult); |
| |
| if ((newStateUnit == HOST_STATE_POWEROFF_TGT) && |
| (newStateResult == "done") && |
| (!stateActive(HOST_STATE_POWERON_MIN_TGT))) |
| { |
| log<level::INFO>("Received signal that host is off"); |
| this->currentHostState(server::Host::HostState::Off); |
| this->bootProgress(bootprogress::Progress::ProgressStages::Unspecified); |
| this->operatingSystemState(osstatus::Status::OSStatus::Inactive); |
| } |
| else if ((newStateUnit == HOST_STATE_POWERON_MIN_TGT) && |
| (newStateResult == "done") && |
| (stateActive(HOST_STATE_POWERON_MIN_TGT))) |
| { |
| log<level::INFO>("Received signal that host is running"); |
| this->currentHostState(server::Host::HostState::Running); |
| |
| // Remove temporary file which is utilized for scenarios where the |
| // BMC is rebooted while the host is still up. |
| // This file is used to indicate to host related systemd services |
| // that the host is already running and they should skip running. |
| // Once the host state is back to running we can clear this file. |
| auto size = std::snprintf(nullptr, 0, HOST_RUNNING_FILE, 0); |
| size++; // null |
| std::unique_ptr<char[]> hostFile(new char[size]); |
| std::snprintf(hostFile.get(), size, HOST_RUNNING_FILE, 0); |
| if (std::filesystem::exists(hostFile.get())) |
| { |
| std::filesystem::remove(hostFile.get()); |
| } |
| } |
| else if ((newStateUnit == HOST_STATE_QUIESCE_TGT) && |
| (newStateResult == "done") && |
| (stateActive(HOST_STATE_QUIESCE_TGT))) |
| { |
| if (Host::isAutoReboot()) |
| { |
| log<level::INFO>("Beginning reboot..."); |
| Host::requestedHostTransition(server::Host::Transition::Reboot); |
| } |
| else |
| { |
| log<level::INFO>("Maintaining quiesce"); |
| this->currentHostState(server::Host::HostState::Quiesced); |
| } |
| } |
| } |
| |
| void Host::sysStateChangeJobNew(sdbusplus::message::message& msg) |
| { |
| uint32_t newStateID{}; |
| sdbusplus::message::object_path newStateObjPath; |
| std::string newStateUnit{}; |
| |
| // Read the msg and populate each variable |
| msg.read(newStateID, newStateObjPath, newStateUnit); |
| |
| if (newStateUnit == HOST_STATE_DIAGNOSTIC_MODE) |
| { |
| log<level::INFO>("Received signal that host is in diagnostice mode"); |
| this->currentHostState(server::Host::HostState::DiagnosticMode); |
| } |
| } |
| |
| uint32_t Host::decrementRebootCount() |
| { |
| auto rebootCount = reboot::RebootAttempts::attemptsLeft(); |
| if (rebootCount > 0) |
| { |
| return (reboot::RebootAttempts::attemptsLeft(rebootCount - 1)); |
| } |
| return rebootCount; |
| } |
| |
| fs::path Host::serialize(const fs::path& dir) |
| { |
| std::ofstream os(dir.c_str(), std::ios::binary); |
| cereal::JSONOutputArchive oarchive(os); |
| oarchive(*this); |
| return dir; |
| } |
| |
| bool Host::deserialize(const fs::path& path) |
| { |
| try |
| { |
| if (fs::exists(path)) |
| { |
| std::ifstream is(path.c_str(), std::ios::in | std::ios::binary); |
| cereal::JSONInputArchive iarchive(is); |
| iarchive(*this); |
| return true; |
| } |
| return false; |
| } |
| catch (cereal::Exception& e) |
| { |
| log<level::ERR>(e.what()); |
| fs::remove(path); |
| return false; |
| } |
| } |
| |
| Host::Transition Host::requestedHostTransition(Transition value) |
| { |
| log<level::INFO>(fmt::format("Host state transition request of {}", |
| convertForMessage(value)) |
| .c_str()); |
| // If this is not a power off request then we need to |
| // decrement the reboot counter. This code should |
| // never prevent a power on, it should just decrement |
| // the count to 0. The quiesce handling is where the |
| // check of this count will occur |
| if (value != server::Host::Transition::Off) |
| { |
| decrementRebootCount(); |
| } |
| |
| executeTransition(value); |
| |
| auto retVal = server::Host::requestedHostTransition(value); |
| serialize(); |
| return retVal; |
| } |
| |
| Host::ProgressStages Host::bootProgress(ProgressStages value) |
| { |
| auto retVal = bootprogress::Progress::bootProgress(value); |
| serialize(); |
| return retVal; |
| } |
| |
| Host::OSStatus Host::operatingSystemState(OSStatus value) |
| { |
| auto retVal = osstatus::Status::operatingSystemState(value); |
| serialize(); |
| return retVal; |
| } |
| |
| Host::HostState Host::currentHostState(HostState value) |
| { |
| log<level::INFO>( |
| fmt::format("Change to Host State: {}", convertForMessage(value)) |
| .c_str()); |
| return server::Host::currentHostState(value); |
| } |
| |
| } // namespace manager |
| } // namespace state |
| } // namespace phosphor |