blob: 26a4f39b237c553019bc2dfd53637232486cd17b [file] [log] [blame]
Vishwanatha Subbanna15b1dc12017-05-23 15:16:13 +05301/**
2 * Copyright © 2017 IBM Corporation
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
Vishwanatha Subbannad7a3f132017-05-29 19:39:08 +053017#include "watchdog.hpp"
Vishwanatha Subbanna15b1dc12017-05-23 15:16:13 +053018
William A. Kennington III1eb97d92018-09-13 00:36:12 -070019#include <CLI/CLI.hpp>
William A. Kennington III26eef262019-04-04 15:30:30 -070020#include <functional>
Patrick Venture8f6c5152018-09-11 17:45:33 -070021#include <iostream>
William A. Kennington III73c2cfb2018-09-12 18:01:37 -070022#include <optional>
Patrick Venture8f6c5152018-09-11 17:45:33 -070023#include <phosphor-logging/elog-errors.hpp>
24#include <phosphor-logging/elog.hpp>
25#include <phosphor-logging/log.hpp>
William A. Kennington III8d8bc462019-01-16 14:59:07 -080026#include <sdbusplus/bus.hpp>
27#include <sdbusplus/exception.hpp>
28#include <sdbusplus/server/manager.hpp>
29#include <sdeventplus/event.hpp>
William A. Kennington III658527b2021-12-19 20:43:22 -080030#include <sdeventplus/source/signal.hpp>
31#include <stdplus/signal.hpp>
Patrick Venture8f6c5152018-09-11 17:45:33 -070032#include <string>
33#include <xyz/openbmc_project/Common/error.hpp>
34
William A. Kennington III1232a152018-02-02 15:57:34 -080035using phosphor::watchdog::Watchdog;
William A. Kennington III93975262018-02-02 16:00:50 -080036using sdbusplus::xyz::openbmc_project::State::server::convertForMessage;
William A. Kennington III1232a152018-02-02 15:57:34 -080037
William A. Kennington III3bb2f402018-09-13 00:35:47 -070038void printActionTargetMap(const Watchdog::ActionTargetMap& actionTargetMap)
William A. Kennington III93975262018-02-02 16:00:50 -080039{
40 std::cerr << "Action Targets:\n";
William A. Kennington III3bb2f402018-09-13 00:35:47 -070041 for (const auto& [action, target] : actionTargetMap)
William A. Kennington III93975262018-02-02 16:00:50 -080042 {
William A. Kennington III3bb2f402018-09-13 00:35:47 -070043 std::cerr << " " << convertForMessage(action) << " -> " << target
44 << "\n";
William A. Kennington III93975262018-02-02 16:00:50 -080045 }
46 std::cerr << std::flush;
47}
48
William A. Kennington III1eb97d92018-09-13 00:36:12 -070049void printFallback(const Watchdog::Fallback& fallback)
50{
51 std::cerr << "Fallback Options:\n";
52 std::cerr << " Action: " << convertForMessage(fallback.action) << "\n";
53 std::cerr << " Interval(ms): " << std::dec << fallback.interval << "\n";
54 std::cerr << " Always re-execute: " << std::boolalpha << fallback.always
55 << "\n";
56 std::cerr << std::flush;
57}
58
William A. Kennington III3bb2f402018-09-13 00:35:47 -070059int main(int argc, char* argv[])
Vishwanatha Subbanna15b1dc12017-05-23 15:16:13 +053060{
Vishwanatha Subbanna7e146552017-05-29 17:03:33 +053061 using namespace phosphor::logging;
Patrick Venture8f6c5152018-09-11 17:45:33 -070062 using InternalFailure =
63 sdbusplus::xyz::openbmc_project::Common::Error::InternalFailure;
Vishwanatha Subbanna15b1dc12017-05-23 15:16:13 +053064
William A. Kennington III1eb97d92018-09-13 00:36:12 -070065 CLI::App app{"Canonical openbmc host watchdog daemon"};
Patrick Venture09eebe32017-08-11 15:23:17 -070066
William A. Kennington III1eb97d92018-09-13 00:36:12 -070067 // Service related options
68 const std::string serviceGroup = "Service Options";
69 std::string path;
70 app.add_option("-p,--path", path,
71 "DBus Object Path. "
72 "Ex: /xyz/openbmc_project/state/watchdog/host0")
73 ->required()
74 ->group(serviceGroup);
75 std::string service;
76 app.add_option("-s,--service", service,
77 "DBus Service Name. "
78 "Ex: xyz.openbmc_project.State.Watchdog.Host")
79 ->required()
80 ->group(serviceGroup);
Jae Hyun Yoo61bc6cd2021-07-01 14:48:41 -070081 bool continueAfterTimeout{false};
William A. Kennington III1eb97d92018-09-13 00:36:12 -070082 app.add_flag("-c,--continue", continueAfterTimeout,
83 "Continue daemon after watchdog timeout")
84 ->group(serviceGroup);
Vishwanatha Subbanna15b1dc12017-05-23 15:16:13 +053085
William A. Kennington III1eb97d92018-09-13 00:36:12 -070086 // Target related options
87 const std::string targetGroup = "Target Options";
88 std::optional<std::string> target;
89 app.add_option("-t,--target", target,
90 "Systemd unit to be called on "
91 "timeout for all actions but NONE. "
92 "Deprecated, use --action_target instead.")
93 ->group(targetGroup);
94 std::vector<std::string> actionTargets;
95 app.add_option("-a,--action_target", actionTargets,
96 "Map of action to "
97 "systemd unit to be called on timeout if that action is "
98 "set for ExpireAction when the timer expires.")
99 ->group(targetGroup);
Vishwanatha Subbanna15b1dc12017-05-23 15:16:13 +0530100
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700101 // Fallback related options
102 const std::string fallbackGroup = "Fallback Options";
103 std::optional<std::string> fallbackAction;
104 auto fallbackActionOpt =
105 app.add_option("-f,--fallback_action", fallbackAction,
106 "Enables the "
107 "watchdog even when disabled via the dbus interface. "
108 "Perform this action when the fallback expires.")
109 ->group(fallbackGroup);
110 std::optional<unsigned> fallbackIntervalMs;
111 auto fallbackIntervalOpt =
112 app.add_option("-i,--fallback_interval", fallbackIntervalMs,
113 "Enables the "
114 "watchdog even when disabled via the dbus interface. "
115 "Waits for this interval before performing the fallback "
116 "action.")
117 ->group(fallbackGroup);
118 fallbackIntervalOpt->needs(fallbackActionOpt);
119 fallbackActionOpt->needs(fallbackIntervalOpt);
Jae Hyun Yoo61bc6cd2021-07-01 14:48:41 -0700120 bool fallbackAlways{false};
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700121 app.add_flag("-e,--fallback_always", fallbackAlways,
122 "Enables the "
123 "watchdog even when disabled by the dbus interface. "
124 "This option is only valid with a fallback specified")
125 ->group(fallbackGroup)
126 ->needs(fallbackActionOpt)
127 ->needs(fallbackIntervalOpt);
128
William A. Kennington III26eef262019-04-04 15:30:30 -0700129 // Should we watch for postcodes
Jae Hyun Yoo61bc6cd2021-07-01 14:48:41 -0700130 bool watchPostcodes{false};
William A. Kennington III26eef262019-04-04 15:30:30 -0700131 app.add_flag("-w,--watch_postcodes", watchPostcodes,
132 "Should we reset the time remaining any time a postcode "
133 "is signaled.");
134
Andrew Geisslerafc369a2021-06-03 14:17:16 -0500135 // Interval related options
Ofer Yehiellic35135d2019-06-14 11:30:25 -0700136 uint64_t minInterval = phosphor::watchdog::DEFAULT_MIN_INTERVAL_MS;
Kun Yi08683752019-12-05 10:34:45 -0800137 app.add_option("-m,--min_interval", minInterval,
138 "Set minimum interval for watchdog in milliseconds");
Ofer Yehiellic35135d2019-06-14 11:30:25 -0700139
Andrew Geisslerafc369a2021-06-03 14:17:16 -0500140 // 0 to indicate to use default from PDI if not passed in
141 uint64_t defaultInterval = 0;
142 app.add_option("-d,--default_interval", defaultInterval,
143 "Set default interval for watchdog in milliseconds");
144
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700145 CLI11_PARSE(app, argc, argv);
146
147 // Put together a list of actions and associated systemd targets
148 // The new --action_target options take precedence over the legacy
149 // --target
William A. Kennington III3bb2f402018-09-13 00:35:47 -0700150 Watchdog::ActionTargetMap actionTargetMap;
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700151 if (target)
Patrick Venture8f6c5152018-09-11 17:45:33 -0700152 {
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700153 actionTargetMap[Watchdog::Action::HardReset] = *target;
154 actionTargetMap[Watchdog::Action::PowerOff] = *target;
155 actionTargetMap[Watchdog::Action::PowerCycle] = *target;
William A. Kennington III1232a152018-02-02 15:57:34 -0800156 }
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700157 for (const auto& actionTarget : actionTargets)
William A. Kennington III27df4b52018-02-02 16:02:05 -0800158 {
159 size_t keyValueSplit = actionTarget.find("=");
160 if (keyValueSplit == std::string::npos)
161 {
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700162 std::cerr << "Invalid action_target format, "
163 "expect <action>=<target>."
164 << std::endl;
165 return 1;
William A. Kennington III27df4b52018-02-02 16:02:05 -0800166 }
167
168 std::string key = actionTarget.substr(0, keyValueSplit);
Patrick Venture8f6c5152018-09-11 17:45:33 -0700169 std::string value = actionTarget.substr(keyValueSplit + 1);
William A. Kennington III27df4b52018-02-02 16:02:05 -0800170
171 // Convert an action from a fully namespaced value
172 Watchdog::Action action;
173 try
174 {
175 action = Watchdog::convertActionFromString(key);
176 }
Patrick Venture8f6c5152018-09-11 17:45:33 -0700177 catch (const sdbusplus::exception::InvalidEnumString&)
William A. Kennington III27df4b52018-02-02 16:02:05 -0800178 {
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700179 std::cerr << "Bad action specified: " << key << std::endl;
180 return 1;
William A. Kennington III27df4b52018-02-02 16:02:05 -0800181 }
182
William A. Kennington IIIc2c26ce2018-09-13 18:35:56 -0700183 // Detect duplicate action target arguments
184 if (actionTargetMap.find(action) != actionTargetMap.end())
185 {
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700186 std::cerr << "Got duplicate action: " << key << std::endl;
187 return 1;
William A. Kennington IIIc2c26ce2018-09-13 18:35:56 -0700188 }
189
William A. Kennington III3bb2f402018-09-13 00:35:47 -0700190 actionTargetMap[action] = std::move(value);
William A. Kennington III27df4b52018-02-02 16:02:05 -0800191 }
William A. Kennington III3bb2f402018-09-13 00:35:47 -0700192 printActionTargetMap(actionTargetMap);
William A. Kennington III93975262018-02-02 16:00:50 -0800193
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700194 // Build the fallback option used for the Watchdog
195 std::optional<Watchdog::Fallback> maybeFallback;
196 if (fallbackAction)
William A. Kennington IIId1331082018-02-27 18:47:05 -0800197 {
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700198 Watchdog::Fallback fallback;
William A. Kennington IIId1331082018-02-27 18:47:05 -0800199 try
200 {
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700201 fallback.action =
202 Watchdog::convertActionFromString(*fallbackAction);
William A. Kennington IIId1331082018-02-27 18:47:05 -0800203 }
Patrick Venture8f6c5152018-09-11 17:45:33 -0700204 catch (const sdbusplus::exception::InvalidEnumString&)
William A. Kennington IIId1331082018-02-27 18:47:05 -0800205 {
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700206 std::cerr << "Bad fallback action specified: " << *fallbackAction
207 << std::endl;
208 return 1;
William A. Kennington IIId1331082018-02-27 18:47:05 -0800209 }
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700210 fallback.interval = *fallbackIntervalMs;
211 fallback.always = fallbackAlways;
William A. Kennington IIId1331082018-02-27 18:47:05 -0800212
William A. Kennington III1eb97d92018-09-13 00:36:12 -0700213 printFallback(fallback);
Willy Tucf4ce3c2021-12-09 20:39:37 -0800214 maybeFallback = fallback;
William A. Kennington III22352192018-02-27 18:51:44 -0800215 }
216
Vishwanatha Subbanna4d5ef3f2017-05-31 18:54:22 +0530217 try
Vishwanatha Subbanna7e146552017-05-29 17:03:33 +0530218 {
William A. Kennington IIIf505fc02018-09-12 18:30:09 -0700219 // Get a default event loop
220 auto event = sdeventplus::Event::get_default();
221
222 // Get a handle to system dbus.
223 auto bus = sdbusplus::bus::new_default();
224
225 // Add systemd object manager.
Willy Tucf4ce3c2021-12-09 20:39:37 -0800226 sdbusplus::server::manager::manager watchdogManager(bus, path.c_str());
William A. Kennington IIIf505fc02018-09-12 18:30:09 -0700227
228 // Attach the bus to sd_event to service user requests
229 bus.attach_event(event.get(), SD_EVENT_PRIORITY_NORMAL);
230
Vishwanatha Subbanna4d5ef3f2017-05-31 18:54:22 +0530231 // Create a watchdog object
William A. Kennington IIIf505fc02018-09-12 18:30:09 -0700232 Watchdog watchdog(bus, path.c_str(), event, std::move(actionTargetMap),
Andrew Geisslerafc369a2021-06-03 14:17:16 -0500233 std::move(maybeFallback), minInterval,
234 defaultInterval);
William A. Kennington IIId1331082018-02-27 18:47:05 -0800235
William A. Kennington III26eef262019-04-04 15:30:30 -0700236 std::optional<sdbusplus::bus::match::match> watchPostcodeMatch;
237 if (watchPostcodes)
238 {
239 watchPostcodeMatch.emplace(
240 bus,
241 sdbusplus::bus::match::rules::propertiesChanged(
William A. Kennington III459b6c72021-05-12 12:02:48 -0700242 "/xyz/openbmc_project/state/boot/raw0",
William A. Kennington III26eef262019-04-04 15:30:30 -0700243 "xyz.openbmc_project.State.Boot.Raw"),
244 std::bind(&Watchdog::resetTimeRemaining, std::ref(watchdog),
245 false));
246 }
247
Vishwanatha Subbanna4d5ef3f2017-05-31 18:54:22 +0530248 // Claim the bus
249 bus.request_name(service.c_str());
250
William A. Kennington III658527b2021-12-19 20:43:22 -0800251 bool done = false;
252 auto intCb = [&](sdeventplus::source::Signal&,
253 const struct signalfd_siginfo*) { done = true; };
254 stdplus::signal::block(SIGINT);
255 sdeventplus::source::Signal sigint(event, SIGINT, intCb);
256 stdplus::signal::block(SIGTERM);
257 sdeventplus::source::Signal sigterm(event, SIGTERM, std::move(intCb));
258
William A. Kennington III825f4982018-02-27 19:10:56 -0800259 // Loop until our timer expires and we don't want to continue
William A. Kennington III658527b2021-12-19 20:43:22 -0800260 while (!done && (continueAfterTimeout || !watchdog.timerExpired()))
Vishwanatha Subbanna7e146552017-05-29 17:03:33 +0530261 {
William A. Kennington IIIf505fc02018-09-12 18:30:09 -0700262 // Run and never timeout
263 event.run(std::nullopt);
Vishwanatha Subbanna7e146552017-05-29 17:03:33 +0530264 }
265 }
Patrick Williams120bc4c2021-10-06 14:41:25 -0500266 catch (const InternalFailure& e)
Vishwanatha Subbanna4d5ef3f2017-05-31 18:54:22 +0530267 {
268 phosphor::logging::commit<InternalFailure>();
269
270 // Need a coredump in the error cases.
271 std::terminate();
272 }
Vishwanatha Subbanna15b1dc12017-05-23 15:16:13 +0530273 return 0;
274}