blob: c92412343ba6c927a808478f48ca33b5766704b2 [file] [log] [blame]
Alexander Hansen46a755f2025-10-27 16:31:08 +01001// SPDX-License-Identifier: Apache-2.0
2// SPDX-FileCopyrightText: Copyright 2017 Google Inc
3
Pete O_o765a6d82025-07-23 21:44:14 -07004#include "config.h"
Patrick Venturee6206562018-03-08 15:36:53 -08005
Harvey Wu3dcfd542022-10-31 17:11:02 +08006#include "buildjson/buildjson.hpp"
Patrick Ventureda4a5dd2018-08-31 09:42:48 -07007#include "conf.hpp"
Patrick Venture7f9d6902020-09-10 12:09:57 -07008#include "dbus/dbusconfiguration.hpp"
James Zheng6df8bb52024-11-27 23:38:47 +00009#include "failsafeloggers/builder.hpp"
Potin Laie1fa8592025-08-29 15:27:08 +080010#include "hoststatemonitor.hpp"
Patrick Venture5c7cc542018-06-11 14:29:38 -070011#include "pid/builder.hpp"
Patrick Ventureba8ffa72019-02-11 12:03:56 -080012#include "pid/buildjson.hpp"
James Feistce6a3f32019-03-12 11:20:16 -070013#include "pid/pidloop.hpp"
Patrick Venturec32e3fc2019-02-28 10:01:11 -080014#include "pid/tuning.hpp"
Patrick Venture5e929092018-06-08 10:55:23 -070015#include "sensors/builder.hpp"
Patrick Ventureba8ffa72019-02-11 12:03:56 -080016#include "sensors/buildjson.hpp"
Patrick Venturee6206562018-03-08 15:36:53 -080017#include "sensors/manager.hpp"
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070018#include "util.hpp"
Ed Tanousf8b6e552025-06-27 13:27:50 -070019#include "zone_interface.hpp"
20
21#include <signal.h>
Patrick Venturee6206562018-03-08 15:36:53 -080022
Patrick Ventureb5cc37c2019-03-11 09:11:55 -070023#include <CLI/CLI.hpp>
Ed Tanousf8b6e552025-06-27 13:27:50 -070024#include <boost/asio/error.hpp>
James Feistce6a3f32019-03-12 11:20:16 -070025#include <boost/asio/io_context.hpp>
Ed Tanousf8b6e552025-06-27 13:27:50 -070026#include <boost/asio/post.hpp>
Potin Laie2ec69a2022-09-30 17:09:34 +080027#include <boost/asio/signal_set.hpp>
James Feistce6a3f32019-03-12 11:20:16 -070028#include <boost/asio/steady_timer.hpp>
Patrick Venturea83a3ec2020-08-04 09:52:05 -070029#include <sdbusplus/asio/connection.hpp>
30#include <sdbusplus/bus.hpp>
Bruce Leecb4c1a22021-04-20 16:06:38 +080031#include <sdbusplus/server/manager.hpp>
Patrick Venturea83a3ec2020-08-04 09:52:05 -070032
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070033#include <chrono>
Ed Tanousf8b6e552025-06-27 13:27:50 -070034#include <csignal>
35#include <cstdint>
36#include <cstdlib>
37#include <exception>
Patrick Venture7f9d6902020-09-10 12:09:57 -070038#include <filesystem>
Ed Tanousf8b6e552025-06-27 13:27:50 -070039#include <fstream>
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070040#include <iostream>
41#include <map>
42#include <memory>
Patrick Williamse3c60772025-04-07 17:53:42 -040043#include <optional>
Ed Tanousf8b6e552025-06-27 13:27:50 -070044#include <stdexcept>
45#include <string>
46#include <tuple>
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070047#include <unordered_map>
Patrick Ventureba8ffa72019-02-11 12:03:56 -080048#include <utility>
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070049#include <vector>
Patrick Venturee6206562018-03-08 15:36:53 -080050
Patrick Venturea0764872020-08-08 07:48:43 -070051namespace pid_control
52{
53
James Feist1fe08952019-05-07 09:17:16 -070054/* The configuration converted sensor list. */
Patrick Venture1df9e872020-10-08 15:35:01 -070055std::map<std::string, conf::SensorConfig> sensorConfig = {};
James Feist1fe08952019-05-07 09:17:16 -070056/* The configuration converted PID list. */
James Feistf81f2882019-02-26 11:26:36 -080057std::map<int64_t, conf::PIDConf> zoneConfig = {};
James Feist1fe08952019-05-07 09:17:16 -070058/* The configuration converted Zone configuration. */
Patrick Venture1df9e872020-10-08 15:35:01 -070059std::map<int64_t, conf::ZoneConfig> zoneDetailsConfig = {};
Patrick Venturee6206562018-03-08 15:36:53 -080060
Patrick Rudolphc7b2be32023-10-13 12:34:58 +020061namespace state
62{
63/* Set to true while canceling is in progress */
64static bool isCanceling = false;
65/* The zones build from configuration */
66static std::unordered_map<int64_t, std::shared_ptr<ZoneInterface>> zones;
67/* The timers used by the PID loop */
68static std::vector<std::shared_ptr<boost::asio::steady_timer>> timers;
69/* The sensors build from configuration */
Patrick Williamse3c60772025-04-07 17:53:42 -040070static std::optional<SensorManager> mgmr;
Patrick Rudolphc7b2be32023-10-13 12:34:58 +020071} // namespace state
72
Patrick Venturea0764872020-08-08 07:48:43 -070073} // namespace pid_control
74
Potin Lai79cde002023-02-16 13:53:10 +080075std::filesystem::path configPath = "";
Patrick Venturec19f5d42019-02-14 10:59:47 -080076
James Feist1fe08952019-05-07 09:17:16 -070077/* async io context for operation */
78boost::asio::io_context io;
Potin Laie2ec69a2022-09-30 17:09:34 +080079/* async signal_set for signal handling */
Patrick Rudolphc7b2be32023-10-13 12:34:58 +020080boost::asio::signal_set signals(io, SIGHUP, SIGTERM);
James Feist1fe08952019-05-07 09:17:16 -070081
82/* buses for system control */
83static sdbusplus::asio::connection modeControlBus(io);
Patrick Williams7dea66c2025-04-07 14:23:50 -040084static sdbusplus::asio::connection hostBus(io, sdbusplus::bus::new_bus());
85static sdbusplus::asio::connection passiveBus(io, sdbusplus::bus::new_bus());
Potin Laie1fa8592025-08-29 15:27:08 +080086static sdbusplus::asio::connection hostMatchBus(io, sdbusplus::bus::new_bus());
James Feist1fe08952019-05-07 09:17:16 -070087
Patrick Venturea0764872020-08-08 07:48:43 -070088namespace pid_control
89{
90
Potin Lai79cde002023-02-16 13:53:10 +080091std::filesystem::path searchConfigurationPath()
92{
93 static constexpr auto name = "config.json";
94
Ed Tanousd2768c52025-06-26 11:42:57 -070095 for (const auto& pathSeg : {std::filesystem::current_path(),
96 std::filesystem::path{"/var/lib/swampd"},
97 std::filesystem::path{"/usr/share/swampd"}})
Potin Lai79cde002023-02-16 13:53:10 +080098 {
99 auto file = pathSeg / name;
100 if (std::filesystem::exists(file))
101 {
102 return file;
103 }
104 }
105
106 return name;
107}
108
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200109void stopControlLoops()
Patrick Venturee6206562018-03-08 15:36:53 -0800110{
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200111 for (const auto& timer : state::timers)
Johnathan Mantey5301aae2020-09-28 11:06:58 -0700112 {
113 timer->cancel();
114 }
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200115 state::isCanceling = true;
116 state::timers.clear();
Hao Jiangb228cea2021-02-20 11:53:09 -0800117
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200118 if (state::zones.size() > 0 && state::zones.begin()->second.use_count() > 1)
Hao Jiangb228cea2021-02-20 11:53:09 -0800119 {
120 throw std::runtime_error("wait for count back to 1");
121 }
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200122
123 state::zones.clear();
124 state::isCanceling = false;
125}
126
127void restartControlLoops()
128{
129 stopControlLoops();
Patrick Venture4cb7c052019-02-14 11:11:33 -0800130
Potin Lai79cde002023-02-16 13:53:10 +0800131 const std::filesystem::path path =
132 (!configPath.empty()) ? configPath : searchConfigurationPath();
Patrick Venturee6206562018-03-08 15:36:53 -0800133
Patrick Venture7f9d6902020-09-10 12:09:57 -0700134 if (std::filesystem::exists(path))
Patrick Venturee6206562018-03-08 15:36:53 -0800135 {
Patrick Venture7f9d6902020-09-10 12:09:57 -0700136 /*
137 * When building the sensors, if any of the dbus passive ones aren't on
138 * the bus, it'll fail immediately.
139 */
140 try
141 {
142 auto jsonData = parseValidateJson(path);
143 sensorConfig = buildSensorsFromJson(jsonData);
Patrick Williamsbd63bca2024-08-16 15:21:10 -0400144 std::tie(zoneConfig, zoneDetailsConfig) =
145 buildPIDsFromJson(jsonData);
Patrick Venture7f9d6902020-09-10 12:09:57 -0700146 }
147 catch (const std::exception& e)
148 {
149 std::cerr << "Failed during building: " << e.what() << "\n";
150 exit(EXIT_FAILURE); /* fatal error. */
151 }
Patrick Venturee6206562018-03-08 15:36:53 -0800152 }
Patrick Venture7f9d6902020-09-10 12:09:57 -0700153 else
Patrick Venture18b13112019-02-14 11:43:59 -0800154 {
Patrick Venture7f9d6902020-09-10 12:09:57 -0700155 static boost::asio::steady_timer reloadTimer(io);
Patrick Venture73823182020-10-08 15:12:51 -0700156 if (!dbus_configuration::init(modeControlBus, reloadTimer, sensorConfig,
157 zoneConfig, zoneDetailsConfig))
Patrick Venture7f9d6902020-09-10 12:09:57 -0700158 {
159 return; // configuration not ready
160 }
Patrick Venture18b13112019-02-14 11:43:59 -0800161 }
Patrick Venture4cb7c052019-02-14 11:11:33 -0800162
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200163 state::mgmr = buildSensors(sensorConfig, passiveBus, hostBus);
Patrick Williamsbd63bca2024-08-16 15:21:10 -0400164 state::zones =
Patrick Williamse3c60772025-04-07 17:53:42 -0400165 buildZones(zoneConfig, zoneDetailsConfig, *state::mgmr, modeControlBus);
James Zheng6df8bb52024-11-27 23:38:47 +0000166 // Set `logMaxCountPerSecond` to 20 will limit the number of logs output per
167 // second in each zone. Using 20 here would limit the output rate to be no
168 // larger than 100 per sec for most platforms as the number of zones are
169 // usually <=3. This will effectively avoid resource exhaustion.
170 buildFailsafeLoggers(state::zones, /* logMaxCountPerSecond = */ 20);
Patrick Venturee6206562018-03-08 15:36:53 -0800171
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200172 if (0 == state::zones.size())
Patrick Venturee6206562018-03-08 15:36:53 -0800173 {
174 std::cerr << "No zones defined, exiting.\n";
James Feist1fe08952019-05-07 09:17:16 -0700175 std::exit(EXIT_FAILURE);
Patrick Venturee6206562018-03-08 15:36:53 -0800176 }
177
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200178 for (const auto& i : state::zones)
James Feist1fe08952019-05-07 09:17:16 -0700179 {
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200180 std::shared_ptr<boost::asio::steady_timer> timer =
181 state::timers.emplace_back(
182 std::make_shared<boost::asio::steady_timer>(io));
James Feist1fe08952019-05-07 09:17:16 -0700183 std::cerr << "pushing zone " << i.first << "\n";
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200184 pidControlLoop(i.second, timer, &state::isCanceling);
James Feist1fe08952019-05-07 09:17:16 -0700185 }
186}
187
Hao Jiangb228cea2021-02-20 11:53:09 -0800188void tryRestartControlLoops(bool first)
Yong Li298a95c2020-04-07 15:11:02 +0800189{
Hao Jiangd11a7322021-03-24 11:25:57 -0700190 static const auto delayTime = std::chrono::seconds(10);
Hao Jiangb228cea2021-02-20 11:53:09 -0800191 static boost::asio::steady_timer timer(io);
Hao Jiangd11a7322021-03-24 11:25:57 -0700192
193 auto restartLbd = [](const boost::system::error_code& error) {
Hao Jiang232ffe42021-02-21 20:11:49 -0800194 if (error == boost::asio::error::operation_aborted)
195 {
196 return;
197 }
Hao Jiangb228cea2021-02-20 11:53:09 -0800198
Hao Jiang232ffe42021-02-21 20:11:49 -0800199 // retry when restartControlLoops() has some failure.
200 try
201 {
202 restartControlLoops();
Hao Jiang232ffe42021-02-21 20:11:49 -0800203 }
204 catch (const std::exception& e)
205 {
Zev Weiss5293ec22023-03-06 18:58:36 -0800206 std::cerr << "Failed during restartControlLoops, try again: "
Hao Jiang232ffe42021-02-21 20:11:49 -0800207 << e.what() << "\n";
208 tryRestartControlLoops(false);
209 }
Hao Jiangd11a7322021-03-24 11:25:57 -0700210 };
Zev Weiss5293ec22023-03-06 18:58:36 -0800211
Hao Jiangd11a7322021-03-24 11:25:57 -0700212 // first time of trying to restart the control loop without a delay
213 if (first)
214 {
Ed Tanousd2768c52025-06-26 11:42:57 -0700215 boost::asio::post(io, [restartLbd] {
216 restartLbd(boost::system::error_code());
217 });
Hao Jiangd11a7322021-03-24 11:25:57 -0700218 }
219 // re-try control loop, set up a delay.
220 else
221 {
222 timer.expires_after(delayTime);
223 timer.async_wait(restartLbd);
224 }
Yong Li298a95c2020-04-07 15:11:02 +0800225
226 return;
227}
228
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200229void tryTerminateControlLoops(bool first)
230{
231 static const auto delayTime = std::chrono::milliseconds(50);
232 static boost::asio::steady_timer timer(io);
233
234 auto stopLbd = [](const boost::system::error_code& error) {
235 if (error == boost::asio::error::operation_aborted)
236 {
237 return;
238 }
239
240 // retry when stopControlLoops() has some failure.
241 try
242 {
243 stopControlLoops();
244 }
245 catch (const std::exception& e)
246 {
247 std::cerr << "Failed during stopControlLoops, try again: "
248 << e.what() << "\n";
249 tryTerminateControlLoops(false);
250 return;
251 }
252 io.stop();
253 };
254
255 // first time of trying to stop the control loop without a delay
256 if (first)
257 {
Ed Tanousd2768c52025-06-26 11:42:57 -0700258 boost::asio::post(io,
259 [stopLbd] { stopLbd(boost::system::error_code()); });
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200260 }
261 // re-try control loop, set up a delay.
262 else
263 {
264 timer.expires_after(delayTime);
265 timer.async_wait(stopLbd);
266 }
267
268 return;
269}
270
Patrick Venturea0764872020-08-08 07:48:43 -0700271} // namespace pid_control
272
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200273void signalHandler(const boost::system::error_code& error, int signal_number)
Potin Laie2ec69a2022-09-30 17:09:34 +0800274{
275 static boost::asio::steady_timer timer(io);
276
277 if (error)
278 {
279 std::cout << "Signal " << signal_number
280 << " handler error: " << error.message() << "\n";
281 return;
282 }
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200283 if (signal_number == SIGTERM)
284 {
285 pid_control::tryTerminateControlLoops(true);
286 }
287 else
288 {
289 timer.expires_after(std::chrono::seconds(1));
290 timer.async_wait([](const boost::system::error_code ec) {
291 if (ec)
292 {
293 std::cout << "Signal timer error: " << ec.message() << "\n";
294 return;
295 }
Potin Laie2ec69a2022-09-30 17:09:34 +0800296
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200297 std::cout << "reloading configuration\n";
298 pid_control::tryRestartControlLoops();
299 });
300 }
Potin Laie2ec69a2022-09-30 17:09:34 +0800301
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200302 signals.async_wait(signalHandler);
Potin Laie2ec69a2022-09-30 17:09:34 +0800303}
304
James Feist1fe08952019-05-07 09:17:16 -0700305int main(int argc, char* argv[])
306{
307 loggingPath = "";
308 loggingEnabled = false;
309 tuningEnabled = false;
Bonnie Loc51ba912022-10-12 14:07:22 +0800310 debugEnabled = false;
Josh Lehande745422020-11-07 02:14:09 -0800311 coreLoggingEnabled = false;
James Feist1fe08952019-05-07 09:17:16 -0700312
313 CLI::App app{"OpenBMC Fan Control Daemon"};
314
315 app.add_option("-c,--conf", configPath,
316 "Optional parameter to specify configuration at run-time")
317 ->check(CLI::ExistingFile);
318 app.add_option("-l,--log", loggingPath,
319 "Optional parameter to specify logging folder")
320 ->check(CLI::ExistingDirectory);
321 app.add_flag("-t,--tuning", tuningEnabled, "Enable or disable tuning");
Bonnie Loc51ba912022-10-12 14:07:22 +0800322 app.add_flag("-d,--debug", debugEnabled, "Enable or disable debug mode");
Josh Lehande745422020-11-07 02:14:09 -0800323 app.add_flag("-g,--corelogging", coreLoggingEnabled,
324 "Enable or disable logging of core PID loop computations");
James Feist1fe08952019-05-07 09:17:16 -0700325
James Feist1fe08952019-05-07 09:17:16 -0700326 CLI11_PARSE(app, argc, argv);
327
Josh Lehan811f31d2020-09-20 23:31:55 -0700328 static constexpr auto loggingEnablePath = "/etc/thermal.d/logging";
329 static constexpr auto tuningEnablePath = "/etc/thermal.d/tuning";
Bonnie Loc51ba912022-10-12 14:07:22 +0800330 static constexpr auto debugEnablePath = "/etc/thermal.d/debugging";
Josh Lehande745422020-11-07 02:14:09 -0800331 static constexpr auto coreLoggingEnablePath = "/etc/thermal.d/corelogging";
Josh Lehan811f31d2020-09-20 23:31:55 -0700332
Josh Lehanf54b2602021-04-09 12:17:34 -0700333 // Set up default logging path, preferring command line if it was given
334 std::string defLoggingPath(loggingPath);
335 if (defLoggingPath.empty())
336 {
337 defLoggingPath = std::filesystem::temp_directory_path();
338 }
339 else
340 {
341 // Enable logging, if user explicitly gave path on command line
342 loggingEnabled = true;
343 }
344
Josh Lehan811f31d2020-09-20 23:31:55 -0700345 // If this file exists, enable logging at runtime
346 std::ifstream fsLogging(loggingEnablePath);
347 if (fsLogging)
348 {
Josh Lehande745422020-11-07 02:14:09 -0800349 // Allow logging path to be changed by file content
350 std::string altPath;
351 std::getline(fsLogging, altPath);
Josh Lehan811f31d2020-09-20 23:31:55 -0700352 fsLogging.close();
353
Josh Lehande745422020-11-07 02:14:09 -0800354 if (std::filesystem::exists(altPath))
Josh Lehanf54b2602021-04-09 12:17:34 -0700355 {
Josh Lehande745422020-11-07 02:14:09 -0800356 loggingPath = altPath;
Josh Lehanf54b2602021-04-09 12:17:34 -0700357 }
Jinliang Wangcdc8dca2023-04-20 14:36:22 -0700358 else
359 {
360 loggingPath = defLoggingPath;
361 }
Josh Lehanf54b2602021-04-09 12:17:34 -0700362
Josh Lehan811f31d2020-09-20 23:31:55 -0700363 loggingEnabled = true;
Josh Lehanf54b2602021-04-09 12:17:34 -0700364 }
Josh Lehanf54b2602021-04-09 12:17:34 -0700365 if (loggingEnabled)
366 {
Josh Lehan811f31d2020-09-20 23:31:55 -0700367 std::cerr << "Logging enabled: " << loggingPath << "\n";
368 }
369
370 // If this file exists, enable tuning at runtime
371 if (std::filesystem::exists(tuningEnablePath))
372 {
373 tuningEnabled = true;
Josh Lehanf54b2602021-04-09 12:17:34 -0700374 }
Josh Lehanf54b2602021-04-09 12:17:34 -0700375 if (tuningEnabled)
376 {
Josh Lehan811f31d2020-09-20 23:31:55 -0700377 std::cerr << "Tuning enabled\n";
378 }
Kun Yid4695592019-05-17 10:42:18 -0700379
Bonnie Loc51ba912022-10-12 14:07:22 +0800380 // If this file exists, enable debug mode at runtime
381 if (std::filesystem::exists(debugEnablePath))
382 {
383 debugEnabled = true;
384 }
385
386 if (debugEnabled)
387 {
388 std::cerr << "Debug mode enabled\n";
389 }
390
Josh Lehande745422020-11-07 02:14:09 -0800391 // If this file exists, enable core logging at runtime
392 if (std::filesystem::exists(coreLoggingEnablePath))
393 {
394 coreLoggingEnabled = true;
395 }
396 if (coreLoggingEnabled)
397 {
398 std::cerr << "Core logging enabled\n";
399 }
400
James Feist1fe08952019-05-07 09:17:16 -0700401 static constexpr auto modeRoot = "/xyz/openbmc_project/settings/fanctrl";
402 // Create a manager for the ModeBus because we own it.
Ed Tanousd2768c52025-06-26 11:42:57 -0700403 sdbusplus::server::manager_t manager(
404 static_cast<sdbusplus::bus_t&>(modeControlBus), modeRoot);
James Feist1fe08952019-05-07 09:17:16 -0700405 hostBus.request_name("xyz.openbmc_project.Hwmon.external");
406 modeControlBus.request_name("xyz.openbmc_project.State.FanCtrl");
Patrick Williamsb228bc32022-07-22 19:26:56 -0500407 sdbusplus::server::manager_t objManager(modeControlBus, modeRoot);
James Feist1fe08952019-05-07 09:17:16 -0700408
Potin Laie2ec69a2022-09-30 17:09:34 +0800409 // Enable SIGHUP handling to reload JSON config
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200410 signals.async_wait(signalHandler);
Potin Laie2ec69a2022-09-30 17:09:34 +0800411
Patrick Venturee6206562018-03-08 15:36:53 -0800412 /*
413 * All sensors are managed by one manager, but each zone has a pointer to
414 * it.
415 */
416
Patrick Venturea0764872020-08-08 07:48:43 -0700417 pid_control::tryRestartControlLoops();
Patrick Venturee6206562018-03-08 15:36:53 -0800418
Potin Laie1fa8592025-08-29 15:27:08 +0800419 /* setup host state monitor */
420 auto& monitor = HostStateMonitor::getInstance(hostMatchBus);
421 monitor.startMonitoring();
422
James Feistce6a3f32019-03-12 11:20:16 -0700423 io.run();
James Feist1fe08952019-05-07 09:17:16 -0700424 return 0;
Patrick Venturee6206562018-03-08 15:36:53 -0800425}