blob: d4bfaae5c4e7bc7789ef95759891c6d329c7ca31 [file] [log] [blame]
Patrick Venturee6206562018-03-08 15:36:53 -08001/**
2 * Copyright 2017 Google Inc.
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
Pete O_o765a6d82025-07-23 21:44:14 -070016#include "config.h"
Patrick Venturee6206562018-03-08 15:36:53 -080017
Harvey Wu3dcfd542022-10-31 17:11:02 +080018#include "buildjson/buildjson.hpp"
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070019#include "conf.hpp"
Patrick Venture7f9d6902020-09-10 12:09:57 -070020#include "dbus/dbusconfiguration.hpp"
James Zheng6df8bb52024-11-27 23:38:47 +000021#include "failsafeloggers/builder.hpp"
Patrick Venture5c7cc542018-06-11 14:29:38 -070022#include "pid/builder.hpp"
Patrick Ventureba8ffa72019-02-11 12:03:56 -080023#include "pid/buildjson.hpp"
James Feistce6a3f32019-03-12 11:20:16 -070024#include "pid/pidloop.hpp"
Patrick Venturec32e3fc2019-02-28 10:01:11 -080025#include "pid/tuning.hpp"
Patrick Venture5e929092018-06-08 10:55:23 -070026#include "sensors/builder.hpp"
Patrick Ventureba8ffa72019-02-11 12:03:56 -080027#include "sensors/buildjson.hpp"
Patrick Venturee6206562018-03-08 15:36:53 -080028#include "sensors/manager.hpp"
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070029#include "util.hpp"
Ed Tanousf8b6e552025-06-27 13:27:50 -070030#include "zone_interface.hpp"
31
32#include <signal.h>
Patrick Venturee6206562018-03-08 15:36:53 -080033
Patrick Ventureb5cc37c2019-03-11 09:11:55 -070034#include <CLI/CLI.hpp>
Ed Tanousf8b6e552025-06-27 13:27:50 -070035#include <boost/asio/error.hpp>
James Feistce6a3f32019-03-12 11:20:16 -070036#include <boost/asio/io_context.hpp>
Ed Tanousf8b6e552025-06-27 13:27:50 -070037#include <boost/asio/post.hpp>
Potin Laie2ec69a2022-09-30 17:09:34 +080038#include <boost/asio/signal_set.hpp>
James Feistce6a3f32019-03-12 11:20:16 -070039#include <boost/asio/steady_timer.hpp>
Patrick Venturea83a3ec2020-08-04 09:52:05 -070040#include <sdbusplus/asio/connection.hpp>
41#include <sdbusplus/bus.hpp>
Bruce Leecb4c1a22021-04-20 16:06:38 +080042#include <sdbusplus/server/manager.hpp>
Patrick Venturea83a3ec2020-08-04 09:52:05 -070043
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070044#include <chrono>
Ed Tanousf8b6e552025-06-27 13:27:50 -070045#include <csignal>
46#include <cstdint>
47#include <cstdlib>
48#include <exception>
Patrick Venture7f9d6902020-09-10 12:09:57 -070049#include <filesystem>
Ed Tanousf8b6e552025-06-27 13:27:50 -070050#include <fstream>
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070051#include <iostream>
52#include <map>
53#include <memory>
Patrick Williamse3c60772025-04-07 17:53:42 -040054#include <optional>
Ed Tanousf8b6e552025-06-27 13:27:50 -070055#include <stdexcept>
56#include <string>
57#include <tuple>
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070058#include <unordered_map>
Patrick Ventureba8ffa72019-02-11 12:03:56 -080059#include <utility>
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070060#include <vector>
Patrick Venturee6206562018-03-08 15:36:53 -080061
Patrick Venturea0764872020-08-08 07:48:43 -070062namespace pid_control
63{
64
James Feist1fe08952019-05-07 09:17:16 -070065/* The configuration converted sensor list. */
Patrick Venture1df9e872020-10-08 15:35:01 -070066std::map<std::string, conf::SensorConfig> sensorConfig = {};
James Feist1fe08952019-05-07 09:17:16 -070067/* The configuration converted PID list. */
James Feistf81f2882019-02-26 11:26:36 -080068std::map<int64_t, conf::PIDConf> zoneConfig = {};
James Feist1fe08952019-05-07 09:17:16 -070069/* The configuration converted Zone configuration. */
Patrick Venture1df9e872020-10-08 15:35:01 -070070std::map<int64_t, conf::ZoneConfig> zoneDetailsConfig = {};
Patrick Venturee6206562018-03-08 15:36:53 -080071
Patrick Rudolphc7b2be32023-10-13 12:34:58 +020072namespace state
73{
74/* Set to true while canceling is in progress */
75static bool isCanceling = false;
76/* The zones build from configuration */
77static std::unordered_map<int64_t, std::shared_ptr<ZoneInterface>> zones;
78/* The timers used by the PID loop */
79static std::vector<std::shared_ptr<boost::asio::steady_timer>> timers;
80/* The sensors build from configuration */
Patrick Williamse3c60772025-04-07 17:53:42 -040081static std::optional<SensorManager> mgmr;
Patrick Rudolphc7b2be32023-10-13 12:34:58 +020082} // namespace state
83
Patrick Venturea0764872020-08-08 07:48:43 -070084} // namespace pid_control
85
Potin Lai79cde002023-02-16 13:53:10 +080086std::filesystem::path configPath = "";
Patrick Venturec19f5d42019-02-14 10:59:47 -080087
James Feist1fe08952019-05-07 09:17:16 -070088/* async io context for operation */
89boost::asio::io_context io;
Potin Laie2ec69a2022-09-30 17:09:34 +080090/* async signal_set for signal handling */
Patrick Rudolphc7b2be32023-10-13 12:34:58 +020091boost::asio::signal_set signals(io, SIGHUP, SIGTERM);
James Feist1fe08952019-05-07 09:17:16 -070092
93/* buses for system control */
94static sdbusplus::asio::connection modeControlBus(io);
Patrick Williams7dea66c2025-04-07 14:23:50 -040095static sdbusplus::asio::connection hostBus(io, sdbusplus::bus::new_bus());
96static sdbusplus::asio::connection passiveBus(io, sdbusplus::bus::new_bus());
James Feist1fe08952019-05-07 09:17:16 -070097
Patrick Venturea0764872020-08-08 07:48:43 -070098namespace pid_control
99{
100
Potin Lai79cde002023-02-16 13:53:10 +0800101std::filesystem::path searchConfigurationPath()
102{
103 static constexpr auto name = "config.json";
104
Ed Tanousd2768c52025-06-26 11:42:57 -0700105 for (const auto& pathSeg : {std::filesystem::current_path(),
106 std::filesystem::path{"/var/lib/swampd"},
107 std::filesystem::path{"/usr/share/swampd"}})
Potin Lai79cde002023-02-16 13:53:10 +0800108 {
109 auto file = pathSeg / name;
110 if (std::filesystem::exists(file))
111 {
112 return file;
113 }
114 }
115
116 return name;
117}
118
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200119void stopControlLoops()
Patrick Venturee6206562018-03-08 15:36:53 -0800120{
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200121 for (const auto& timer : state::timers)
Johnathan Mantey5301aae2020-09-28 11:06:58 -0700122 {
123 timer->cancel();
124 }
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200125 state::isCanceling = true;
126 state::timers.clear();
Hao Jiangb228cea2021-02-20 11:53:09 -0800127
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200128 if (state::zones.size() > 0 && state::zones.begin()->second.use_count() > 1)
Hao Jiangb228cea2021-02-20 11:53:09 -0800129 {
130 throw std::runtime_error("wait for count back to 1");
131 }
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200132
133 state::zones.clear();
134 state::isCanceling = false;
135}
136
137void restartControlLoops()
138{
139 stopControlLoops();
Patrick Venture4cb7c052019-02-14 11:11:33 -0800140
Potin Lai79cde002023-02-16 13:53:10 +0800141 const std::filesystem::path path =
142 (!configPath.empty()) ? configPath : searchConfigurationPath();
Patrick Venturee6206562018-03-08 15:36:53 -0800143
Patrick Venture7f9d6902020-09-10 12:09:57 -0700144 if (std::filesystem::exists(path))
Patrick Venturee6206562018-03-08 15:36:53 -0800145 {
Patrick Venture7f9d6902020-09-10 12:09:57 -0700146 /*
147 * When building the sensors, if any of the dbus passive ones aren't on
148 * the bus, it'll fail immediately.
149 */
150 try
151 {
152 auto jsonData = parseValidateJson(path);
153 sensorConfig = buildSensorsFromJson(jsonData);
Patrick Williamsbd63bca2024-08-16 15:21:10 -0400154 std::tie(zoneConfig, zoneDetailsConfig) =
155 buildPIDsFromJson(jsonData);
Patrick Venture7f9d6902020-09-10 12:09:57 -0700156 }
157 catch (const std::exception& e)
158 {
159 std::cerr << "Failed during building: " << e.what() << "\n";
160 exit(EXIT_FAILURE); /* fatal error. */
161 }
Patrick Venturee6206562018-03-08 15:36:53 -0800162 }
Patrick Venture7f9d6902020-09-10 12:09:57 -0700163 else
Patrick Venture18b13112019-02-14 11:43:59 -0800164 {
Patrick Venture7f9d6902020-09-10 12:09:57 -0700165 static boost::asio::steady_timer reloadTimer(io);
Patrick Venture73823182020-10-08 15:12:51 -0700166 if (!dbus_configuration::init(modeControlBus, reloadTimer, sensorConfig,
167 zoneConfig, zoneDetailsConfig))
Patrick Venture7f9d6902020-09-10 12:09:57 -0700168 {
169 return; // configuration not ready
170 }
Patrick Venture18b13112019-02-14 11:43:59 -0800171 }
Patrick Venture4cb7c052019-02-14 11:11:33 -0800172
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200173 state::mgmr = buildSensors(sensorConfig, passiveBus, hostBus);
Patrick Williamsbd63bca2024-08-16 15:21:10 -0400174 state::zones =
Patrick Williamse3c60772025-04-07 17:53:42 -0400175 buildZones(zoneConfig, zoneDetailsConfig, *state::mgmr, modeControlBus);
James Zheng6df8bb52024-11-27 23:38:47 +0000176 // Set `logMaxCountPerSecond` to 20 will limit the number of logs output per
177 // second in each zone. Using 20 here would limit the output rate to be no
178 // larger than 100 per sec for most platforms as the number of zones are
179 // usually <=3. This will effectively avoid resource exhaustion.
180 buildFailsafeLoggers(state::zones, /* logMaxCountPerSecond = */ 20);
Patrick Venturee6206562018-03-08 15:36:53 -0800181
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200182 if (0 == state::zones.size())
Patrick Venturee6206562018-03-08 15:36:53 -0800183 {
184 std::cerr << "No zones defined, exiting.\n";
James Feist1fe08952019-05-07 09:17:16 -0700185 std::exit(EXIT_FAILURE);
Patrick Venturee6206562018-03-08 15:36:53 -0800186 }
187
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200188 for (const auto& i : state::zones)
James Feist1fe08952019-05-07 09:17:16 -0700189 {
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200190 std::shared_ptr<boost::asio::steady_timer> timer =
191 state::timers.emplace_back(
192 std::make_shared<boost::asio::steady_timer>(io));
James Feist1fe08952019-05-07 09:17:16 -0700193 std::cerr << "pushing zone " << i.first << "\n";
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200194 pidControlLoop(i.second, timer, &state::isCanceling);
James Feist1fe08952019-05-07 09:17:16 -0700195 }
196}
197
Hao Jiangb228cea2021-02-20 11:53:09 -0800198void tryRestartControlLoops(bool first)
Yong Li298a95c2020-04-07 15:11:02 +0800199{
Hao Jiangd11a7322021-03-24 11:25:57 -0700200 static const auto delayTime = std::chrono::seconds(10);
Hao Jiangb228cea2021-02-20 11:53:09 -0800201 static boost::asio::steady_timer timer(io);
Hao Jiangd11a7322021-03-24 11:25:57 -0700202
203 auto restartLbd = [](const boost::system::error_code& error) {
Hao Jiang232ffe42021-02-21 20:11:49 -0800204 if (error == boost::asio::error::operation_aborted)
205 {
206 return;
207 }
Hao Jiangb228cea2021-02-20 11:53:09 -0800208
Hao Jiang232ffe42021-02-21 20:11:49 -0800209 // retry when restartControlLoops() has some failure.
210 try
211 {
212 restartControlLoops();
Hao Jiang232ffe42021-02-21 20:11:49 -0800213 }
214 catch (const std::exception& e)
215 {
Zev Weiss5293ec22023-03-06 18:58:36 -0800216 std::cerr << "Failed during restartControlLoops, try again: "
Hao Jiang232ffe42021-02-21 20:11:49 -0800217 << e.what() << "\n";
218 tryRestartControlLoops(false);
219 }
Hao Jiangd11a7322021-03-24 11:25:57 -0700220 };
Zev Weiss5293ec22023-03-06 18:58:36 -0800221
Hao Jiangd11a7322021-03-24 11:25:57 -0700222 // first time of trying to restart the control loop without a delay
223 if (first)
224 {
Ed Tanousd2768c52025-06-26 11:42:57 -0700225 boost::asio::post(io, [restartLbd] {
226 restartLbd(boost::system::error_code());
227 });
Hao Jiangd11a7322021-03-24 11:25:57 -0700228 }
229 // re-try control loop, set up a delay.
230 else
231 {
232 timer.expires_after(delayTime);
233 timer.async_wait(restartLbd);
234 }
Yong Li298a95c2020-04-07 15:11:02 +0800235
236 return;
237}
238
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200239void tryTerminateControlLoops(bool first)
240{
241 static const auto delayTime = std::chrono::milliseconds(50);
242 static boost::asio::steady_timer timer(io);
243
244 auto stopLbd = [](const boost::system::error_code& error) {
245 if (error == boost::asio::error::operation_aborted)
246 {
247 return;
248 }
249
250 // retry when stopControlLoops() has some failure.
251 try
252 {
253 stopControlLoops();
254 }
255 catch (const std::exception& e)
256 {
257 std::cerr << "Failed during stopControlLoops, try again: "
258 << e.what() << "\n";
259 tryTerminateControlLoops(false);
260 return;
261 }
262 io.stop();
263 };
264
265 // first time of trying to stop the control loop without a delay
266 if (first)
267 {
Ed Tanousd2768c52025-06-26 11:42:57 -0700268 boost::asio::post(io,
269 [stopLbd] { stopLbd(boost::system::error_code()); });
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200270 }
271 // re-try control loop, set up a delay.
272 else
273 {
274 timer.expires_after(delayTime);
275 timer.async_wait(stopLbd);
276 }
277
278 return;
279}
280
Patrick Venturea0764872020-08-08 07:48:43 -0700281} // namespace pid_control
282
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200283void signalHandler(const boost::system::error_code& error, int signal_number)
Potin Laie2ec69a2022-09-30 17:09:34 +0800284{
285 static boost::asio::steady_timer timer(io);
286
287 if (error)
288 {
289 std::cout << "Signal " << signal_number
290 << " handler error: " << error.message() << "\n";
291 return;
292 }
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200293 if (signal_number == SIGTERM)
294 {
295 pid_control::tryTerminateControlLoops(true);
296 }
297 else
298 {
299 timer.expires_after(std::chrono::seconds(1));
300 timer.async_wait([](const boost::system::error_code ec) {
301 if (ec)
302 {
303 std::cout << "Signal timer error: " << ec.message() << "\n";
304 return;
305 }
Potin Laie2ec69a2022-09-30 17:09:34 +0800306
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200307 std::cout << "reloading configuration\n";
308 pid_control::tryRestartControlLoops();
309 });
310 }
Potin Laie2ec69a2022-09-30 17:09:34 +0800311
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200312 signals.async_wait(signalHandler);
Potin Laie2ec69a2022-09-30 17:09:34 +0800313}
314
James Feist1fe08952019-05-07 09:17:16 -0700315int main(int argc, char* argv[])
316{
317 loggingPath = "";
318 loggingEnabled = false;
319 tuningEnabled = false;
Bonnie Loc51ba912022-10-12 14:07:22 +0800320 debugEnabled = false;
Josh Lehande745422020-11-07 02:14:09 -0800321 coreLoggingEnabled = false;
James Feist1fe08952019-05-07 09:17:16 -0700322
323 CLI::App app{"OpenBMC Fan Control Daemon"};
324
325 app.add_option("-c,--conf", configPath,
326 "Optional parameter to specify configuration at run-time")
327 ->check(CLI::ExistingFile);
328 app.add_option("-l,--log", loggingPath,
329 "Optional parameter to specify logging folder")
330 ->check(CLI::ExistingDirectory);
331 app.add_flag("-t,--tuning", tuningEnabled, "Enable or disable tuning");
Bonnie Loc51ba912022-10-12 14:07:22 +0800332 app.add_flag("-d,--debug", debugEnabled, "Enable or disable debug mode");
Josh Lehande745422020-11-07 02:14:09 -0800333 app.add_flag("-g,--corelogging", coreLoggingEnabled,
334 "Enable or disable logging of core PID loop computations");
James Feist1fe08952019-05-07 09:17:16 -0700335
James Feist1fe08952019-05-07 09:17:16 -0700336 CLI11_PARSE(app, argc, argv);
337
Josh Lehan811f31d2020-09-20 23:31:55 -0700338 static constexpr auto loggingEnablePath = "/etc/thermal.d/logging";
339 static constexpr auto tuningEnablePath = "/etc/thermal.d/tuning";
Bonnie Loc51ba912022-10-12 14:07:22 +0800340 static constexpr auto debugEnablePath = "/etc/thermal.d/debugging";
Josh Lehande745422020-11-07 02:14:09 -0800341 static constexpr auto coreLoggingEnablePath = "/etc/thermal.d/corelogging";
Josh Lehan811f31d2020-09-20 23:31:55 -0700342
Josh Lehanf54b2602021-04-09 12:17:34 -0700343 // Set up default logging path, preferring command line if it was given
344 std::string defLoggingPath(loggingPath);
345 if (defLoggingPath.empty())
346 {
347 defLoggingPath = std::filesystem::temp_directory_path();
348 }
349 else
350 {
351 // Enable logging, if user explicitly gave path on command line
352 loggingEnabled = true;
353 }
354
Josh Lehan811f31d2020-09-20 23:31:55 -0700355 // If this file exists, enable logging at runtime
356 std::ifstream fsLogging(loggingEnablePath);
357 if (fsLogging)
358 {
Josh Lehande745422020-11-07 02:14:09 -0800359 // Allow logging path to be changed by file content
360 std::string altPath;
361 std::getline(fsLogging, altPath);
Josh Lehan811f31d2020-09-20 23:31:55 -0700362 fsLogging.close();
363
Josh Lehande745422020-11-07 02:14:09 -0800364 if (std::filesystem::exists(altPath))
Josh Lehanf54b2602021-04-09 12:17:34 -0700365 {
Josh Lehande745422020-11-07 02:14:09 -0800366 loggingPath = altPath;
Josh Lehanf54b2602021-04-09 12:17:34 -0700367 }
Jinliang Wangcdc8dca2023-04-20 14:36:22 -0700368 else
369 {
370 loggingPath = defLoggingPath;
371 }
Josh Lehanf54b2602021-04-09 12:17:34 -0700372
Josh Lehan811f31d2020-09-20 23:31:55 -0700373 loggingEnabled = true;
Josh Lehanf54b2602021-04-09 12:17:34 -0700374 }
Josh Lehanf54b2602021-04-09 12:17:34 -0700375 if (loggingEnabled)
376 {
Josh Lehan811f31d2020-09-20 23:31:55 -0700377 std::cerr << "Logging enabled: " << loggingPath << "\n";
378 }
379
380 // If this file exists, enable tuning at runtime
381 if (std::filesystem::exists(tuningEnablePath))
382 {
383 tuningEnabled = true;
Josh Lehanf54b2602021-04-09 12:17:34 -0700384 }
Josh Lehanf54b2602021-04-09 12:17:34 -0700385 if (tuningEnabled)
386 {
Josh Lehan811f31d2020-09-20 23:31:55 -0700387 std::cerr << "Tuning enabled\n";
388 }
Kun Yid4695592019-05-17 10:42:18 -0700389
Bonnie Loc51ba912022-10-12 14:07:22 +0800390 // If this file exists, enable debug mode at runtime
391 if (std::filesystem::exists(debugEnablePath))
392 {
393 debugEnabled = true;
394 }
395
396 if (debugEnabled)
397 {
398 std::cerr << "Debug mode enabled\n";
399 }
400
Josh Lehande745422020-11-07 02:14:09 -0800401 // If this file exists, enable core logging at runtime
402 if (std::filesystem::exists(coreLoggingEnablePath))
403 {
404 coreLoggingEnabled = true;
405 }
406 if (coreLoggingEnabled)
407 {
408 std::cerr << "Core logging enabled\n";
409 }
410
James Feist1fe08952019-05-07 09:17:16 -0700411 static constexpr auto modeRoot = "/xyz/openbmc_project/settings/fanctrl";
412 // Create a manager for the ModeBus because we own it.
Ed Tanousd2768c52025-06-26 11:42:57 -0700413 sdbusplus::server::manager_t manager(
414 static_cast<sdbusplus::bus_t&>(modeControlBus), modeRoot);
James Feist1fe08952019-05-07 09:17:16 -0700415 hostBus.request_name("xyz.openbmc_project.Hwmon.external");
416 modeControlBus.request_name("xyz.openbmc_project.State.FanCtrl");
Patrick Williamsb228bc32022-07-22 19:26:56 -0500417 sdbusplus::server::manager_t objManager(modeControlBus, modeRoot);
James Feist1fe08952019-05-07 09:17:16 -0700418
Potin Laie2ec69a2022-09-30 17:09:34 +0800419 // Enable SIGHUP handling to reload JSON config
Patrick Rudolphc7b2be32023-10-13 12:34:58 +0200420 signals.async_wait(signalHandler);
Potin Laie2ec69a2022-09-30 17:09:34 +0800421
Patrick Venturee6206562018-03-08 15:36:53 -0800422 /*
423 * All sensors are managed by one manager, but each zone has a pointer to
424 * it.
425 */
426
Patrick Venturea0764872020-08-08 07:48:43 -0700427 pid_control::tryRestartControlLoops();
Patrick Venturee6206562018-03-08 15:36:53 -0800428
James Feistce6a3f32019-03-12 11:20:16 -0700429 io.run();
James Feist1fe08952019-05-07 09:17:16 -0700430 return 0;
Patrick Venturee6206562018-03-08 15:36:53 -0800431}