blob: aa4cbaf07bf2d3c9a51da2505ea79267d611af55 [file] [log] [blame]
/**
 * Copyright 2017 Google Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
Jonico Eustaquioaf97d8e2024-01-02 14:35:07 -060016#include "config.h"
17
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070018#include "dbuspassive.hpp"
19
Patrick Ventureaadb30d2020-08-10 09:17:11 -070020#include "dbushelper_interface.hpp"
James Feist98b704e2019-06-03 16:24:53 -070021#include "dbuspassiveredundancy.hpp"
Patrick Ventureaadb30d2020-08-10 09:17:11 -070022#include "dbusutil.hpp"
James Feist0c8223b2019-05-08 15:33:33 -070023#include "util.hpp"
Patrick Ventureda4a5dd2018-08-31 09:42:48 -070024
Patrick Venturea83a3ec2020-08-04 09:52:05 -070025#include <sdbusplus/bus.hpp>
26
Patrick Venture863b9242018-03-08 08:29:23 -080027#include <chrono>
28#include <cmath>
Patrick Venture0ef1faf2018-06-13 12:50:53 -070029#include <memory>
Patrick Venture863b9242018-03-08 08:29:23 -080030#include <mutex>
Patrick Venture0ef1faf2018-06-13 12:50:53 -070031#include <string>
James Feist1f802f52019-02-08 13:51:43 -080032#include <variant>
Patrick Venture863b9242018-03-08 08:29:23 -080033
Patrick Venturea0764872020-08-08 07:48:43 -070034namespace pid_control
35{
36
Patrick Venture563a3562018-10-30 09:31:26 -070037std::unique_ptr<ReadInterface> DbusPassive::createDbusPassive(
Patrick Williamsb228bc32022-07-22 19:26:56 -050038 sdbusplus::bus_t& bus, const std::string& type, const std::string& id,
Patrick Venture8729eb92020-08-10 10:38:44 -070039 std::unique_ptr<DbusHelperInterface> helper, const conf::SensorConfig* info,
James Feist98b704e2019-06-03 16:24:53 -070040 const std::shared_ptr<DbusPassiveRedundancy>& redundancy)
Patrick Venture0ef1faf2018-06-13 12:50:53 -070041{
42 if (helper == nullptr)
43 {
44 return nullptr;
45 }
Patrick Venture7af157b2018-10-30 11:24:40 -070046 if (!validType(type))
Patrick Venture0ef1faf2018-06-13 12:50:53 -070047 {
48 return nullptr;
49 }
50
Patrick Venture863b9242018-03-08 08:29:23 -080051 /* Need to get the scale and initial value */
Patrick Venture863b9242018-03-08 08:29:23 -080052 /* service == busname */
Harvey.Wuf2efcbb2022-02-09 10:24:30 +080053 std::string path;
54 if (info->readPath.empty())
55 {
56 path = getSensorPath(type, id);
57 }
58 else
59 {
60 path = info->readPath;
61 }
Patrick Venture34ddc902018-10-30 11:05:17 -070062
Patrick Venture1df9e872020-10-08 15:35:01 -070063 SensorProperties settings;
Patrick Venturef8cb4642018-10-30 12:02:53 -070064 bool failed;
Patrick Venture863b9242018-03-08 08:29:23 -080065
Patrick Venturef8cb4642018-10-30 12:02:53 -070066 try
67 {
Patrick Venture9b936922020-08-10 11:28:39 -070068 std::string service = helper->getService(sensorintf, path);
Patrick Venturef8cb4642018-10-30 12:02:53 -070069
Patrick Venture9b936922020-08-10 11:28:39 -070070 helper->getProperties(service, path, &settings);
71 failed = helper->thresholdsAsserted(service, path);
Patrick Venturef8cb4642018-10-30 12:02:53 -070072 }
73 catch (const std::exception& e)
74 {
75 return nullptr;
76 }
77
Patrick Venture6b9f5992019-09-10 09:18:28 -070078 /* if these values are zero, they're ignored. */
79 if (info->ignoreDbusMinMax)
80 {
81 settings.min = 0;
82 settings.max = 0;
83 }
84
Alex.Song8f73ad72021-10-07 00:18:27 +080085 settings.unavailableAsFailed = info->unavailableAsFailed;
86
Patrick Venture8729eb92020-08-10 10:38:44 -070087 return std::make_unique<DbusPassive>(bus, type, id, std::move(helper),
88 settings, failed, path, redundancy);
Patrick Venturef8cb4642018-10-30 12:02:53 -070089}
90
James Feist98b704e2019-06-03 16:24:53 -070091DbusPassive::DbusPassive(
Patrick Williamsb228bc32022-07-22 19:26:56 -050092 sdbusplus::bus_t& bus, const std::string& type, const std::string& id,
Patrick Venture8729eb92020-08-10 10:38:44 -070093 std::unique_ptr<DbusHelperInterface> helper,
Patrick Venture1df9e872020-10-08 15:35:01 -070094 const SensorProperties& settings, bool failed, const std::string& path,
James Feist98b704e2019-06-03 16:24:53 -070095 const std::shared_ptr<DbusPassiveRedundancy>& redundancy) :
Patrick Williamsbd63bca2024-08-16 15:21:10 -040096 ReadInterface(), _signal(bus, getMatch(path), dbusHandleSignal, this),
97 _id(id), _helper(std::move(helper)), _failed(failed), path(path),
James Feist98b704e2019-06-03 16:24:53 -070098 redundancy(redundancy)
99
Patrick Venturef8cb4642018-10-30 12:02:53 -0700100{
Patrick Venture863b9242018-03-08 08:29:23 -0800101 _scale = settings.scale;
Josh Lehan3e2f7582020-09-20 22:06:03 -0700102 _min = settings.min * std::pow(10.0, _scale);
103 _max = settings.max * std::pow(10.0, _scale);
Alex.Song8f73ad72021-10-07 00:18:27 +0800104 _available = settings.available;
105 _unavailableAsFailed = settings.unavailableAsFailed;
Josh Lehan3e2f7582020-09-20 22:06:03 -0700106
107 // Cache this type knowledge, to avoid repeated string comparison
108 _typeMargin = (type == "margin");
Alex.Song8f73ad72021-10-07 00:18:27 +0800109 _typeFan = (type == "fan");
Josh Lehan3e2f7582020-09-20 22:06:03 -0700110
111 // Force value to be stored, otherwise member would be uninitialized
112 updateValue(settings.value, true);
Patrick Venture863b9242018-03-08 08:29:23 -0800113}
114
115ReadReturn DbusPassive::read(void)
116{
117 std::lock_guard<std::mutex> guard(_lock);
118
Josh Lehanb3005752022-02-22 20:48:07 -0800119 ReadReturn r = {_value, _updated, _unscaled};
Patrick Venture863b9242018-03-08 08:29:23 -0800120
121 return r;
122}
123
Josh Lehanb3005752022-02-22 20:48:07 -0800124void DbusPassive::setValue(double value, double unscaled)
Patrick Venture863b9242018-03-08 08:29:23 -0800125{
126 std::lock_guard<std::mutex> guard(_lock);
127
128 _value = value;
Josh Lehanb3005752022-02-22 20:48:07 -0800129 _unscaled = unscaled;
Patrick Venture863b9242018-03-08 08:29:23 -0800130 _updated = std::chrono::high_resolution_clock::now();
131}
132
Josh Lehanb3005752022-02-22 20:48:07 -0800133void DbusPassive::setValue(double value)
134{
135 // First param is scaled, second param is unscaled, assume same here
136 setValue(value, value);
137}
138
James Feist36b7d8e2018-10-05 15:39:01 -0700139bool DbusPassive::getFailed(void) const
140{
James Feist98b704e2019-06-03 16:24:53 -0700141 if (redundancy)
142 {
143 const std::set<std::string>& failures = redundancy->getFailed();
144 if (failures.find(path) != failures.end())
145 {
146 return true;
147 }
148 }
James Feist4b36f262020-07-07 16:56:41 -0700149
Alex.Song8f73ad72021-10-07 00:18:27 +0800150 /*
151 * Unavailable thermal sensors, who are not present or
152 * power-state-not-matching, should not trigger the failSafe mode. For
153 * example, when a system stays at a powered-off state, its CPU Temp
154 * sensors will be unavailable, these unavailable sensors should not be
155 * treated as failed and trigger failSafe.
156 * This is important for systems whose Fans are always on.
157 */
158 if (!_typeFan && !_available && !_unavailableAsFailed)
159 {
160 return false;
161 }
162
Josh Lehan3e2f7582020-09-20 22:06:03 -0700163 // If a reading has came in,
164 // but its value bad in some way (determined by sensor type),
165 // indicate this sensor has failed,
166 // until another value comes in that is no longer bad.
167 // This is different from the overall _failed flag,
168 // which is set and cleared by other causes.
169 if (_badReading)
170 {
171 return true;
172 }
173
174 // If a reading has came in, and it is not a bad reading,
175 // but it indicates there is no more thermal margin left,
176 // that is bad, something is wrong with the PID loops,
177 // they are not cooling the system, enable failsafe mode also.
178 if (_marginHot)
179 {
180 return true;
181 }
182
Alex.Song8f73ad72021-10-07 00:18:27 +0800183 return _failed || !_available || !_functional;
James Feist36b7d8e2018-10-05 15:39:01 -0700184}
185
186void DbusPassive::setFailed(bool value)
187{
188 _failed = value;
189}
190
James Feist4b36f262020-07-07 16:56:41 -0700191void DbusPassive::setFunctional(bool value)
192{
193 _functional = value;
194}
195
Alex.Song8f73ad72021-10-07 00:18:27 +0800196void DbusPassive::setAvailable(bool value)
197{
198 _available = value;
199}
200
Patrick Venture863b9242018-03-08 08:29:23 -0800201int64_t DbusPassive::getScale(void)
202{
203 return _scale;
204}
205
Patrick Venture563a3562018-10-30 09:31:26 -0700206std::string DbusPassive::getID(void)
Patrick Venture863b9242018-03-08 08:29:23 -0800207{
208 return _id;
209}
210
James Feist75eb7692019-02-25 12:50:02 -0800211double DbusPassive::getMax(void)
212{
213 return _max;
214}
215
216double DbusPassive::getMin(void)
217{
218 return _min;
219}
220
Josh Lehan3e2f7582020-09-20 22:06:03 -0700221void DbusPassive::updateValue(double value, bool force)
222{
223 _badReading = false;
224
225 // Do not let a NAN, or other floating-point oddity, be used to update
226 // the value, as that indicates the sensor has no valid reading.
227 if (!(std::isfinite(value)))
228 {
229 _badReading = true;
230
231 // Do not continue with a bad reading, unless caller forcing
232 if (!force)
233 {
234 return;
235 }
236 }
237
238 value *= std::pow(10.0, _scale);
239
240 auto unscaled = value;
241 scaleSensorReading(_min, _max, value);
242
243 if (_typeMargin)
244 {
245 _marginHot = false;
246
247 // Unlike an absolute temperature sensor,
248 // where 0 degrees C is a good reading,
249 // a value received of 0 (or negative) margin is worrisome,
250 // and should be flagged.
251 // Either it indicates margin not calculated properly,
252 // or somebody forgot to set the margin-zero setpoint,
253 // or the system is really overheating that much.
254 // This is a different condition from _failed
255 // and _badReading, so it merits its own flag.
256 // The sensor has not failed, the reading is good, but the zone
257 // still needs to know that it should go to failsafe mode.
258 if (unscaled <= 0.0)
259 {
260 _marginHot = true;
261 }
262 }
263
Josh Lehanb3005752022-02-22 20:48:07 -0800264 setValue(value, unscaled);
Josh Lehan3e2f7582020-09-20 22:06:03 -0700265}
266
Patrick Williamsb228bc32022-07-22 19:26:56 -0500267int handleSensorValue(sdbusplus::message_t& msg, DbusPassive* owner)
Patrick Venture863b9242018-03-08 08:29:23 -0800268{
Patrick Venture863b9242018-03-08 08:29:23 -0800269 std::string msgSensor;
James Feist1f802f52019-02-08 13:51:43 -0800270 std::map<std::string, std::variant<int64_t, double, bool>> msgData;
Patrick Ventured0c75662018-06-12 19:03:21 -0700271
272 msg.read(msgSensor, msgData);
Patrick Venture863b9242018-03-08 08:29:23 -0800273
274 if (msgSensor == "xyz.openbmc_project.Sensor.Value")
275 {
276 auto valPropMap = msgData.find("Value");
277 if (valPropMap != msgData.end())
278 {
Patrick Williamsbd63bca2024-08-16 15:21:10 -0400279 double value =
280 std::visit(VariantToDoubleVisitor(), valPropMap->second);
Patrick Venture863b9242018-03-08 08:29:23 -0800281
Josh Lehan3e2f7582020-09-20 22:06:03 -0700282 owner->updateValue(value, false);
Patrick Venture863b9242018-03-08 08:29:23 -0800283 }
284 }
James Feist36b7d8e2018-10-05 15:39:01 -0700285 else if (msgSensor == "xyz.openbmc_project.Sensor.Threshold.Critical")
286 {
287 auto criticalAlarmLow = msgData.find("CriticalAlarmLow");
288 auto criticalAlarmHigh = msgData.find("CriticalAlarmHigh");
289 if (criticalAlarmHigh == msgData.end() &&
290 criticalAlarmLow == msgData.end())
291 {
292 return 0;
293 }
294
295 bool asserted = false;
296 if (criticalAlarmLow != msgData.end())
297 {
James Feist1f802f52019-02-08 13:51:43 -0800298 asserted = std::get<bool>(criticalAlarmLow->second);
James Feist36b7d8e2018-10-05 15:39:01 -0700299 }
300
301 // checking both as in theory you could de-assert one threshold and
302 // assert the other at the same moment
303 if (!asserted && criticalAlarmHigh != msgData.end())
304 {
James Feist1f802f52019-02-08 13:51:43 -0800305 asserted = std::get<bool>(criticalAlarmHigh->second);
James Feist36b7d8e2018-10-05 15:39:01 -0700306 }
307 owner->setFailed(asserted);
308 }
Jonico Eustaquioaf97d8e2024-01-02 14:35:07 -0600309#ifdef UNC_FAILSAFE
310 else if (msgSensor == "xyz.openbmc_project.Sensor.Threshold.Warning")
311 {
312 auto warningAlarmHigh = msgData.find("WarningAlarmHigh");
313 if (warningAlarmHigh == msgData.end())
314 {
315 return 0;
316 }
317
318 bool asserted = false;
319 if (warningAlarmHigh != msgData.end())
320 {
321 asserted = std::get<bool>(warningAlarmHigh->second);
322 }
323 owner->setFailed(asserted);
324 }
325#endif
Alex.Song8f73ad72021-10-07 00:18:27 +0800326 else if (msgSensor == "xyz.openbmc_project.State.Decorator.Availability")
327 {
328 auto available = msgData.find("Available");
329 if (available == msgData.end())
330 {
331 return 0;
332 }
333 bool asserted = std::get<bool>(available->second);
334 owner->setAvailable(asserted);
335 if (!asserted)
336 {
337 // A thermal controller will continue its PID calculation and not
338 // trigger a 'failsafe' when some inputs are unavailable.
339 // So, forced to clear the value here to prevent a historical
340 // value to participate in a latter PID calculation.
341 owner->updateValue(std::numeric_limits<double>::quiet_NaN(), true);
342 }
343 }
James Feist4b36f262020-07-07 16:56:41 -0700344 else if (msgSensor ==
345 "xyz.openbmc_project.State.Decorator.OperationalStatus")
346 {
347 auto functional = msgData.find("Functional");
348 if (functional == msgData.end())
349 {
350 return 0;
351 }
352 bool asserted = std::get<bool>(functional->second);
353 owner->setFunctional(asserted);
354 }
Patrick Venture863b9242018-03-08 08:29:23 -0800355
356 return 0;
357}
Patrick Ventured0c75662018-06-12 19:03:21 -0700358
Harvey.Wua1ae4fa2022-10-28 17:38:35 +0800359int dbusHandleSignal(sd_bus_message* msg, void* usrData,
360 [[maybe_unused]] sd_bus_error* err)
Patrick Ventured0c75662018-06-12 19:03:21 -0700361{
Patrick Williamsb228bc32022-07-22 19:26:56 -0500362 auto sdbpMsg = sdbusplus::message_t(msg);
Patrick Ventured0c75662018-06-12 19:03:21 -0700363 DbusPassive* obj = static_cast<DbusPassive*>(usrData);
364
Patrick Venture7af157b2018-10-30 11:24:40 -0700365 return handleSensorValue(sdbpMsg, obj);
Patrick Ventured0c75662018-06-12 19:03:21 -0700366}
Patrick Venturea0764872020-08-08 07:48:43 -0700367
368} // namespace pid_control