blob: f53ce52646b76772a8ed8bc3858d97cee736637e [file] [log] [blame]
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +05301#include "config.h"
2
Gunnar Mills94df8c92018-09-14 14:50:03 -05003#include "occ_manager.hpp"
4
5#include "i2c_occ.hpp"
Chicago Duanbb895cb2021-06-18 19:37:16 +08006#include "occ_dbus.hpp"
Gunnar Mills94df8c92018-09-14 14:50:03 -05007#include "utils.hpp"
8
George Liub5ca1012021-09-10 12:53:11 +08009#include <phosphor-logging/elog-errors.hpp>
10#include <phosphor-logging/log.hpp>
11#include <xyz/openbmc_project/Common/error.hpp>
12
Matt Spinlerd267cec2021-09-01 14:49:19 -050013#include <chrono>
Chicago Duanbb895cb2021-06-18 19:37:16 +080014#include <cmath>
George Liubcef3b42021-09-10 12:39:02 +080015#include <filesystem>
Chicago Duanbb895cb2021-06-18 19:37:16 +080016#include <regex>
Gunnar Mills94df8c92018-09-14 14:50:03 -050017
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +053018namespace open_power
19{
20namespace occ
21{
22
Matt Spinler8b8abee2021-08-25 15:18:21 -050023constexpr uint32_t fruTypeNotAvailable = 0xFF;
Matt Spinlera26f1522021-08-25 15:50:20 -050024constexpr auto fruTypeSuffix = "fru_type";
25constexpr auto faultSuffix = "fault";
26constexpr auto inputSuffix = "input";
Matt Spinler8b8abee2021-08-25 15:18:21 -050027
Chris Caina8857c52021-01-27 11:53:05 -060028using namespace phosphor::logging;
29
Matt Spinlera26f1522021-08-25 15:50:20 -050030template <typename T>
31T readFile(const std::string& path)
32{
33 std::ifstream ifs;
34 ifs.exceptions(std::ifstream::failbit | std::ifstream::badbit |
35 std::ifstream::eofbit);
36 T data;
37
38 try
39 {
40 ifs.open(path);
41 ifs >> data;
42 ifs.close();
43 }
44 catch (const std::exception& e)
45 {
46 auto err = errno;
47 throw std::system_error(err, std::generic_category());
48 }
49
50 return data;
51}
52
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +053053void Manager::findAndCreateObjects()
54{
Matt Spinlerd267cec2021-09-01 14:49:19 -050055#ifndef POWER10
Deepak Kodihalli370f06b2017-10-25 04:26:07 -050056 for (auto id = 0; id < MAX_CPUS; ++id)
57 {
Deepak Kodihalli30417a12017-12-04 00:54:01 -060058 // Create one occ per cpu
59 auto occ = std::string(OCC_NAME) + std::to_string(id);
60 createObjects(occ);
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +053061 }
Matt Spinlerd267cec2021-09-01 14:49:19 -050062#else
63 // Create the OCCs based on on the /dev/occX devices
64 auto occs = findOCCsInDev();
65
66 if (occs.empty() || (prevOCCSearch.size() != occs.size()))
67 {
68 // Something changed or no OCCs yet, try again in 10s.
69 // Note on the first pass prevOCCSearch will be empty,
70 // so there will be at least one delay to give things
71 // a chance to settle.
72 prevOCCSearch = occs;
73
74 using namespace std::literals::chrono_literals;
75 discoverTimer->restartOnce(10s);
76 }
77 else
78 {
79 discoverTimer.reset();
80
81 // createObjects requires OCC0 first.
82 std::sort(occs.begin(), occs.end());
83
84 for (auto id : occs)
85 {
86 createObjects(std::string(OCC_NAME) + std::to_string(id));
87 }
88 }
89#endif
90}
91
92std::vector<int> Manager::findOCCsInDev()
93{
94 std::vector<int> occs;
95 std::regex expr{R"(occ(\d+)$)"};
96
97 for (auto& file : fs::directory_iterator("/dev"))
98 {
99 std::smatch match;
100 std::string path{file.path().string()};
101 if (std::regex_search(path, match, expr))
102 {
103 auto num = std::stoi(match[1].str());
104
105 // /dev numbering starts at 1, ours starts at 0.
106 occs.push_back(num - 1);
107 }
108 }
109
110 return occs;
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530111}
112
113int Manager::cpuCreated(sdbusplus::message::message& msg)
114{
George Liubcef3b42021-09-10 12:39:02 +0800115 namespace fs = std::filesystem;
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530116
117 sdbusplus::message::object_path o;
118 msg.read(o);
119 fs::path cpuPath(std::string(std::move(o)));
120
121 auto name = cpuPath.filename().string();
122 auto index = name.find(CPU_NAME);
123 name.replace(index, std::strlen(CPU_NAME), OCC_NAME);
124
125 createObjects(name);
126
127 return 0;
128}
129
130void Manager::createObjects(const std::string& occ)
131{
132 auto path = fs::path(OCC_CONTROL_ROOT) / occ;
133
134 passThroughObjects.emplace_back(
George Liuf3b75142021-06-10 11:22:50 +0800135 std::make_unique<PassThrough>(path.c_str()));
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530136
Gunnar Mills94df8c92018-09-14 14:50:03 -0500137 statusObjects.emplace_back(std::make_unique<Status>(
George Liuf3b75142021-06-10 11:22:50 +0800138 event, path.c_str(), *this,
Gunnar Mills94df8c92018-09-14 14:50:03 -0500139 std::bind(std::mem_fn(&Manager::statusCallBack), this,
Tom Joseph00325232020-07-29 17:51:48 +0530140 std::placeholders::_1)
141#ifdef PLDM
142 ,
143 std::bind(std::mem_fn(&pldm::Interface::resetOCC), pldmHandle.get(),
144 std::placeholders::_1)
145#endif
146 ));
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530147
148 // Create the power cap monitor object for master occ (0)
149 if (!pcap)
150 {
151 pcap = std::make_unique<open_power::occ::powercap::PowerCap>(
George Liuf3b75142021-06-10 11:22:50 +0800152 *statusObjects.front());
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530153 }
Chris Cain78e86012021-03-04 16:15:31 -0600154
155#ifdef POWER10
156 // Create the power mode monitor object for master occ (0)
157 if (!pmode)
158 {
159 pmode = std::make_unique<open_power::occ::powermode::PowerMode>(
160 *statusObjects.front());
161 }
162#endif
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530163}
164
165void Manager::statusCallBack(bool status)
166{
Gunnar Mills94df8c92018-09-14 14:50:03 -0500167 using InternalFailure =
168 sdbusplus::xyz::openbmc_project::Common::Error::InternalFailure;
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530169
170 // At this time, it won't happen but keeping it
171 // here just in case something changes in the future
172 if ((activeCount == 0) && (!status))
173 {
174 log<level::ERR>("Invalid update on OCCActive");
175 elog<InternalFailure>();
176 }
177
178 activeCount += status ? 1 : -1;
Eddie Jamesdae2d942017-12-20 10:50:03 -0600179
180 // Only start presence detection if all the OCCs are bound
181 if (activeCount == statusObjects.size())
182 {
Gunnar Mills94df8c92018-09-14 14:50:03 -0500183 for (auto& obj : statusObjects)
Eddie Jamesdae2d942017-12-20 10:50:03 -0600184 {
185 obj->addPresenceWatchMaster();
186 }
187 }
Chris Caina8857c52021-01-27 11:53:05 -0600188
189 if ((!_pollTimer->isEnabled()) && (activeCount > 0))
190 {
George Liub5ca1012021-09-10 12:53:11 +0800191 log<level::INFO>(
192 fmt::format(
193 "Manager::statusCallBack(): {} OCCs will be polled every {} seconds",
194 activeCount, pollInterval)
195 .c_str());
Chris Caina8857c52021-01-27 11:53:05 -0600196
197 // Send poll and start OCC poll timer
198 pollerTimerExpired();
199 }
200 else if ((_pollTimer->isEnabled()) && (activeCount == 0))
201 {
202 // Stop OCC poll timer
George Liub5ca1012021-09-10 12:53:11 +0800203 log<level::INFO>(
204 "Manager::statusCallBack(): OCCs are not running, stopping poll timer");
Chris Caina8857c52021-01-27 11:53:05 -0600205 _pollTimer->setEnabled(false);
Matt Spinler53f68142021-08-25 15:47:31 -0500206
207#ifdef READ_OCC_SENSORS
208 for (auto& obj : statusObjects)
209 {
210 setSensorValueToNaN(obj->getOccInstanceID());
211 }
212#endif
Chris Caina8857c52021-01-27 11:53:05 -0600213 }
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530214}
215
216#ifdef I2C_OCC
217void Manager::initStatusObjects()
218{
219 // Make sure we have a valid path string
220 static_assert(sizeof(DEV_PATH) != 0);
221
222 auto deviceNames = i2c_occ::getOccHwmonDevices(DEV_PATH);
Lei YU41470e52017-11-30 16:03:50 +0800223 auto occMasterName = deviceNames.front();
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530224 for (auto& name : deviceNames)
225 {
226 i2c_occ::i2cToDbus(name);
Lei YUb5259a12017-09-01 16:22:40 +0800227 name = std::string(OCC_NAME) + '_' + name;
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530228 auto path = fs::path(OCC_CONTROL_ROOT) / name;
229 statusObjects.emplace_back(
George Liuf3b75142021-06-10 11:22:50 +0800230 std::make_unique<Status>(event, path.c_str(), *this));
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530231 }
Lei YU41470e52017-11-30 16:03:50 +0800232 // The first device is master occ
233 pcap = std::make_unique<open_power::occ::powercap::PowerCap>(
George Liuf3b75142021-06-10 11:22:50 +0800234 *statusObjects.front(), occMasterName);
Chris Cain78e86012021-03-04 16:15:31 -0600235#ifdef POWER10
236 pmode = std::make_unique<open_power::occ::powermode::PowerMode>(
237 *statusObjects.front());
238#endif
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530239}
240#endif
241
Tom Joseph815f9f52020-07-27 12:12:13 +0530242#ifdef PLDM
243bool Manager::updateOCCActive(instanceID instance, bool status)
244{
245 return (statusObjects[instance])->occActive(status);
246}
247#endif
248
Chris Caina8857c52021-01-27 11:53:05 -0600249void Manager::pollerTimerExpired()
250{
251 if (activeCount == 0)
252 {
253 // No OCCs running, so poll timer will not be restarted
George Liub5ca1012021-09-10 12:53:11 +0800254 log<level::INFO>(
255 "Manager::pollerTimerExpire(): No OCCs running, poll timer not restarted");
Chris Caina8857c52021-01-27 11:53:05 -0600256 }
257
258 if (!_pollTimer)
259 {
260 log<level::ERR>(
261 "Manager::pollerTimerExpired() ERROR: Timer not defined");
262 return;
263 }
264
265 for (auto& obj : statusObjects)
266 {
267 // Read sysfs to force kernel to poll OCC
268 obj->readOccState();
Chicago Duanbb895cb2021-06-18 19:37:16 +0800269
270#ifdef READ_OCC_SENSORS
271 // Read occ sensor values
272 auto id = obj->getOccInstanceID();
273 if (!obj->occActive())
274 {
275 // Occ not activated
276 setSensorValueToNaN(id);
277 continue;
278 }
279 getSensorValues(id, obj->isMasterOcc());
280#endif
Chris Caina8857c52021-01-27 11:53:05 -0600281 }
282
283 // Restart OCC poll timer
284 _pollTimer->restartOnce(std::chrono::seconds(pollInterval));
285}
286
Chicago Duanbb895cb2021-06-18 19:37:16 +0800287#ifdef READ_OCC_SENSORS
288void Manager::readTempSensors(const fs::path& path, uint32_t id)
289{
Chicago Duanbb895cb2021-06-18 19:37:16 +0800290 std::regex expr{"temp\\d+_label$"}; // Example: temp5_label
291 for (auto& file : fs::directory_iterator(path))
292 {
293 if (!std::regex_search(file.path().string(), expr))
294 {
295 continue;
296 }
Chicago Duanbb895cb2021-06-18 19:37:16 +0800297
Matt Spinlera26f1522021-08-25 15:50:20 -0500298 uint32_t labelValue{0};
299
300 try
301 {
302 labelValue = readFile<uint32_t>(file.path());
303 }
304 catch (const std::system_error& e)
305 {
306 log<level::DEBUG>(
307 fmt::format("readTempSensors: Failed reading {}, errno = {}",
308 file.path().string(), e.code().value())
309 .c_str());
Chicago Duanbb895cb2021-06-18 19:37:16 +0800310 continue;
311 }
Chicago Duanbb895cb2021-06-18 19:37:16 +0800312
313 const std::string& tempLabel = "label";
314 const std::string filePathString = file.path().string().substr(
315 0, file.path().string().length() - tempLabel.length());
Matt Spinlera26f1522021-08-25 15:50:20 -0500316
317 uint32_t fruTypeValue{0};
318 try
Chicago Duanbb895cb2021-06-18 19:37:16 +0800319 {
Matt Spinlera26f1522021-08-25 15:50:20 -0500320 fruTypeValue = readFile<uint32_t>(filePathString + fruTypeSuffix);
321 }
322 catch (const std::system_error& e)
323 {
Chicago Duanbb895cb2021-06-18 19:37:16 +0800324 log<level::DEBUG>(
Matt Spinlera26f1522021-08-25 15:50:20 -0500325 fmt::format("readTempSensors: Failed reading {}, errno = {}",
326 filePathString + fruTypeSuffix, e.code().value())
Chicago Duanbb895cb2021-06-18 19:37:16 +0800327 .c_str());
328 continue;
329 }
Chicago Duanbb895cb2021-06-18 19:37:16 +0800330
331 std::string sensorPath =
332 OCC_SENSORS_ROOT + std::string("/temperature/");
333
334 if (fruTypeValue == VRMVdd)
335 {
336 sensorPath.append("vrm_vdd" + std::to_string(id) + "_temp");
337 }
338 else
339 {
Matt Spinler14d14022021-08-25 15:38:29 -0500340 uint16_t type = (labelValue & 0xFF000000) >> 24;
341 uint16_t instanceID = labelValue & 0x0000FFFF;
Chicago Duanbb895cb2021-06-18 19:37:16 +0800342
343 if (type == OCC_DIMM_TEMP_SENSOR_TYPE)
344 {
Matt Spinler8b8abee2021-08-25 15:18:21 -0500345 if (fruTypeValue == fruTypeNotAvailable)
346 {
347 // Not all DIMM related temps are available to read
348 // (no _input file in this case)
349 continue;
350 }
Chicago Duanbb895cb2021-06-18 19:37:16 +0800351 auto iter = dimmTempSensorName.find(fruTypeValue);
352 if (iter == dimmTempSensorName.end())
353 {
George Liub5ca1012021-09-10 12:53:11 +0800354 log<level::ERR>(
355 fmt::format(
356 "readTempSensors: Fru type error! fruTypeValue = {}) ",
357 fruTypeValue)
358 .c_str());
Chicago Duanbb895cb2021-06-18 19:37:16 +0800359 continue;
360 }
361
362 sensorPath.append("dimm" + std::to_string(instanceID) +
363 iter->second);
364 }
365 else if (type == OCC_CPU_TEMP_SENSOR_TYPE)
366 {
367 if (fruTypeValue != processorCore)
368 {
Matt Spinlerabbcfc52021-08-25 15:22:22 -0500369 // TODO: support IO ring temp
Chicago Duanbb895cb2021-06-18 19:37:16 +0800370 continue;
371 }
372
373 sensorPath.append("proc" + std::to_string(id) + "_core" +
374 std::to_string(instanceID) + "_temp");
375 }
376 else
377 {
378 continue;
379 }
380 }
381
Matt Spinlera26f1522021-08-25 15:50:20 -0500382 uint32_t faultValue{0};
383 try
Chicago Duanbb895cb2021-06-18 19:37:16 +0800384 {
Matt Spinlera26f1522021-08-25 15:50:20 -0500385 faultValue = readFile<uint32_t>(filePathString + faultSuffix);
386 }
387 catch (const std::system_error& e)
388 {
389 log<level::DEBUG>(
390 fmt::format("readTempSensors: Failed reading {}, errno = {}",
391 filePathString + faultSuffix, e.code().value())
392 .c_str());
393 continue;
Chicago Duanbb895cb2021-06-18 19:37:16 +0800394 }
395
Matt Spinlera26f1522021-08-25 15:50:20 -0500396 if (faultValue != 0)
Chicago Duanbb895cb2021-06-18 19:37:16 +0800397 {
Chicago Duanbb895cb2021-06-18 19:37:16 +0800398 open_power::occ::dbus::OccDBusSensors::getOccDBus().setValue(
Matt Spinlera26f1522021-08-25 15:50:20 -0500399 sensorPath, std::numeric_limits<double>::quiet_NaN());
Chicago Duanbb895cb2021-06-18 19:37:16 +0800400
401 open_power::occ::dbus::OccDBusSensors::getOccDBus()
Matt Spinlera26f1522021-08-25 15:50:20 -0500402 .setOperationalStatus(sensorPath, false);
Chicago Duanbb895cb2021-06-18 19:37:16 +0800403
Matt Spinlera26f1522021-08-25 15:50:20 -0500404 continue;
Chicago Duanbb895cb2021-06-18 19:37:16 +0800405 }
Matt Spinlera26f1522021-08-25 15:50:20 -0500406
407 double tempValue{0};
408
409 try
Chicago Duanbb895cb2021-06-18 19:37:16 +0800410 {
Matt Spinlera26f1522021-08-25 15:50:20 -0500411 tempValue = readFile<double>(filePathString + inputSuffix);
Chicago Duanbb895cb2021-06-18 19:37:16 +0800412 }
Matt Spinlera26f1522021-08-25 15:50:20 -0500413 catch (const std::system_error& e)
414 {
415 log<level::DEBUG>(
416 fmt::format("readTempSensors: Failed reading {}, errno = {}",
417 filePathString + inputSuffix, e.code().value())
418 .c_str());
419 continue;
420 }
421
422 open_power::occ::dbus::OccDBusSensors::getOccDBus().setValue(
423 sensorPath, tempValue * std::pow(10, -3));
424
425 open_power::occ::dbus::OccDBusSensors::getOccDBus()
426 .setOperationalStatus(sensorPath, true);
427
428 existingSensors[sensorPath] = id;
Chicago Duanbb895cb2021-06-18 19:37:16 +0800429 }
430 return;
431}
432
433std::optional<std::string>
434 Manager::getPowerLabelFunctionID(const std::string& value)
435{
436 // If the value is "system", then the FunctionID is "system".
437 if (value == "system")
438 {
439 return value;
440 }
441
442 // If the value is not "system", then the label value have 3 numbers, of
443 // which we only care about the middle one:
444 // <sensor id>_<function id>_<apss channel>
445 // eg: The value is "0_10_5" , then the FunctionID is "10".
446 if (value.find("_") == std::string::npos)
447 {
448 return std::nullopt;
449 }
450
451 auto powerLabelValue = value.substr((value.find("_") + 1));
452
453 if (powerLabelValue.find("_") == std::string::npos)
454 {
455 return std::nullopt;
456 }
457
458 return powerLabelValue.substr(0, powerLabelValue.find("_"));
459}
460
461void Manager::readPowerSensors(const fs::path& path, uint32_t id)
462{
Chicago Duanbb895cb2021-06-18 19:37:16 +0800463 std::regex expr{"power\\d+_label$"}; // Example: power5_label
464 for (auto& file : fs::directory_iterator(path))
465 {
466 if (!std::regex_search(file.path().string(), expr))
467 {
468 continue;
469 }
Chicago Duanbb895cb2021-06-18 19:37:16 +0800470
Matt Spinlera26f1522021-08-25 15:50:20 -0500471 std::string labelValue;
472 try
473 {
474 labelValue = readFile<std::string>(file.path());
475 }
476 catch (const std::system_error& e)
477 {
478 log<level::DEBUG>(
479 fmt::format("readPowerSensors: Failed reading {}, errno = {}",
480 file.path().string(), e.code().value())
481 .c_str());
Chicago Duanbb895cb2021-06-18 19:37:16 +0800482 continue;
483 }
Chicago Duanbb895cb2021-06-18 19:37:16 +0800484
485 auto functionID = getPowerLabelFunctionID(labelValue);
486 if (functionID == std::nullopt)
487 {
488 continue;
489 }
490
491 const std::string& tempLabel = "label";
492 const std::string filePathString = file.path().string().substr(
493 0, file.path().string().length() - tempLabel.length());
494
495 std::string sensorPath = OCC_SENSORS_ROOT + std::string("/power/");
496
497 auto iter = powerSensorName.find(*functionID);
498 if (iter == powerSensorName.end())
499 {
500 continue;
501 }
502 sensorPath.append(iter->second);
503
Matt Spinlera26f1522021-08-25 15:50:20 -0500504 double tempValue{0};
505
506 try
Chicago Duanbb895cb2021-06-18 19:37:16 +0800507 {
Matt Spinlera26f1522021-08-25 15:50:20 -0500508 tempValue = readFile<double>(filePathString + inputSuffix);
Chicago Duanbb895cb2021-06-18 19:37:16 +0800509 }
Matt Spinlera26f1522021-08-25 15:50:20 -0500510 catch (const std::system_error& e)
Chicago Duanbb895cb2021-06-18 19:37:16 +0800511 {
Chicago Duanbb895cb2021-06-18 19:37:16 +0800512 log<level::DEBUG>(
Matt Spinlera26f1522021-08-25 15:50:20 -0500513 fmt::format("readTempSensors: Failed reading {}, errno = {}",
514 filePathString + inputSuffix, e.code().value())
Chicago Duanbb895cb2021-06-18 19:37:16 +0800515 .c_str());
Matt Spinlera26f1522021-08-25 15:50:20 -0500516 continue;
Chicago Duanbb895cb2021-06-18 19:37:16 +0800517 }
Matt Spinlera26f1522021-08-25 15:50:20 -0500518
519 open_power::occ::dbus::OccDBusSensors::getOccDBus().setValue(
520 sensorPath, tempValue * std::pow(10, -3) * std::pow(10, -3));
521
522 open_power::occ::dbus::OccDBusSensors::getOccDBus()
523 .setOperationalStatus(sensorPath, true);
524
525 existingSensors[sensorPath] = id;
Chicago Duanbb895cb2021-06-18 19:37:16 +0800526 }
527 return;
528}
529
530void Manager::setSensorValueToNaN(uint32_t id)
531{
532 for (const auto& [sensorPath, occId] : existingSensors)
533 {
534 if (occId == id)
535 {
536 open_power::occ::dbus::OccDBusSensors::getOccDBus().setValue(
537 sensorPath, std::numeric_limits<double>::quiet_NaN());
538 }
539 }
540 return;
541}
542
543void Manager::getSensorValues(uint32_t id, bool masterOcc)
544{
545 const auto occ = std::string("occ-hwmon.") + std::to_string(id + 1);
546
547 fs::path fileName{OCC_HWMON_PATH + occ + "/hwmon/"};
548
549 // Need to get the hwmonXX directory name, there better only be 1 dir
550 assert(std::distance(fs::directory_iterator(fileName),
551 fs::directory_iterator{}) == 1);
552 // Now set our path to this full path, including this hwmonXX directory
553 fileName = fs::path(*fs::directory_iterator(fileName));
554
555 // Read temperature sensors
556 readTempSensors(fileName, id);
557
558 if (masterOcc)
559 {
560 // Read power sensors
561 readPowerSensors(fileName, id);
562 }
563
564 return;
565}
566#endif
567
Vishwanatha Subbannadfc7ec72017-09-07 18:18:01 +0530568} // namespace occ
569} // namespace open_power