Brandon Kim | dab96f1 | 2021-02-18 11:21:37 -0800 | [diff] [blame] | 1 | // Copyright 2021 Google LLC |
| 2 | // |
| 3 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 | // you may not use this file except in compliance with the License. |
| 5 | // You may obtain a copy of the License at |
| 6 | // |
| 7 | // http://www.apache.org/licenses/LICENSE-2.0 |
| 8 | // |
| 9 | // Unless required by applicable law or agreed to in writing, software |
| 10 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 11 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 12 | // See the License for the specific language governing permissions and |
| 13 | // limitations under the License. |
| 14 | |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 15 | #include "metric.hpp" |
| 16 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 17 | #include "metricblob.pb.n.h" |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 18 | |
| 19 | #include "util.hpp" |
| 20 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 21 | #include <pb_encode.h> |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 22 | #include <sys/statvfs.h> |
| 23 | |
| 24 | #include <phosphor-logging/log.hpp> |
| 25 | |
| 26 | #include <cstdint> |
| 27 | #include <filesystem> |
| 28 | #include <sstream> |
| 29 | #include <string> |
| 30 | #include <string_view> |
| 31 | |
| 32 | namespace metric_blob |
| 33 | { |
| 34 | |
| 35 | using phosphor::logging::entry; |
| 36 | using phosphor::logging::log; |
| 37 | using level = phosphor::logging::level; |
| 38 | |
| 39 | BmcHealthSnapshot::BmcHealthSnapshot() : |
| 40 | done(false), stringId(0), ticksPerSec(0) |
| 41 | {} |
| 42 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 43 | template <typename T> |
Patrick Williams | c66ebc3 | 2024-08-16 15:21:56 -0400 | [diff] [blame] | 44 | static constexpr auto pbEncodeStr = |
| 45 | [](pb_ostream_t* stream, const pb_field_iter_t* field, |
| 46 | void* const* arg) noexcept { |
| 47 | static_assert(sizeof(*std::declval<T>().data()) == sizeof(pb_byte_t)); |
| 48 | const auto& s = *reinterpret_cast<const T*>(*arg); |
| 49 | return pb_encode_tag_for_field(stream, field) && |
| 50 | pb_encode_string(stream, |
| 51 | reinterpret_cast<const pb_byte_t*>(s.data()), |
| 52 | s.size()); |
| 53 | }; |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 54 | |
| 55 | template <typename T> |
| 56 | static pb_callback_t pbStrEncoder(const T& t) noexcept |
| 57 | { |
| 58 | return {{.encode = pbEncodeStr<T>}, const_cast<T*>(&t)}; |
| 59 | } |
| 60 | |
| 61 | template <auto fields, typename T> |
Patrick Williams | c66ebc3 | 2024-08-16 15:21:56 -0400 | [diff] [blame] | 62 | static constexpr auto pbEncodeSubs = |
| 63 | [](pb_ostream_t* stream, const pb_field_iter_t* field, |
| 64 | void* const* arg) noexcept { |
| 65 | for (const auto& sub : *reinterpret_cast<const std::vector<T>*>(*arg)) |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 66 | { |
Patrick Williams | c66ebc3 | 2024-08-16 15:21:56 -0400 | [diff] [blame] | 67 | if (!pb_encode_tag_for_field(stream, field) || |
| 68 | !pb_encode_submessage(stream, fields, &sub)) |
| 69 | { |
| 70 | return false; |
| 71 | } |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 72 | } |
Patrick Williams | c66ebc3 | 2024-08-16 15:21:56 -0400 | [diff] [blame] | 73 | return true; |
| 74 | }; |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 75 | |
| 76 | template <auto fields, typename T> |
| 77 | static pb_callback_t pbSubsEncoder(const std::vector<T>& t) |
| 78 | { |
| 79 | return {{.encode = pbEncodeSubs<fields, T>}, |
| 80 | const_cast<std::vector<T>*>(&t)}; |
| 81 | } |
| 82 | |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 83 | struct ProcStatEntry |
| 84 | { |
| 85 | std::string cmdline; |
| 86 | std::string tcomm; |
| 87 | float utime; |
| 88 | float stime; |
| 89 | |
| 90 | // Processes with the longest utime + stime are ranked first. |
| 91 | // Tie breaking is done with cmdline then tcomm. |
| 92 | bool operator<(const ProcStatEntry& other) const |
| 93 | { |
| 94 | const float negTime = -(utime + stime); |
| 95 | const float negOtherTime = -(other.utime + other.stime); |
| 96 | return std::tie(negTime, cmdline, tcomm) < |
| 97 | std::tie(negOtherTime, other.cmdline, other.tcomm); |
| 98 | } |
| 99 | }; |
| 100 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 101 | static bmcmetrics_metricproto_BmcProcStatMetric getProcStatMetric( |
| 102 | BmcHealthSnapshot& obj, long ticksPerSec, |
| 103 | std::vector<bmcmetrics_metricproto_BmcProcStatMetric_BmcProcStat>& procs, |
| 104 | bool& use) noexcept |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 105 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 106 | if (ticksPerSec == 0) |
| 107 | { |
| 108 | return {}; |
| 109 | } |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 110 | constexpr std::string_view procPath = "/proc/"; |
| 111 | |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 112 | std::vector<ProcStatEntry> entries; |
| 113 | |
| 114 | for (const auto& procEntry : std::filesystem::directory_iterator(procPath)) |
| 115 | { |
| 116 | const std::string& path = procEntry.path(); |
| 117 | int pid = -1; |
| 118 | if (isNumericPath(path, pid)) |
| 119 | { |
| 120 | ProcStatEntry entry; |
| 121 | |
| 122 | try |
| 123 | { |
| 124 | entry.cmdline = getCmdLine(pid); |
| 125 | TcommUtimeStime t = getTcommUtimeStime(pid, ticksPerSec); |
| 126 | entry.tcomm = t.tcomm; |
| 127 | entry.utime = t.utime; |
| 128 | entry.stime = t.stime; |
| 129 | |
| 130 | entries.push_back(entry); |
| 131 | } |
| 132 | catch (const std::exception& e) |
| 133 | { |
| 134 | log<level::ERR>("Could not obtain process stats"); |
| 135 | } |
| 136 | } |
| 137 | } |
| 138 | |
| 139 | std::sort(entries.begin(), entries.end()); |
| 140 | |
| 141 | bool isOthers = false; |
| 142 | ProcStatEntry others; |
| 143 | others.cmdline = "(Others)"; |
| 144 | others.utime = others.stime = 0; |
| 145 | |
| 146 | // Only show this many processes and aggregate all remaining ones into |
| 147 | // "others" in order to keep the size of the snapshot reasonably small. |
| 148 | // With 10 process stat entries and 10 FD count entries, the size of the |
| 149 | // snapshot reaches around 1.5KiB. This is non-trivial, and we have to set |
| 150 | // the collection interval long enough so as not to over-stress the IPMI |
| 151 | // interface and the data collection service. The value of 10 is chosen |
| 152 | // empirically, it might be subject to adjustments when the system is |
| 153 | // launched later. |
| 154 | constexpr int topN = 10; |
| 155 | |
| 156 | for (size_t i = 0; i < entries.size(); ++i) |
| 157 | { |
| 158 | if (i >= topN) |
| 159 | { |
| 160 | isOthers = true; |
| 161 | } |
| 162 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 163 | const ProcStatEntry& entry = entries[i]; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 164 | |
| 165 | if (isOthers) |
| 166 | { |
| 167 | others.utime += entry.utime; |
| 168 | others.stime += entry.stime; |
| 169 | } |
| 170 | else |
| 171 | { |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 172 | std::string fullCmdline = entry.cmdline; |
| 173 | if (entry.tcomm.size() > 0) |
| 174 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 175 | fullCmdline += " "; |
| 176 | fullCmdline += entry.tcomm; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 177 | } |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 178 | procs.emplace_back( |
| 179 | bmcmetrics_metricproto_BmcProcStatMetric_BmcProcStat{ |
| 180 | .sidx_cmdline = obj.getStringID(fullCmdline), |
| 181 | .utime = entry.utime, |
| 182 | .stime = entry.stime, |
| 183 | }); |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 184 | } |
| 185 | } |
| 186 | |
| 187 | if (isOthers) |
| 188 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 189 | procs.emplace_back(bmcmetrics_metricproto_BmcProcStatMetric_BmcProcStat{ |
| 190 | .sidx_cmdline = obj.getStringID(others.cmdline), |
| 191 | .utime = others.utime, |
| 192 | .stime = others.stime, |
| 193 | |
| 194 | }); |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 195 | } |
| 196 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 197 | use = true; |
| 198 | return bmcmetrics_metricproto_BmcProcStatMetric{ |
| 199 | .stats = pbSubsEncoder< |
| 200 | bmcmetrics_metricproto_BmcProcStatMetric_BmcProcStat_fields>(procs), |
| 201 | }; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 202 | } |
| 203 | |
| 204 | int getFdCount(int pid) |
| 205 | { |
| 206 | const std::string& fdPath = "/proc/" + std::to_string(pid) + "/fd"; |
| 207 | return std::distance(std::filesystem::directory_iterator(fdPath), |
| 208 | std::filesystem::directory_iterator{}); |
| 209 | } |
| 210 | |
| 211 | struct FdStatEntry |
| 212 | { |
| 213 | int fdCount; |
| 214 | std::string cmdline; |
| 215 | std::string tcomm; |
| 216 | |
| 217 | // Processes with the largest fdCount goes first. |
| 218 | // Tie-breaking using cmdline then tcomm. |
| 219 | bool operator<(const FdStatEntry& other) const |
| 220 | { |
| 221 | const int negFdCount = -fdCount; |
| 222 | const int negOtherFdCount = -other.fdCount; |
| 223 | return std::tie(negFdCount, cmdline, tcomm) < |
| 224 | std::tie(negOtherFdCount, other.cmdline, other.tcomm); |
| 225 | } |
| 226 | }; |
| 227 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 228 | static bmcmetrics_metricproto_BmcFdStatMetric getFdStatMetric( |
| 229 | BmcHealthSnapshot& obj, long ticksPerSec, |
| 230 | std::vector<bmcmetrics_metricproto_BmcFdStatMetric_BmcFdStat>& fds, |
| 231 | bool& use) noexcept |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 232 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 233 | if (ticksPerSec == 0) |
| 234 | { |
| 235 | return {}; |
| 236 | } |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 237 | |
| 238 | // Sort by fd count, no tie-breaking |
| 239 | std::vector<FdStatEntry> entries; |
| 240 | |
| 241 | const std::string_view procPath = "/proc/"; |
| 242 | for (const auto& procEntry : std::filesystem::directory_iterator(procPath)) |
| 243 | { |
| 244 | const std::string& path = procEntry.path(); |
| 245 | int pid = 0; |
| 246 | FdStatEntry entry; |
| 247 | if (isNumericPath(path, pid)) |
| 248 | { |
| 249 | try |
| 250 | { |
| 251 | entry.fdCount = getFdCount(pid); |
| 252 | TcommUtimeStime t = getTcommUtimeStime(pid, ticksPerSec); |
| 253 | entry.cmdline = getCmdLine(pid); |
| 254 | entry.tcomm = t.tcomm; |
| 255 | entries.push_back(entry); |
| 256 | } |
| 257 | catch (const std::exception& e) |
| 258 | { |
| 259 | log<level::ERR>("Could not get file descriptor stats"); |
| 260 | } |
| 261 | } |
| 262 | } |
| 263 | |
| 264 | std::sort(entries.begin(), entries.end()); |
| 265 | |
| 266 | bool isOthers = false; |
| 267 | |
| 268 | // Only report the detailed fd count and cmdline for the top 10 entries, |
| 269 | // and collapse all others into "others". |
| 270 | constexpr int topN = 10; |
| 271 | |
| 272 | FdStatEntry others; |
| 273 | others.cmdline = "(Others)"; |
| 274 | others.fdCount = 0; |
| 275 | |
| 276 | for (size_t i = 0; i < entries.size(); ++i) |
| 277 | { |
| 278 | if (i >= topN) |
| 279 | { |
| 280 | isOthers = true; |
| 281 | } |
| 282 | |
| 283 | const FdStatEntry& entry = entries[i]; |
| 284 | if (isOthers) |
| 285 | { |
| 286 | others.fdCount += entry.fdCount; |
| 287 | } |
| 288 | else |
| 289 | { |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 290 | std::string fullCmdline = entry.cmdline; |
| 291 | if (entry.tcomm.size() > 0) |
| 292 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 293 | fullCmdline += " "; |
| 294 | fullCmdline += entry.tcomm; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 295 | } |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 296 | fds.emplace_back(bmcmetrics_metricproto_BmcFdStatMetric_BmcFdStat{ |
| 297 | .sidx_cmdline = obj.getStringID(fullCmdline), |
| 298 | .fd_count = entry.fdCount, |
| 299 | }); |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 300 | } |
| 301 | } |
| 302 | |
| 303 | if (isOthers) |
| 304 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 305 | fds.emplace_back(bmcmetrics_metricproto_BmcFdStatMetric_BmcFdStat{ |
| 306 | .sidx_cmdline = obj.getStringID(others.cmdline), |
| 307 | .fd_count = others.fdCount, |
| 308 | }); |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 309 | } |
| 310 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 311 | use = true; |
| 312 | return bmcmetrics_metricproto_BmcFdStatMetric{ |
| 313 | .stats = pbSubsEncoder< |
| 314 | bmcmetrics_metricproto_BmcFdStatMetric_BmcFdStat_fields>(fds), |
| 315 | }; |
| 316 | } |
| 317 | |
Willy Tu | 4dba220 | 2024-04-08 21:27:20 +0000 | [diff] [blame] | 318 | static bmcmetrics_metricproto_BmcECCMetric getECCMetric(bool& use) noexcept |
| 319 | { |
| 320 | EccCounts eccCounts; |
| 321 | use = getECCErrorCounts(eccCounts); |
| 322 | if (!use) |
| 323 | { |
| 324 | return {}; |
| 325 | } |
| 326 | return bmcmetrics_metricproto_BmcECCMetric{ |
| 327 | .correctable_error_count = eccCounts.correctableErrCount, |
| 328 | .uncorrectable_error_count = eccCounts.uncorrectableErrCount, |
| 329 | }; |
| 330 | } |
| 331 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 332 | static bmcmetrics_metricproto_BmcMemoryMetric getMemMetric() noexcept |
| 333 | { |
| 334 | bmcmetrics_metricproto_BmcMemoryMetric ret = {}; |
| 335 | auto data = readFileThenGrepIntoString("/proc/meminfo"); |
| 336 | int value; |
| 337 | if (parseMeminfoValue(data, "MemAvailable:", value)) |
| 338 | { |
| 339 | ret.mem_available = value; |
| 340 | } |
| 341 | if (parseMeminfoValue(data, "Slab:", value)) |
| 342 | { |
| 343 | ret.slab = value; |
| 344 | } |
| 345 | |
| 346 | if (parseMeminfoValue(data, "KernelStack:", value)) |
| 347 | { |
| 348 | ret.kernel_stack = value; |
| 349 | } |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 350 | return ret; |
| 351 | } |
| 352 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 353 | static bmcmetrics_metricproto_BmcUptimeMetric |
| 354 | getUptimeMetric(bool& use) noexcept |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 355 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 356 | bmcmetrics_metricproto_BmcUptimeMetric ret = {}; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 357 | |
Michael Shen | b63d631 | 2021-04-26 13:30:57 +0800 | [diff] [blame] | 358 | double uptime = 0; |
Michael Shen | b63d631 | 2021-04-26 13:30:57 +0800 | [diff] [blame] | 359 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 360 | auto data = readFileThenGrepIntoString("/proc/uptime"); |
| 361 | double idleProcessTime = 0; |
| 362 | if (!parseProcUptime(data, uptime, idleProcessTime)) |
| 363 | { |
| 364 | log<level::ERR>("Error parsing /proc/uptime"); |
| 365 | return ret; |
| 366 | } |
| 367 | ret.uptime = uptime; |
| 368 | ret.idle_process_time = idleProcessTime; |
Michael Shen | b63d631 | 2021-04-26 13:30:57 +0800 | [diff] [blame] | 369 | } |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 370 | |
| 371 | BootTimesMonotonic btm; |
| 372 | if (!getBootTimesMonotonic(btm)) |
Michael Shen | b63d631 | 2021-04-26 13:30:57 +0800 | [diff] [blame] | 373 | { |
| 374 | log<level::ERR>("Could not get boot time"); |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 375 | return ret; |
| 376 | } |
| 377 | if (btm.firmwareTime == 0 && btm.powerOnSecCounterTime != 0) |
| 378 | { |
| 379 | ret.firmware_boot_time_sec = |
| 380 | static_cast<double>(btm.powerOnSecCounterTime) - uptime; |
Michael Shen | b63d631 | 2021-04-26 13:30:57 +0800 | [diff] [blame] | 381 | } |
| 382 | else |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 383 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 384 | ret.firmware_boot_time_sec = |
| 385 | static_cast<double>(btm.firmwareTime - btm.loaderTime) / 1e6; |
| 386 | } |
| 387 | ret.loader_boot_time_sec = static_cast<double>(btm.loaderTime) / 1e6; |
| 388 | if (btm.initrdTime != 0) |
| 389 | { |
| 390 | ret.kernel_boot_time_sec = static_cast<double>(btm.initrdTime) / 1e6; |
| 391 | ret.initrd_boot_time_sec = |
| 392 | static_cast<double>(btm.userspaceTime - btm.initrdTime) / 1e6; |
| 393 | ret.userspace_boot_time_sec = |
| 394 | static_cast<double>(btm.finishTime - btm.userspaceTime) / 1e6; |
| 395 | } |
| 396 | else |
| 397 | { |
| 398 | ret.kernel_boot_time_sec = static_cast<double>(btm.userspaceTime) / 1e6; |
| 399 | ret.initrd_boot_time_sec = 0; |
| 400 | ret.userspace_boot_time_sec = |
| 401 | static_cast<double>(btm.finishTime - btm.userspaceTime) / 1e6; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 402 | } |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 403 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 404 | use = true; |
| 405 | return ret; |
| 406 | } |
| 407 | |
| 408 | static bmcmetrics_metricproto_BmcDiskSpaceMetric |
| 409 | getStorageMetric(bool& use) noexcept |
| 410 | { |
| 411 | bmcmetrics_metricproto_BmcDiskSpaceMetric ret = {}; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 412 | struct statvfs fiData; |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 413 | if (statvfs("/", &fiData) < 0) |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 414 | { |
| 415 | log<level::ERR>("Could not call statvfs"); |
| 416 | } |
| 417 | else |
| 418 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 419 | ret.rwfs_kib_available = (fiData.f_bsize * fiData.f_bfree) / 1024; |
| 420 | use = true; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 421 | } |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 422 | return ret; |
| 423 | } |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 424 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 425 | void BmcHealthSnapshot::doWork() |
| 426 | { |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 427 | // The next metrics require a sane ticks_per_sec value, typically 100 on |
| 428 | // the BMC. In the very rare circumstance when it's 0, exit early and return |
| 429 | // a partially complete snapshot (no process). |
| 430 | ticksPerSec = getTicksPerSec(); |
| 431 | |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 432 | static constexpr auto stcb = [](pb_ostream_t* stream, |
| 433 | const pb_field_t* field, |
| 434 | void* const* arg) noexcept { |
| 435 | auto& self = *reinterpret_cast<BmcHealthSnapshot*>(*arg); |
| 436 | std::vector<std::string_view> strs(self.stringTable.size()); |
| 437 | for (const auto& [str, i] : self.stringTable) |
| 438 | { |
| 439 | strs[i] = str; |
| 440 | } |
| 441 | for (auto& str : strs) |
| 442 | { |
| 443 | bmcmetrics_metricproto_BmcStringTable_StringEntry msg = { |
| 444 | .value = pbStrEncoder(str), |
| 445 | }; |
| 446 | if (!pb_encode_tag_for_field(stream, field) || |
| 447 | !pb_encode_submessage( |
| 448 | stream, |
| 449 | bmcmetrics_metricproto_BmcStringTable_StringEntry_fields, |
| 450 | &msg)) |
| 451 | { |
| 452 | return false; |
| 453 | } |
| 454 | } |
| 455 | return true; |
| 456 | }; |
| 457 | std::vector<bmcmetrics_metricproto_BmcProcStatMetric_BmcProcStat> procs; |
| 458 | std::vector<bmcmetrics_metricproto_BmcFdStatMetric_BmcFdStat> fds; |
| 459 | bmcmetrics_metricproto_BmcMetricSnapshot snapshot = { |
| 460 | .has_string_table = true, |
| 461 | .string_table = |
| 462 | { |
| 463 | .entries = {{.encode = stcb}, this}, |
| 464 | }, |
| 465 | .has_memory_metric = true, |
| 466 | .memory_metric = getMemMetric(), |
| 467 | .has_uptime_metric = false, |
| 468 | .uptime_metric = getUptimeMetric(snapshot.has_uptime_metric), |
| 469 | .has_storage_space_metric = false, |
| 470 | .storage_space_metric = |
| 471 | getStorageMetric(snapshot.has_storage_space_metric), |
| 472 | .has_procstat_metric = false, |
| 473 | .procstat_metric = getProcStatMetric(*this, ticksPerSec, procs, |
| 474 | snapshot.has_procstat_metric), |
| 475 | .has_fdstat_metric = false, |
| 476 | .fdstat_metric = getFdStatMetric(*this, ticksPerSec, fds, |
| 477 | snapshot.has_fdstat_metric), |
Willy Tu | 4dba220 | 2024-04-08 21:27:20 +0000 | [diff] [blame] | 478 | .has_ecc_metric = false, |
| 479 | .ecc_metric = getECCMetric(snapshot.has_ecc_metric), |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 480 | }; |
| 481 | pb_ostream_t nost = {}; |
| 482 | if (!pb_encode(&nost, bmcmetrics_metricproto_BmcMetricSnapshot_fields, |
| 483 | &snapshot)) |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 484 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 485 | auto msg = std::format("Getting pb size: {}", PB_GET_ERROR(&nost)); |
| 486 | log<level::ERR>(msg.c_str()); |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 487 | return; |
| 488 | } |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 489 | pbDump.resize(nost.bytes_written); |
| 490 | auto ost = pb_ostream_from_buffer( |
| 491 | reinterpret_cast<pb_byte_t*>(pbDump.data()), pbDump.size()); |
| 492 | if (!pb_encode(&ost, bmcmetrics_metricproto_BmcMetricSnapshot_fields, |
| 493 | &snapshot)) |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 494 | { |
William A. Kennington III | 7f49370 | 2024-02-08 01:09:11 -0800 | [diff] [blame] | 495 | auto msg = std::format("Writing pb msg: {}", PB_GET_ERROR(&ost)); |
| 496 | log<level::ERR>(msg.c_str()); |
| 497 | return; |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 498 | } |
Sui Chen | 03eba28 | 2021-02-11 11:35:56 -0800 | [diff] [blame] | 499 | done = true; |
| 500 | } |
| 501 | |
| 502 | // BmcBlobSessionStat (9) but passing meta as reference instead of pointer, |
| 503 | // since the metadata must not be null at this point. |
| 504 | bool BmcHealthSnapshot::stat(blobs::BlobMeta& meta) |
| 505 | { |
| 506 | if (!done) |
| 507 | { |
| 508 | // Bits 8~15 are blob-specific state flags. |
| 509 | // For this blob, bit 8 is set when metric collection is still in |
| 510 | // progress. |
| 511 | meta.blobState |= (1 << 8); |
| 512 | } |
| 513 | else |
| 514 | { |
| 515 | meta.blobState = 0; |
| 516 | meta.blobState = blobs::StateFlags::open_read; |
| 517 | meta.size = pbDump.size(); |
| 518 | } |
| 519 | return true; |
| 520 | } |
| 521 | |
| 522 | std::string_view BmcHealthSnapshot::read(uint32_t offset, |
| 523 | uint32_t requestedSize) |
| 524 | { |
| 525 | uint32_t size = static_cast<uint32_t>(pbDump.size()); |
| 526 | if (offset >= size) |
| 527 | { |
| 528 | return {}; |
| 529 | } |
| 530 | return std::string_view(pbDump.data() + offset, |
| 531 | std::min(requestedSize, size - offset)); |
| 532 | } |
| 533 | |
| 534 | int BmcHealthSnapshot::getStringID(const std::string_view s) |
| 535 | { |
| 536 | int ret = 0; |
| 537 | auto itr = stringTable.find(s.data()); |
| 538 | if (itr == stringTable.end()) |
| 539 | { |
| 540 | stringTable[s.data()] = stringId; |
| 541 | ret = stringId; |
| 542 | ++stringId; |
| 543 | } |
| 544 | else |
| 545 | { |
| 546 | ret = itr->second; |
| 547 | } |
| 548 | return ret; |
| 549 | } |
| 550 | |
Patrick Williams | 2be4523 | 2023-05-10 07:51:22 -0500 | [diff] [blame] | 551 | } // namespace metric_blob |