Ed Tanous | 911ac31 | 2017-08-15 09:37:42 -0700 | [diff] [blame] | 1 | #pragma once |
| 2 | |
Ed Tanous | 3ccb3ad | 2023-01-13 17:40:03 -0800 | [diff] [blame] | 3 | #include "app.hpp" |
| 4 | #include "http_request.hpp" |
| 5 | #include "http_response.hpp" |
| 6 | #include "routing.hpp" |
James Feist | 3909dc8 | 2020-04-03 10:58:55 -0700 | [diff] [blame] | 7 | #include "webroutes.hpp" |
| 8 | |
Ed Tanous | 911ac31 | 2017-08-15 09:37:42 -0700 | [diff] [blame] | 9 | #include <boost/container/flat_set.hpp> |
Gunnar Mills | 1214b7e | 2020-06-04 10:11:30 -0500 | [diff] [blame] | 10 | |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 11 | #include <algorithm> |
| 12 | #include <array> |
James Feist | 4418c7f | 2019-04-15 11:09:15 -0700 | [diff] [blame] | 13 | #include <filesystem> |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 14 | #include <fstream> |
| 15 | #include <string> |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 16 | #include <string_view> |
Ed Tanous | 911ac31 | 2017-08-15 09:37:42 -0700 | [diff] [blame] | 17 | |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 18 | namespace crow |
| 19 | { |
| 20 | namespace webassets |
| 21 | { |
Ed Tanous | 911ac31 | 2017-08-15 09:37:42 -0700 | [diff] [blame] | 22 | |
// Derive an HTTP ETag from a webpack-style hashed file name.
//
// webpack emits production chunks named <filename>.<hash>.<extension>
// (for example app.63e2c453.css).  When the second-to-last dot-separated
// component of the file name is exactly eight hexadecimal characters it is
// treated as that hash and returned wrapped in double quotes.  Any other
// file name yields an empty string, meaning "no ETag available".
inline std::string getStaticEtag(const std::filesystem::path& webpath)
{
    const std::string filename = webpath.filename().string();

    std::vector<std::string> parts;
    bmcweb::split(parts, filename, '.');
    BMCWEB_LOG_DEBUG("Checking {} split.size() {}", filename, parts.size());

    // Need at least <name>.<hash>.<ext>
    if (parts.size() < 3)
    {
        return "";
    }

    // The candidate hash sits immediately before the extension
    const std::string& candidate = parts[parts.size() - 2];

    // Webpack hashes are 8 characters long and consist solely of hex digits
    const bool looksLikeHash =
        candidate.size() == 8 &&
        candidate.find_first_not_of("0123456789abcdefABCDEF") ==
            std::string::npos;
    if (!looksLikeHash)
    {
        return "";
    }

    return std::format("\"{}\"", candidate);
}
| 53 | |
// Directory on disk whose contents are published as static web assets.
// The trailing '/' is significant: addFile() strips (size() - 1) leading
// characters from each absolute path so the resulting route keeps a leading
// '/'.
//
// Declared `inline` rather than `static` so that every translation unit
// including this header refers to the same object; the inline functions in
// this header odr-use it, which requires a single entity across TUs.
inline constexpr std::string_view rootpath("/usr/share/www/");
| 55 | |
// Everything needed to answer a request for one static asset.
struct StaticFile
{
    // Location of the (possibly compressed) file on disk
    std::filesystem::path absolutePath;
    // Value for the Content-Type header; empty means "do not send one"
    std::string_view contentType;
    // Value for the Content-Encoding header; empty means "do not send one"
    std::string_view contentEncoding;
    // Quoted ETag value; empty when no ETag could be derived
    std::string etag;
    // True when the served route differs from the file name (an index file
    // published under its directory path)
    bool renamed{false};
};
| 64 | |
| 65 | inline void |
| 66 | handleStaticAsset(const crow::Request& req, |
| 67 | const std::shared_ptr<bmcweb::AsyncResp>& asyncResp, |
| 68 | const StaticFile& file) |
| 69 | { |
| 70 | if (!file.contentType.empty()) |
| 71 | { |
| 72 | asyncResp->res.addHeader(boost::beast::http::field::content_type, |
| 73 | file.contentType); |
| 74 | } |
| 75 | |
| 76 | if (!file.contentEncoding.empty()) |
| 77 | { |
| 78 | asyncResp->res.addHeader(boost::beast::http::field::content_encoding, |
| 79 | file.contentEncoding); |
| 80 | } |
| 81 | |
| 82 | if (!file.etag.empty()) |
| 83 | { |
| 84 | asyncResp->res.addHeader(boost::beast::http::field::etag, file.etag); |
| 85 | // Don't cache paths that don't have the etag in them, like |
| 86 | // index, which gets transformed to / |
| 87 | if (!file.renamed) |
| 88 | { |
| 89 | // Anything with a hash can be cached forever and is |
| 90 | // immutable |
| 91 | asyncResp->res.addHeader(boost::beast::http::field::cache_control, |
| 92 | "max-age=31556926, immutable"); |
| 93 | } |
| 94 | |
| 95 | std::string_view cachedEtag = |
| 96 | req.getHeaderValue(boost::beast::http::field::if_none_match); |
| 97 | if (cachedEtag == file.etag) |
| 98 | { |
| 99 | asyncResp->res.result(boost::beast::http::status::not_modified); |
| 100 | return; |
| 101 | } |
| 102 | } |
| 103 | |
| 104 | if (!asyncResp->res.openFile(file.absolutePath)) |
| 105 | { |
| 106 | BMCWEB_LOG_DEBUG("failed to read file"); |
| 107 | asyncResp->res.result( |
| 108 | boost::beast::http::status::internal_server_error); |
| 109 | return; |
| 110 | } |
| 111 | } |
| 112 | |
| 113 | inline std::string_view getFiletypeForExtension(std::string_view extension) |
| 114 | { |
| 115 | constexpr static std::array<std::pair<std::string_view, std::string_view>, |
| 116 | 17> |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 117 | contentTypes{ |
| 118 | {{".css", "text/css;charset=UTF-8"}, |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 119 | {".eot", "application/vnd.ms-fontobject"}, |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 120 | {".gif", "image/gif"}, |
| 121 | {".html", "text/html;charset=UTF-8"}, |
| 122 | {".ico", "image/x-icon"}, |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 123 | {".jpeg", "image/jpeg"}, |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 124 | {".jpg", "image/jpeg"}, |
| 125 | {".js", "application/javascript;charset=UTF-8"}, |
| 126 | {".json", "application/json"}, |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 127 | // dev tools don't care about map type, setting to json causes |
| 128 | // browser to show as text |
| 129 | // https://stackoverflow.com/questions/19911929/what-mime-type-should-i-use-for-javascript-source-map-files |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 130 | {".map", "application/json"}, |
| 131 | {".png", "image/png;charset=UTF-8"}, |
| 132 | {".svg", "image/svg+xml"}, |
| 133 | {".ttf", "application/x-font-ttf"}, |
| 134 | {".woff", "application/x-font-woff"}, |
| 135 | {".woff2", "application/x-font-woff2"}, |
| 136 | {".xml", "application/xml"}}}; |
Ed Tanous | a47f32b | 2019-10-24 10:08:04 -0700 | [diff] [blame] | 137 | |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 138 | const auto* contentType = std::ranges::find_if( |
| 139 | contentTypes, |
| 140 | [&extension](const auto& val) { return val.first == extension; }); |
Ed Tanous | 153fdcf | 2021-03-04 16:43:14 -0800 | [diff] [blame] | 141 | |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 142 | if (contentType == contentTypes.end()) |
| 143 | { |
| 144 | BMCWEB_LOG_ERROR( |
| 145 | "Cannot determine content-type for file with extension {}", |
| 146 | extension); |
| 147 | return ""; |
| 148 | } |
| 149 | return contentType->second; |
| 150 | } |
| 151 | |
| 152 | inline void addFile(App& app, const std::filesystem::directory_entry& dir) |
| 153 | { |
| 154 | StaticFile file; |
| 155 | file.absolutePath = dir.path(); |
| 156 | std::filesystem::path relativePath( |
| 157 | file.absolutePath.string().substr(rootpath.size() - 1)); |
| 158 | |
| 159 | std::string extension = relativePath.extension(); |
| 160 | std::filesystem::path webpath = relativePath; |
| 161 | |
| 162 | if (extension == ".gz") |
| 163 | { |
| 164 | webpath = webpath.replace_extension(""); |
| 165 | // Use the non-gzip version for determining content type |
| 166 | extension = webpath.extension().string(); |
| 167 | file.contentEncoding = "gzip"; |
| 168 | } |
Ed Tanous | 2b47f94 | 2024-03-12 15:43:16 -0700 | [diff] [blame^] | 169 | else if (extension == ".zstd") |
| 170 | { |
| 171 | webpath = webpath.replace_extension(""); |
| 172 | // Use the non-zstd version for determining content type |
| 173 | extension = webpath.extension().string(); |
| 174 | file.contentEncoding = "zstd"; |
| 175 | } |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 176 | |
| 177 | file.etag = getStaticEtag(webpath); |
| 178 | |
| 179 | if (webpath.filename().string().starts_with("index.")) |
| 180 | { |
| 181 | webpath = webpath.parent_path(); |
| 182 | if (webpath.string().empty() || webpath.string().back() != '/') |
| 183 | { |
| 184 | // insert the non-directory version of this path |
| 185 | webroutes::routes.insert(webpath); |
| 186 | webpath += "/"; |
| 187 | file.renamed = true; |
| 188 | } |
| 189 | } |
| 190 | |
| 191 | std::pair<boost::container::flat_set<std::string>::iterator, bool> |
| 192 | inserted = webroutes::routes.insert(webpath); |
| 193 | |
| 194 | if (!inserted.second) |
| 195 | { |
| 196 | // Got a duplicated path. This is expected in certain |
| 197 | // situations |
| 198 | BMCWEB_LOG_DEBUG("Got duplicated path {}", webpath.string()); |
| 199 | return; |
| 200 | } |
| 201 | file.contentType = getFiletypeForExtension(extension); |
| 202 | |
| 203 | if (webpath == "/") |
| 204 | { |
| 205 | forward_unauthorized::hasWebuiRoute = true; |
| 206 | } |
| 207 | |
| 208 | app.routeDynamic(webpath)( |
| 209 | [file = std::move(file)]( |
| 210 | const crow::Request& req, |
| 211 | const std::shared_ptr<bmcweb::AsyncResp>& asyncResp) { |
| 212 | handleStaticAsset(req, asyncResp, file); |
| 213 | }); |
| 214 | } |
| 215 | |
| 216 | inline void requestRoutes(App& app) |
| 217 | { |
Ed Tanous | 153fdcf | 2021-03-04 16:43:14 -0800 | [diff] [blame] | 218 | std::error_code ec; |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 219 | std::filesystem::recursive_directory_iterator dirIter({rootpath}, ec); |
Ed Tanous | 153fdcf | 2021-03-04 16:43:14 -0800 | [diff] [blame] | 220 | if (ec) |
| 221 | { |
Ed Tanous | 62598e3 | 2023-07-17 17:06:25 -0700 | [diff] [blame] | 222 | BMCWEB_LOG_ERROR( |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 223 | "Unable to find or open {} static file hosting disabled", rootpath); |
Ed Tanous | 153fdcf | 2021-03-04 16:43:14 -0800 | [diff] [blame] | 224 | return; |
| 225 | } |
| 226 | |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 227 | // In certain cases, we might have both a gzipped version of the file AND a |
| 228 | // non-gzipped version. To avoid duplicated routes, we need to make sure we |
| 229 | // get the gzipped version first. Because the gzipped path should be longer |
Ed Tanous | 8b15645 | 2018-10-12 11:09:26 -0700 | [diff] [blame] | 230 | // than the non gzipped path, if we sort in descending order, we should be |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 231 | // guaranteed to get the gzip version first. |
Ed Tanous | a47f32b | 2019-10-24 10:08:04 -0700 | [diff] [blame] | 232 | std::vector<std::filesystem::directory_entry> paths( |
| 233 | std::filesystem::begin(dirIter), std::filesystem::end(dirIter)); |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 234 | std::sort(paths.rbegin(), paths.rend()); |
Ed Tanous | 9dc2c4d | 2018-03-07 14:51:27 -0800 | [diff] [blame] | 235 | |
Ed Tanous | a47f32b | 2019-10-24 10:08:04 -0700 | [diff] [blame] | 236 | for (const std::filesystem::directory_entry& dir : paths) |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 237 | { |
Ed Tanous | a47f32b | 2019-10-24 10:08:04 -0700 | [diff] [blame] | 238 | if (std::filesystem::is_directory(dir)) |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 239 | { |
| 240 | // don't recurse into hidden directories or symlinks |
Ed Tanous | 11ba397 | 2022-07-11 09:50:41 -0700 | [diff] [blame] | 241 | if (dir.path().filename().string().starts_with(".") || |
Ed Tanous | a47f32b | 2019-10-24 10:08:04 -0700 | [diff] [blame] | 242 | std::filesystem::is_symlink(dir)) |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 243 | { |
| 244 | dirIter.disable_recursion_pending(); |
| 245 | } |
Ed Tanous | ba9f9a6 | 2017-10-11 16:40:35 -0700 | [diff] [blame] | 246 | } |
Ed Tanous | a47f32b | 2019-10-24 10:08:04 -0700 | [diff] [blame] | 247 | else if (std::filesystem::is_regular_file(dir)) |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 248 | { |
Ed Tanous | ca89b20 | 2024-04-25 23:02:40 -0700 | [diff] [blame] | 249 | addFile(app, dir); |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 250 | } |
Ed Tanous | 911ac31 | 2017-08-15 09:37:42 -0700 | [diff] [blame] | 251 | } |
Ed Tanous | 99dc9c7 | 2019-10-24 10:09:03 -0700 | [diff] [blame] | 252 | } |
Ed Tanous | 1abe55e | 2018-09-05 08:30:59 -0700 | [diff] [blame] | 253 | } // namespace webassets |
| 254 | } // namespace crow |