0.6.1
C++ to UML diagram generator based on Clang
Loading...
Searching...
No Matches
util.cc
Go to the documentation of this file.
1/**
2 * @file src/util/util.cc
3 *
4 * Copyright (c) 2021-2025 Bartek Kryza <bkryza@gmail.com>
5 *
6 * Licensed under the Apache License, Version 2.0 (the "License");
7 * you may not use this file except in compliance with the License.
8 * You may obtain a copy of the License at
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing, software
13 * distributed under the License is distributed on an "AS IS" BASIS,
14 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 * See the License for the specific language governing permissions and
16 * limitations under the License.
17 */
18#include "util.h"
19
20#include <spdlog/spdlog.h>
21
22#include <regex>
23#if __has_include(<sys/utsname.h>)
24#include <sys/utsname.h>
25#endif
26
27namespace clanguml::util {
28
29static const auto WHITESPACE = " \n\r\t\f\v";
30
31namespace {
32class pipe_t {
33public:
34 explicit pipe_t(const std::string &command, int &result)
35 : result_{result}
36 ,
37#if defined(__linux) || defined(__unix) || defined(__APPLE__)
38 pipe_{popen(fmt::format("{} 2>&1", command).c_str(), "r")}
39#elif defined(_WIN32)
40 pipe_{_popen(command.c_str(), "r")}
41#endif
42 {
43 }
44
45 ~pipe_t() { reset(); }
46
47 operator bool() const { return pipe_ != nullptr; }
48
49 FILE *get() const { return pipe_; }
50
51 void reset()
52 {
53 if (pipe_ == nullptr)
54 return;
55
56#if defined(__linux) || defined(__unix) || defined(__APPLE__)
57 result_ = pclose(pipe_);
58#elif defined(_WIN32)
59 result_ = _pclose(pipe_);
60#endif
61 pipe_ = nullptr;
62 }
63
64private:
65 int &result_;
66 FILE *pipe_;
67};
68} // namespace
69
70std::string get_process_output(const std::string &command)
71{
72 constexpr size_t kBufferSize{1024};
73 std::array<char, kBufferSize> buffer{};
74 std::string output;
75 int result{EXIT_FAILURE};
76
77 pipe_t pipe{command, result};
78
79 if (!pipe) {
80 throw std::runtime_error("popen() failed!");
81 }
82
83 while (fgets(buffer.data(), buffer.size(), pipe.get()) != nullptr) {
84 output += buffer.data();
85 }
86
87 pipe.reset();
88
89 if (result != EXIT_SUCCESS) {
90 throw std::runtime_error(
91 fmt::format("External command '{}' failed: {}", command, output));
92 }
93
94 return output;
95}
96
97void check_process_output(const std::string &command)
98{
99 constexpr size_t kBufferSize{1024};
100 std::array<char, kBufferSize> buffer{};
101 int result{EXIT_FAILURE};
102 std::string output;
103 pipe_t pipe{command, result};
104
105 if (!pipe) {
106 throw std::runtime_error("popen() failed!");
107 }
108
109 while (fgets(buffer.data(), buffer.size(), pipe.get()) != nullptr) {
110 output += buffer.data();
111 }
112
113 pipe.reset();
114
115 if (result != EXIT_SUCCESS) {
116 throw std::runtime_error(
117 fmt::format("External command '{}' failed: {}", command, output));
118 }
119}
120
121std::string get_env(const std::string &name)
122{
123#if defined(__linux) || defined(__unix)
124 const char *value = std::getenv(name.c_str()); // NOLINT
125
126 if (value == nullptr)
127 return {};
128
129 return std::string{value};
130#elif defined(WINDOWS) || defined(_WIN32) || defined(WIN32)
131 static constexpr auto kMaxEnvLength = 2096U;
132 static char value[kMaxEnvLength];
133 const DWORD ret =
134 GetEnvironmentVariableA(name.c_str(), value, kMaxEnvLength);
135 if (ret == 0 || ret > kMaxEnvLength)
136 return {};
137 else
138 return value;
139#else
140 return {};
141#endif
142}
143
145{
146 const auto env = get_env("CLANGUML_GIT_COMMIT");
147
148 if (!env.empty())
149 return true;
150
151 std::string output;
152
153 try {
154 output = get_process_output("git rev-parse --git-dir");
155 }
156 catch (std::runtime_error &e) {
157 return false;
158 }
159
160 return contains(trim(output), ".git");
161}
162
163std::string run_git_command(
164 const std::string &cmd, const std::string &env_override)
165{
166 auto env = get_env(env_override);
167
168 if (!env.empty())
169 return env;
170
171 std::string output;
172
173 try {
174 output = get_process_output(cmd);
175 }
176 catch (std::runtime_error &e) {
177 return {};
178 }
179
180 return trim(output);
181}
182
183std::string get_git_branch()
184{
185 return run_git_command(
186 "git rev-parse --abbrev-ref HEAD", "CLANGUML_GIT_BRANCH");
187}
188
189std::string get_git_revision()
190{
191 return run_git_command(
192 "git describe --tags --always", "CLANGUML_GIT_REVISION");
193}
194
195std::string get_git_commit()
196{
197 return run_git_command("git rev-parse HEAD", "CLANGUML_GIT_COMMIT");
198}
199
201{
202 return run_git_command(
203 "git rev-parse --show-toplevel", "CLANGUML_GIT_TOPLEVEL_DIR");
204}
205
206std::string get_os_name()
207{
208#ifdef _WIN32
209 return "Windows, 32-bit";
210#elif _WIN64
211 return "Windows, 64-bit";
212#elif __has_include(<sys/utsname.h>)
213 struct utsname utsn; // NOLINT
214 uname(&utsn);
215 return fmt::format("{} {} {}", utsn.sysname, utsn.machine, utsn.release);
216#elif __linux__
217 return "Linux";
218#elif __APPLE__ || __MACH__
219 return "macOS";
220#elif __FreeBSD__
221 return "FreeBSD";
222#elif __unix__ || __unix
223 return "Unix";
224#else
225 return "Unknown";
226#endif
227}
228
229std::string ltrim(const std::string &s)
230{
231 const size_t start = s.find_first_not_of(WHITESPACE);
232 return (start == std::string::npos) ? "" : s.substr(start);
233}
234
235std::string rtrim(const std::string &s)
236{
237 const size_t end = s.find_last_not_of(WHITESPACE);
238 return (end == std::string::npos) ? "" : s.substr(0, end + 1);
239}
240
241std::string trim_typename(const std::string &s)
242{
243 auto res = trim(s);
244 if (res.find("typename ") == 0)
245 return res.substr(strlen("typename "));
246
247 return res;
248}
249
250std::string trim(const std::string &s) { return rtrim(ltrim(s)); }
251
252std::optional<std::pair<std::string, std::string>> split_at_first(
253 const std::string &separator, const std::string &input)
254{
255 std::optional<std::pair<std::string, std::string>> res;
256
257 std::size_t pos = input.find(separator);
258
259 if (pos == std::string::npos) {
260 return res;
261 }
262
263 auto before = input.substr(0, pos);
264 auto after = input.substr(pos + separator.size());
265
266 return std::make_optional<std::pair<std::string, std::string>>(
267 std::move(before), std::move(after));
268}
269
270std::vector<std::string> split(
271 std::string str, std::string_view delimiter, bool skip_empty)
272{
273 std::vector<std::string> result;
274
275 if (!contains(str, delimiter)) {
276 if (!str.empty())
277 result.push_back(std::move(str));
278 else if (!skip_empty)
279 result.push_back(std::move(str));
280 }
281 else
282 while (static_cast<unsigned int>(!str.empty()) != 0U) {
283 auto index = str.find(delimiter);
284 if (index != std::string::npos) {
285 auto tok = str.substr(0, index);
286 if (!tok.empty())
287 result.push_back(std::move(tok));
288 else if (!skip_empty)
289 result.push_back(std::move(tok));
290
291 str = str.substr(index + delimiter.size());
292 }
293 else {
294 if (!str.empty())
295 result.push_back(std::move(str));
296 else if (!skip_empty)
297 result.push_back(std::move(str));
298 str = "";
299 }
300 }
301
302 return result;
303}
304
305std::vector<std::string> split_isspace(std::string str)
306{
307 std::vector<std::string> result;
308
309 while (static_cast<unsigned int>(!str.empty()) != 0U) {
310 auto index = std::find_if(
311 str.begin(), str.end(), [](auto c) { return std::isspace(c); });
312 if (index != str.end()) {
313 auto tok = str.substr(0, std::distance(str.begin(), index));
314 if (!tok.empty())
315 result.push_back(std::move(tok));
316 str = str.substr(std::distance(str.begin(), index) + 1);
317 }
318 else {
319 if (!str.empty())
320 result.push_back(str);
321 str = "";
322 }
323 }
324 return result;
325}
326
327std::string join(
328 const std::vector<std::string> &toks, std::string_view delimiter)
329{
330 return fmt::format("{}", fmt::join(toks, delimiter));
331}
332
333std::string abbreviate(const std::string &s, const unsigned int max_length)
334{
335 if (s.size() <= max_length)
336 return s;
337
338 auto res = s;
339
340 res.resize(max_length);
341
342 if (res.size() > 3) {
343 res.replace(res.size() - 3, 3, 3, '.');
344 }
345
346 return res;
347}
348
350 const std::string &input, std::tuple<std::string, size_t, size_t> &result)
351{
352 const std::regex alias_regex(R"((@A\‍([^\).]+\)))");
353
354 auto alias_it =
355 std::sregex_iterator(input.begin(), input.end(), alias_regex);
356 auto end_it = std::sregex_iterator();
357
358 if (alias_it == end_it)
359 return false;
360
361 const std::smatch &match = *alias_it;
362 const std::string alias = match.str().substr(3, match.str().size() - 4);
363
364 std::get<0>(result) = alias;
365 std::get<1>(result) = match.position();
366 std::get<2>(result) = match.length();
367
368 return true;
369}
370
371bool replace_all(std::string &input, const std::string &pattern,
372 const std::string &replace_with)
373{
374 bool replaced{false};
375
376 auto pos = input.find(pattern);
377 while (pos < input.size()) {
378 input.replace(pos, pattern.size(), replace_with);
379 pos = input.find(pattern, pos + replace_with.size());
380 replaced = true;
381 }
382
383 return replaced;
384}
385
386std::string condense_whitespace(const std::string &input)
387{
388 std::string output;
389 output.reserve(input.size());
390
391 bool in_whitespace = false;
392 for (char ch : input) {
393 if (std::isspace(ch) != 0) {
394 if (!in_whitespace) {
395 output.push_back(' ');
396 in_whitespace = true;
397 }
398 }
399 else {
400 output.push_back(ch);
401 in_whitespace = false;
402 }
403 }
404
405 return output;
406}
407
408template <> bool starts_with(const std::string &s, const std::string &prefix)
409{
410 return s.rfind(prefix, 0) == 0;
411}
412
413template <> bool ends_with(const std::string &value, const std::string &suffix)
414{
415 if (suffix.size() > value.size())
416 return false;
417 return std::equal(suffix.rbegin(), suffix.rend(), value.rbegin());
418}
419
420std::size_t hash_seed(std::size_t seed)
421{
422 constexpr auto kSeedStart{0x6a3712b5};
423 constexpr auto kSeedShiftFirst{6};
424 constexpr auto kSeedShiftSecond{2};
425
426 return kSeedStart + (seed << kSeedShiftFirst) + (seed >> kSeedShiftSecond);
427}
428
429std::string path_to_url(const std::filesystem::path &p)
430{
431 std::vector<std::string> path_tokens;
432 auto it = p.begin();
433 if (p.has_root_directory()) {
434#ifdef _MSC_VER
435 // On Windows convert the root path using its drive letter, e.g.:
436 // C:\A\B\include.h -> /c/A/B/include.h
437 if (p.root_name().string().size() > 1) {
438 if (p.is_absolute()) {
439 path_tokens.push_back(std::string{
440 std::tolower(p.root_name().string().at(0), std::locale())});
441 }
442 it++;
443 }
444#endif
445 it++;
446 }
447
448 for (; it != p.end(); it++)
449 path_tokens.push_back(it->string());
450
451 if (p.has_root_directory())
452 return fmt::format("/{}", fmt::join(path_tokens, "/"));
453
454 return fmt::format("{}", fmt::join(path_tokens, "/"));
455}
456
457std::filesystem::path ensure_path_is_absolute(
458 const std::filesystem::path &p, const std::filesystem::path &root)
459{
460 if (p.is_absolute())
461 return p;
462
463 auto result = root / p;
464 result = result.lexically_normal();
465 result.make_preferred();
466
467 return result;
468}
469
471 const std::filesystem::path &child, const std::filesystem::path &base)
472{
473 if (child.has_root_directory() != base.has_root_directory())
474 return false;
475
476 const auto child_ln = child.lexically_normal();
477 const auto base_ln = base.lexically_normal();
478
479 if (child_ln == base_ln)
480 return true;
481
482 auto rel = child_ln.lexically_relative(base_ln);
483 return !rel.empty() && rel.native()[0] != '.';
484}
485
486std::string format_message_comment(const std::string &comment, unsigned width)
487{
488 if (width == 0)
489 return comment;
490
491 std::string result;
492
493 if (comment.empty())
494 return result;
495
496 auto tokens = split_isspace(comment);
497
498 if (tokens.empty())
499 return result;
500
501 unsigned current_line_length{0};
502 for (const auto &token : tokens) {
503 if (current_line_length < width) {
504 result += token;
505 result += ' ';
506 }
507 else {
508 result.back() = '\n';
509 current_line_length = 0;
510 result += token;
511 result += ' ';
512 }
513
514 current_line_length += token.size() + 1;
515 }
516
517 result.pop_back();
518
519 return result;
520}
521
522std::optional<std::pair<std::string, std::string>> find_entry_by_path_prefix(
523 const std::map<std::string, std::string> &m, const std::string &path)
524{
525 if (m.empty())
526 return {};
527
528 // Extract keys and sort them by length in descending order
529 std::vector<std::string> keys;
530 keys.reserve(m.size());
531 for (const auto &[key, pattern] : m) {
532 keys.push_back(key);
533 }
534
535 std::sort(keys.begin(), keys.end(),
536 [](const std::string &a, const std::string &b) {
537 return a.size() > b.size();
538 });
539
540 std::filesystem::path file_path{path};
541
542 for (const auto &key : keys) {
543 const auto &pattern = m.at(key);
544 std::filesystem::path key_path{key};
545
546 if (is_relative_to(file_path, key_path)) {
547 return {{key, pattern}};
548 }
549 }
550
551 if ((path.empty() || file_path.is_relative() || path == ".") &&
552 m.count(".") > 0) {
553 return {{".", m.at(".")}};
554 }
555
556 return {};
557}
558} // namespace clanguml::util