| Directory: | cvmfs/ |
|---|---|
| File: | cvmfs/sanitizer.cc |
| Date: | 2025-10-19 02:35:28 |
| Exec | Total | Coverage | |
|---|---|---|---|
| Lines: | 69 | 71 | 97.2% |
| Branches: | 40 | 49 | 81.6% |
| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /** | ||
| 2 | * This file is part of the CernVM File System. | ||
| 3 | * | ||
| 4 | * Provides input data sanitizer in the form of whitelist of character ranges. | ||
| 5 | */ | ||
| 6 | |||
| 7 | |||
| 8 | #include "sanitizer.h" | ||
| 9 | |||
| 10 | #include <cassert> | ||
| 11 | |||
| 12 | using namespace std; // NOLINT | ||
| 13 | |||
| 14 | #ifdef CVMFS_NAMESPACE_GUARD | ||
| 15 | namespace CVMFS_NAMESPACE_GUARD { | ||
| 16 | #endif | ||
| 17 | |||
| 18 | namespace sanitizer { | ||
| 19 | |||
| 20 | 30796 | CharRange::CharRange(const char range_begin, const char range_end) { | |
| 21 | 30796 | range_begin_ = range_begin; | |
| 22 | 30796 | range_end_ = range_end; | |
| 23 | 30796 | } | |
| 24 | |||
| 25 | |||
| 26 | 29503 | CharRange::CharRange(const char single_char) { | |
| 27 | 29503 | range_begin_ = range_end_ = single_char; | |
| 28 | 29503 | } | |
| 29 | |||
| 30 | |||
| 31 | 290931 | bool CharRange::InRange(const char c) const { | |
| 32 |
4/4✓ Branch 0 taken 238237 times.
✓ Branch 1 taken 52694 times.
✓ Branch 2 taken 193442 times.
✓ Branch 3 taken 44795 times.
|
290931 | return (c >= range_begin_) && (c <= range_end_); |
| 33 | } | ||
| 34 | |||
| 35 | |||
| 36 | //------------------------------------------------------------------------------ | ||
| 37 | |||
| 38 | |||
| 39 | 28760 | InputSanitizer::InputSanitizer(const string &whitelist) : max_length_(-1) { | |
| 40 |
1/2✓ Branch 1 taken 28760 times.
✗ Branch 2 not taken.
|
28760 | InitValidRanges(whitelist); |
| 41 | 28760 | } | |
| 42 | |||
| 43 | |||
| 44 | 131 | InputSanitizer::InputSanitizer(const string &whitelist, int max_length) | |
| 45 | 131 | : max_length_(max_length) { | |
| 46 |
1/2✓ Branch 1 taken 131 times.
✗ Branch 2 not taken.
|
131 | InitValidRanges(whitelist); |
| 47 | 131 | } | |
| 48 | |||
| 49 | |||
| 50 | 28891 | void InputSanitizer::InitValidRanges(const std::string &whitelist) { | |
| 51 | // Parse the whitelist | ||
| 52 | 28891 | const unsigned length = whitelist.length(); | |
| 53 | 28891 | unsigned pickup_pos = 0; | |
| 54 |
2/2✓ Branch 0 taken 91095 times.
✓ Branch 1 taken 28891 times.
|
119986 | for (unsigned i = 0; i < length; ++i) { |
| 55 |
7/8✓ Branch 0 taken 62205 times.
✓ Branch 1 taken 28890 times.
✓ Branch 3 taken 30796 times.
✓ Branch 4 taken 31409 times.
✗ Branch 5 not taken.
✓ Branch 6 taken 30796 times.
✓ Branch 7 taken 60299 times.
✓ Branch 8 taken 30796 times.
|
91095 | if ((i + 1 >= length) || (whitelist[i + 1] == ' ') || (i == length - 1)) { |
| 56 |
1/2✓ Branch 1 taken 60299 times.
✗ Branch 2 not taken.
|
60299 | const string range = whitelist.substr(pickup_pos, i - pickup_pos + 1); |
| 57 |
2/3✓ Branch 1 taken 29503 times.
✓ Branch 2 taken 30796 times.
✗ Branch 3 not taken.
|
60299 | switch (range.length()) { |
| 58 | 29503 | case 1: | |
| 59 |
1/2✓ Branch 3 taken 29503 times.
✗ Branch 4 not taken.
|
29503 | valid_ranges_.push_back(CharRange(range[0])); |
| 60 | 29503 | break; | |
| 61 | 30796 | case 2: | |
| 62 |
1/2✓ Branch 4 taken 30796 times.
✗ Branch 5 not taken.
|
30796 | valid_ranges_.push_back(CharRange(range[0], range[1])); |
| 63 | 30796 | break; | |
| 64 | ✗ | default: | |
| 65 | ✗ | assert(false); | |
| 66 | } | ||
| 67 | 60299 | ++i; | |
| 68 | 60299 | pickup_pos = i + 1; | |
| 69 | 60299 | } | |
| 70 | } | ||
| 71 | 28891 | } | |
| 72 | |||
| 73 | |||
| 74 | 29614 | bool InputSanitizer::Sanitize(std::string::const_iterator begin, | |
| 75 | std::string::const_iterator end, | ||
| 76 | std::string *filtered_output) const { | ||
| 77 | 29614 | int pos = 0; | |
| 78 | 29614 | bool is_sane = true; | |
| 79 |
2/2✓ Branch 2 taken 215988 times.
✓ Branch 3 taken 29610 times.
|
245598 | for (; begin != end; ++begin) { |
| 80 |
2/2✓ Branch 2 taken 193442 times.
✓ Branch 3 taken 22546 times.
|
215988 | if (CheckRanges(*begin)) { |
| 81 |
4/4✓ Branch 0 taken 1435 times.
✓ Branch 1 taken 192007 times.
✓ Branch 2 taken 4 times.
✓ Branch 3 taken 1431 times.
|
193442 | if ((max_length_ >= 0) && (pos >= max_length_)) { |
| 82 | 4 | is_sane = false; | |
| 83 | 4 | break; | |
| 84 | } | ||
| 85 | 193438 | filtered_output->push_back(*begin); | |
| 86 | 193438 | pos++; | |
| 87 | } else { | ||
| 88 | 22546 | is_sane = false; | |
| 89 | } | ||
| 90 | } | ||
| 91 | 29614 | return is_sane; | |
| 92 | } | ||
| 93 | |||
| 94 | |||
| 95 | 215988 | bool InputSanitizer::CheckRanges(const char chr) const { | |
| 96 |
2/2✓ Branch 1 taken 290931 times.
✓ Branch 2 taken 22546 times.
|
313477 | for (unsigned j = 0; j < valid_ranges_.size(); ++j) { |
| 97 |
2/2✓ Branch 2 taken 193442 times.
✓ Branch 3 taken 97489 times.
|
290931 | if (valid_ranges_[j].InRange(chr)) { |
| 98 | 193442 | return true; | |
| 99 | } | ||
| 100 | } | ||
| 101 | 22546 | return false; | |
| 102 | } | ||
| 103 | |||
| 104 | |||
| 105 | 492 | string InputSanitizer::Filter(const std::string &input) const { | |
| 106 | 492 | string filtered_output; | |
| 107 |
1/2✓ Branch 1 taken 492 times.
✗ Branch 2 not taken.
|
492 | Sanitize(input, &filtered_output); |
| 108 | 492 | return filtered_output; | |
| 109 | } | ||
| 110 | |||
| 111 | |||
| 112 | 29124 | bool InputSanitizer::IsValid(const std::string &input) const { | |
| 113 | 29124 | string dummy; | |
| 114 |
1/2✓ Branch 1 taken 29124 times.
✗ Branch 2 not taken.
|
58248 | return Sanitize(input, &dummy); |
| 115 | 29124 | } | |
| 116 | |||
| 117 | |||
| 118 | 502 | bool IntegerSanitizer::Sanitize(std::string::const_iterator begin, | |
| 119 | std::string::const_iterator end, | ||
| 120 | std::string *filtered_output) const { | ||
| 121 |
2/2✓ Branch 1 taken 1 times.
✓ Branch 2 taken 501 times.
|
502 | if (std::distance(begin, end) == 0) { |
| 122 | 1 | return false; | |
| 123 | } | ||
| 124 | |||
| 125 |
2/2✓ Branch 1 taken 2 times.
✓ Branch 2 taken 499 times.
|
501 | if (*begin == '-') { |
| 126 | // minus is allowed as the first character! | ||
| 127 | 2 | filtered_output->push_back('-'); | |
| 128 | 2 | begin++; | |
| 129 | } | ||
| 130 | |||
| 131 | 501 | return InputSanitizer::Sanitize(begin, end, filtered_output); | |
| 132 | } | ||
| 133 | |||
| 134 | |||
| 135 | 10 | bool PositiveIntegerSanitizer::Sanitize(std::string::const_iterator begin, | |
| 136 | std::string::const_iterator end, | ||
| 137 | std::string *filtered_output) const { | ||
| 138 |
2/2✓ Branch 1 taken 1 times.
✓ Branch 2 taken 9 times.
|
10 | if (std::distance(begin, end) == 0) { |
| 139 | 1 | return false; | |
| 140 | } | ||
| 141 | |||
| 142 | 9 | return InputSanitizer::Sanitize(begin, end, filtered_output); | |
| 143 | } | ||
| 144 | |||
| 145 | } // namespace sanitizer | ||
| 146 | |||
| 147 | #ifdef CVMFS_NAMESPACE_GUARD | ||
| 148 | } // namespace CVMFS_NAMESPACE_GUARD | ||
| 149 | #endif | ||
| 150 |