| Directory: | cvmfs/ |
|---|---|
| File: | cvmfs/ingestion/item.cc |
| Date: | 2025-11-09 02:35:23 |
| Exec | Total | Coverage | |
|---|---|---|---|
| Lines: | 142 | 142 | 100.0% |
| Branches: | 35 | 64 | 54.7% |
| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /** | ||
| 2 | * This file is part of the CernVM File System. | ||
| 3 | */ | ||
| 4 | |||
| 5 | #include "item.h" | ||
| 6 | |||
| 7 | #include <algorithm> | ||
| 8 | #include <cassert> | ||
| 9 | #include <cstdlib> | ||
| 10 | #include <cstring> | ||
| 11 | |||
| 12 | #include "ingestion/ingestion_source.h" | ||
| 13 | #include "item_mem.h" | ||
| 14 | #include "util/concurrency.h" | ||
| 15 | #include "util/smalloc.h" | ||
| 16 | |||
| 17 | 7341859 | FileItem::FileItem(IngestionSource *source, | |
| 18 | uint64_t min_chunk_size, | ||
| 19 | uint64_t avg_chunk_size, | ||
| 20 | uint64_t max_chunk_size, | ||
| 21 | zlib::Algorithms compression_algorithm, | ||
| 22 | shash::Algorithms hash_algorithm, | ||
| 23 | shash::Suffix hash_suffix, | ||
| 24 | bool may_have_chunks, | ||
| 25 | 7341859 | bool has_legacy_bulk_chunk) | |
| 26 | 7341859 | : source_(source) | |
| 27 | 7341859 | , compression_algorithm_(compression_algorithm) | |
| 28 | 7341859 | , hash_algorithm_(hash_algorithm) | |
| 29 | 7341859 | , hash_suffix_(hash_suffix) | |
| 30 | 7341859 | , has_legacy_bulk_chunk_(has_legacy_bulk_chunk) | |
| 31 | 7341859 | , size_(kSizeUnknown) | |
| 32 | 7341859 | , may_have_chunks_(may_have_chunks) | |
| 33 |
1/2✓ Branch 1 taken 7341859 times.
✗ Branch 2 not taken.
|
7341859 | , chunk_detector_(min_chunk_size, avg_chunk_size, max_chunk_size) |
| 34 |
1/2✓ Branch 1 taken 7341859 times.
✗ Branch 2 not taken.
|
7341859 | , bulk_hash_(hash_algorithm) |
| 35 |
1/2✓ Branch 2 taken 7341859 times.
✗ Branch 3 not taken.
|
14683718 | , chunks_(1) { |
| 36 | 7341859 | const int retval = pthread_mutex_init(&lock_, NULL); | |
| 37 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 7341859 times.
|
7341859 | assert(retval == 0); |
| 38 | 7341859 | atomic_init64(&nchunks_in_fly_); | |
| 39 | 7341859 | atomic_init32(&is_fully_chunked_); | |
| 40 | 7341859 | } | |
| 41 | |||
| 42 | 7337260 | FileItem::~FileItem() { pthread_mutex_destroy(&lock_); } | |
| 43 | |||
| 44 | 7265303 | void FileItem::RegisterChunk(const FileChunk &file_chunk) { | |
| 45 | 7265303 | const MutexLockGuard lock_guard(lock_); | |
| 46 | |||
| 47 |
2/2✓ Branch 1 taken 12501 times.
✓ Branch 2 taken 7252802 times.
|
7265303 | switch (file_chunk.content_hash().suffix) { |
| 48 | 12501 | case shash::kSuffixPartial: | |
| 49 |
1/2✓ Branch 1 taken 12501 times.
✗ Branch 2 not taken.
|
12501 | chunks_.PushBack(file_chunk); |
| 50 | 12501 | break; | |
| 51 | |||
| 52 | 7252802 | default: | |
| 53 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 7252802 times.
|
7252802 | assert(file_chunk.offset() == 0); |
| 54 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 7252802 times.
|
7252802 | assert(file_chunk.size() == size_); |
| 55 | 7252802 | bulk_hash_ = file_chunk.content_hash(); | |
| 56 | 7252802 | break; | |
| 57 | } | ||
| 58 | 7265303 | atomic_dec64(&nchunks_in_fly_); | |
| 59 | 7265303 | } | |
| 60 | |||
| 61 | |||
| 62 | //------------------------------------------------------------------------------ | ||
| 63 | |||
| 64 | |||
| 65 | 7353314 | ChunkItem::ChunkItem(FileItem *file_item, uint64_t offset) | |
| 66 | 7348210 | : file_item_(file_item) | |
| 67 | 7348210 | , offset_(offset) | |
| 68 | 7348210 | , size_(0) | |
| 69 | 7348210 | , is_bulk_chunk_(false) | |
| 70 | 7348210 | , upload_handle_(NULL) | |
| 71 |
1/2✓ Branch 4 taken 7347688 times.
✗ Branch 5 not taken.
|
7353314 | , compressor_(NULL) { |
| 72 | 7347688 | hash_ctx_.algorithm = file_item->hash_algorithm(); | |
| 73 |
1/2✓ Branch 1 taken 7345716 times.
✗ Branch 2 not taken.
|
7346934 | hash_ctx_.size = shash::GetContextSize(hash_ctx_.algorithm); |
| 74 | 7345716 | hash_ctx_.buffer = hash_ctx_buffer_; | |
| 75 |
1/2✓ Branch 1 taken 7346731 times.
✗ Branch 2 not taken.
|
7345716 | shash::Init(hash_ctx_); |
| 76 | 7346731 | hash_value_.algorithm = hash_ctx_.algorithm; | |
| 77 | 7346731 | hash_value_.suffix = shash::kSuffixPartial; | |
| 78 | 7346731 | file_item_->IncNchunksInFly(); | |
| 79 | 7360245 | } | |
| 80 | |||
| 81 | |||
| 82 | 7235897 | void ChunkItem::MakeBulkChunk() { | |
| 83 | 7235897 | is_bulk_chunk_ = true; | |
| 84 | 7235897 | hash_value_.suffix = file_item_->hash_suffix(); | |
| 85 | 7233954 | } | |
| 86 | |||
| 87 | |||
| 88 | 16724897 | zlib::Compressor *ChunkItem::GetCompressor() { | |
| 89 |
2/2✓ Branch 1 taken 7227911 times.
✓ Branch 2 taken 9501771 times.
|
16724897 | if (!compressor_.IsValid()) { |
| 90 | compressor_ = zlib::Compressor::Construct( | ||
| 91 |
2/4✓ Branch 2 taken 7252445 times.
✗ Branch 3 not taken.
✓ Branch 5 taken 7249110 times.
✗ Branch 6 not taken.
|
7227911 | file_item_->compression_algorithm()); |
| 92 | } | ||
| 93 | 16750881 | return compressor_.weak_ref(); | |
| 94 | } | ||
| 95 | |||
| 96 | |||
| 97 | 7244441 | void ChunkItem::ReleaseCompressor() { compressor_.Destroy(); } | |
| 98 | |||
| 99 | |||
| 100 | //------------------------------------------------------------------------------ | ||
| 101 | |||
| 102 | atomic_int64 BlockItem::managed_bytes_ = 0; | ||
| 103 | |||
| 104 | |||
| 105 | 94976 | BlockItem::BlockItem(ItemAllocator *allocator) | |
| 106 | 94976 | : allocator_(allocator) | |
| 107 | 94976 | , type_(kBlockHollow) | |
| 108 | 94976 | , tag_(-1) | |
| 109 | 94976 | , file_item_(NULL) | |
| 110 | 94976 | , chunk_item_(NULL) | |
| 111 | 94976 | , data_(NULL) | |
| 112 | 94976 | , capacity_(0) | |
| 113 | 94976 | , size_(0) { } | |
| 114 | |||
| 115 | |||
| 116 | 52195591 | BlockItem::BlockItem(int64_t tag, ItemAllocator *allocator) | |
| 117 | 51863530 | : allocator_(allocator) | |
| 118 | 51863530 | , type_(kBlockHollow) | |
| 119 | 51863530 | , tag_(tag) | |
| 120 | 51863530 | , file_item_(NULL) | |
| 121 | 51863530 | , chunk_item_(NULL) | |
| 122 | 51863530 | , data_(NULL) | |
| 123 | 51863530 | , capacity_(0) | |
| 124 | 52195591 | , size_(0) { | |
| 125 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 51863530 times.
|
51863530 | assert(tag_ >= 0); |
| 126 | 51863530 | } | |
| 127 | |||
| 128 | |||
| 129 | 51981490 | BlockItem::~BlockItem() { | |
| 130 |
2/2✓ Branch 0 taken 21743720 times.
✓ Branch 1 taken 30237770 times.
|
51981490 | if (data_) |
| 131 | 21743720 | allocator_->Free(data_); | |
| 132 | 52014840 | atomic_xadd64(&managed_bytes_, -static_cast<int64_t>(capacity_)); | |
| 133 | 52445026 | } | |
| 134 | |||
| 135 | |||
| 136 | 7996175 | void BlockItem::Discharge() { | |
| 137 | 7996175 | data_ = NULL; | |
| 138 | 7996175 | size_ = capacity_ = 0; | |
| 139 | 7996175 | } | |
| 140 | |||
| 141 | |||
| 142 | 21723824 | void BlockItem::MakeStop() { | |
| 143 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 21723824 times.
|
21723824 | assert(type_ == kBlockHollow); |
| 144 | 21723824 | type_ = kBlockStop; | |
| 145 | 21723824 | } | |
| 146 | |||
| 147 | |||
| 148 | 11173905 | void BlockItem::MakeData(uint32_t capacity) { | |
| 149 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11173905 times.
|
11173905 | assert(type_ == kBlockHollow); |
| 150 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11173905 times.
|
11173905 | assert(allocator_ != NULL); |
| 151 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11173905 times.
|
11173905 | assert(capacity > 0); |
| 152 | |||
| 153 | 11173905 | type_ = kBlockData; | |
| 154 | 11173905 | capacity_ = capacity; | |
| 155 | 11173905 | data_ = reinterpret_cast<unsigned char *>(allocator_->Malloc(capacity_)); | |
| 156 | 11209082 | atomic_xadd64(&managed_bytes_, static_cast<int64_t>(capacity_)); | |
| 157 | 11212591 | } | |
| 158 | |||
| 159 | |||
| 160 | /** | ||
| 161 | * Move data from one block to another. | ||
| 162 | */ | ||
| 163 | 7995334 | void BlockItem::MakeDataMove(BlockItem *other) { | |
| 164 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 7995334 times.
|
7995334 | assert(type_ == kBlockHollow); |
| 165 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 7995334 times.
|
7995334 | assert(other->type_ == kBlockData); |
| 166 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 7995334 times.
|
7995334 | assert(other->size_ > 0); |
| 167 | |||
| 168 | 7995334 | type_ = kBlockData; | |
| 169 | 7995334 | capacity_ = size_ = other->size_; | |
| 170 | 7995334 | data_ = other->data_; | |
| 171 | 7995334 | allocator_ = other->allocator_; | |
| 172 | |||
| 173 | 7995334 | other->Discharge(); | |
| 174 | 7997277 | } | |
| 175 | |||
| 176 | |||
| 177 | /** | ||
| 178 | * Copy a piece of one block's data into a new block. | ||
| 179 | */ | ||
| 180 | 11546498 | void BlockItem::MakeDataCopy(const unsigned char *data, uint32_t size) { | |
| 181 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11546498 times.
|
11546498 | assert(type_ == kBlockHollow); |
| 182 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11546498 times.
|
11546498 | assert(allocator_ != NULL); |
| 183 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11546498 times.
|
11546498 | assert(size > 0); |
| 184 | |||
| 185 | 11546498 | type_ = kBlockData; | |
| 186 | 11546498 | capacity_ = size_ = size; | |
| 187 | 11546498 | data_ = reinterpret_cast<unsigned char *>(allocator_->Malloc(capacity_)); | |
| 188 | 11570678 | memcpy(data_, data, size); | |
| 189 | 11570678 | atomic_xadd64(&managed_bytes_, static_cast<int64_t>(capacity_)); | |
| 190 | 11570715 | } | |
| 191 | |||
| 192 | |||
| 193 | 994050 | void BlockItem::Reset() { | |
| 194 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 994050 times.
|
994050 | assert(type_ == kBlockData); |
| 195 | |||
| 196 | 994050 | atomic_xadd64(&managed_bytes_, -static_cast<int64_t>(capacity_)); | |
| 197 | 994659 | allocator_->Free(data_); | |
| 198 | 994456 | data_ = NULL; | |
| 199 | 994456 | size_ = capacity_ = 0; | |
| 200 | 994456 | type_ = kBlockHollow; | |
| 201 | 994456 | } | |
| 202 | |||
| 203 | |||
| 204 | 35967890 | void BlockItem::SetChunkItem(ChunkItem *value) { | |
| 205 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 35967890 times.
|
35967890 | assert(value != NULL); |
| 206 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 35967890 times.
|
35967890 | assert(chunk_item_ == NULL); |
| 207 | 35967890 | chunk_item_ = value; | |
| 208 | 35967890 | } | |
| 209 | |||
| 210 | |||
| 211 | 51725912 | void BlockItem::SetFileItem(FileItem *value) { | |
| 212 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 51725912 times.
|
51725912 | assert(value != NULL); |
| 213 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 51725912 times.
|
51725912 | assert(file_item_ == NULL); |
| 214 | 51725912 | file_item_ = value; | |
| 215 | 51725912 | } | |
| 216 | |||
| 217 | |||
| 218 | 10240 | uint32_t BlockItem::Write(void *buf, uint32_t count) { | |
| 219 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 10240 times.
|
10240 | assert(type_ == kBlockData); |
| 220 | |||
| 221 | 10240 | const uint32_t remaining = capacity_ - size_; | |
| 222 | 10240 | const uint32_t nbytes = std::min(remaining, count); | |
| 223 | 10240 | memcpy(data_ + size_, buf, nbytes); | |
| 224 | 10240 | size_ += nbytes; | |
| 225 | 10240 | return nbytes; | |
| 226 | } | ||
| 227 |