| Directory: | cvmfs/ |
|---|---|
| File: | cvmfs/ingestion/item.cc |
| Date: | 2025-11-30 02:35:17 |
| | Exec | Total | Coverage |
|---|---|---|---|
| Lines: | 142 | 142 | 100.0% |
| Branches: | 35 | 64 | 54.7% |
| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /** | ||
| 2 | * This file is part of the CernVM File System. | ||
| 3 | */ | ||
| 4 | |||
| 5 | #include "item.h" | ||
| 6 | |||
| 7 | #include <algorithm> | ||
| 8 | #include <cassert> | ||
| 9 | #include <cstdlib> | ||
| 10 | #include <cstring> | ||
| 11 | |||
| 12 | #include "ingestion/ingestion_source.h" | ||
| 13 | #include "item_mem.h" | ||
| 14 | #include "util/concurrency.h" | ||
| 15 | #include "util/smalloc.h" | ||
| 16 | |||
| 17 | 11609330 | FileItem::FileItem(IngestionSource *source, | |
| 18 | uint64_t min_chunk_size, | ||
| 19 | uint64_t avg_chunk_size, | ||
| 20 | uint64_t max_chunk_size, | ||
| 21 | zlib::Algorithms compression_algorithm, | ||
| 22 | shash::Algorithms hash_algorithm, | ||
| 23 | shash::Suffix hash_suffix, | ||
| 24 | bool may_have_chunks, | ||
| 25 | 11609330 | bool has_legacy_bulk_chunk) | |
| 26 | 11609330 | : source_(source) | |
| 27 | 11609330 | , compression_algorithm_(compression_algorithm) | |
| 28 | 11609330 | , hash_algorithm_(hash_algorithm) | |
| 29 | 11609330 | , hash_suffix_(hash_suffix) | |
| 30 | 11609330 | , has_legacy_bulk_chunk_(has_legacy_bulk_chunk) | |
| 31 | 11609330 | , size_(kSizeUnknown) | |
| 32 | 11609330 | , may_have_chunks_(may_have_chunks) | |
| 33 | 1/2 ✓ Branch 1 taken 11609330 times.<br>✗ Branch 2 not taken. | 11609330 | , chunk_detector_(min_chunk_size, avg_chunk_size, max_chunk_size) |
| 34 | 1/2 ✓ Branch 1 taken 11609330 times.<br>✗ Branch 2 not taken. | 11609330 | , bulk_hash_(hash_algorithm) |
| 35 | 1/2 ✓ Branch 2 taken 11609330 times.<br>✗ Branch 3 not taken. | 23218660 | , chunks_(1) { |
| 36 | 11609330 | const int retval = pthread_mutex_init(&lock_, NULL); | |
| 37 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 11609330 times. | 11609330 | assert(retval == 0); |
| 38 | 11609330 | atomic_init64(&nchunks_in_fly_); | |
| 39 | 11609330 | atomic_init32(&is_fully_chunked_); | |
| 40 | 11609330 | } | |
| 41 | |||
| 42 | 11605602 | FileItem::~FileItem() { pthread_mutex_destroy(&lock_); } | |
| 43 | |||
| 44 | 11523532 | void FileItem::RegisterChunk(const FileChunk &file_chunk) { | |
| 45 | 11523532 | const MutexLockGuard lock_guard(lock_); | |
| 46 | |||
| 47 | 2/2 ✓ Branch 1 taken 20286 times.<br>✓ Branch 2 taken 11503246 times. | 11523532 | switch (file_chunk.content_hash().suffix) { |
| 48 | 20286 | case shash::kSuffixPartial: | |
| 49 | 1/2 ✓ Branch 1 taken 20286 times.<br>✗ Branch 2 not taken. | 20286 | chunks_.PushBack(file_chunk); |
| 50 | 20286 | break; | |
| 51 | |||
| 52 | 11503246 | default: | |
| 53 | 1/2 ✗ Branch 1 not taken.<br>✓ Branch 2 taken 11503246 times. | 11503246 | assert(file_chunk.offset() == 0); |
| 54 | 1/2 ✗ Branch 1 not taken.<br>✓ Branch 2 taken 11503246 times. | 11503246 | assert(file_chunk.size() == size_); |
| 55 | 11503246 | bulk_hash_ = file_chunk.content_hash(); | |
| 56 | 11503246 | break; | |
| 57 | } | ||
| 58 | 11523532 | atomic_dec64(&nchunks_in_fly_); | |
| 59 | 11523532 | } | |
| 60 | |||
| 61 | |||
| 62 | //------------------------------------------------------------------------------ | ||
| 63 | |||
| 64 | |||
| 65 | 11742630 | ChunkItem::ChunkItem(FileItem *file_item, uint64_t offset) | |
| 66 | 11738536 | : file_item_(file_item) | |
| 67 | 11738536 | , offset_(offset) | |
| 68 | 11738536 | , size_(0) | |
| 69 | 11738536 | , is_bulk_chunk_(false) | |
| 70 | 11738536 | , upload_handle_(NULL) | |
| 71 | 1/2 ✓ Branch 4 taken 11736374 times.<br>✗ Branch 5 not taken. | 11742630 | , compressor_(NULL) { |
| 72 | 11736374 | hash_ctx_.algorithm = file_item->hash_algorithm(); | |
| 73 | 1/2 ✓ Branch 1 taken 11735178 times.<br>✗ Branch 2 not taken. | 11736006 | hash_ctx_.size = shash::GetContextSize(hash_ctx_.algorithm); |
| 74 | 11735178 | hash_ctx_.buffer = hash_ctx_buffer_; | |
| 75 | 1/2 ✓ Branch 1 taken 11738168 times.<br>✗ Branch 2 not taken. | 11735178 | shash::Init(hash_ctx_); |
| 76 | 11738168 | hash_value_.algorithm = hash_ctx_.algorithm; | |
| 77 | 11738168 | hash_value_.suffix = shash::kSuffixPartial; | |
| 78 | 11738168 | file_item_->IncNchunksInFly(); | |
| 79 | 11748472 | } | |
| 80 | |||
| 81 | |||
| 82 | 11487284 | void ChunkItem::MakeBulkChunk() { | |
| 83 | 11487284 | is_bulk_chunk_ = true; | |
| 84 | 11487284 | hash_value_.suffix = file_item_->hash_suffix(); | |
| 85 | 11485628 | } | |
| 86 | |||
| 87 | |||
| 88 | 26637044 | zlib::Compressor *ChunkItem::GetCompressor() { | |
| 89 | 2/2 ✓ Branch 1 taken 11497496 times.<br>✓ Branch 2 taken 15147828 times. | 26637044 | if (!compressor_.IsValid()) { |
| 90 | compressor_ = zlib::Compressor::Construct( | ||
| 91 | 2/4 ✓ Branch 2 taken 11515160 times.<br>✗ Branch 3 not taken.<br>✓ Branch 5 taken 11515160 times.<br>✗ Branch 6 not taken. | 11497496 | file_item_->compression_algorithm()); |
| 92 | } | ||
| 93 | 26662988 | return compressor_.weak_ref(); | |
| 94 | } | ||
| 95 | |||
| 96 | |||
| 97 | 11496484 | void ChunkItem::ReleaseCompressor() { compressor_.Destroy(); } | |
| 98 | |||
| 99 | |||
| 100 | //------------------------------------------------------------------------------ | ||
| 101 | |||
| 102 | atomic_int64 BlockItem::managed_bytes_ = 0; | ||
| 103 | |||
| 104 | |||
| 105 | 96080 | BlockItem::BlockItem(ItemAllocator *allocator) | |
| 106 | 96080 | : allocator_(allocator) | |
| 107 | 96080 | , type_(kBlockHollow) | |
| 108 | 96080 | , tag_(-1) | |
| 109 | 96080 | , file_item_(NULL) | |
| 110 | 96080 | , chunk_item_(NULL) | |
| 111 | 96080 | , data_(NULL) | |
| 112 | 96080 | , capacity_(0) | |
| 113 | 96080 | , size_(0) { } | |
| 114 | |||
| 115 | |||
| 116 | 83868234 | BlockItem::BlockItem(int64_t tag, ItemAllocator *allocator) | |
| 117 | 83529812 | : allocator_(allocator) | |
| 118 | 83529812 | , type_(kBlockHollow) | |
| 119 | 83529812 | , tag_(tag) | |
| 120 | 83529812 | , file_item_(NULL) | |
| 121 | 83529812 | , chunk_item_(NULL) | |
| 122 | 83529812 | , data_(NULL) | |
| 123 | 83529812 | , capacity_(0) | |
| 124 | 83868234 | , size_(0) { | |
| 125 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 83529812 times. | 83529812 | assert(tag_ >= 0); |
| 126 | 83529812 | } | |
| 127 | |||
| 128 | |||
| 129 | 83553526 | BlockItem::~BlockItem() { | |
| 130 | 2/2 ✓ Branch 0 taken 35167820 times.<br>✓ Branch 1 taken 48385706 times. | 83553526 | if (data_) |
| 131 | 35167820 | allocator_->Free(data_); | |
| 132 | 83600400 | atomic_xadd64(&managed_bytes_, -static_cast<int64_t>(capacity_)); | |
| 133 | 84147582 | } | |
| 134 | |||
| 135 | |||
| 136 | 12696258 | void BlockItem::Discharge() { | |
| 137 | 12696258 | data_ = NULL; | |
| 138 | 12696258 | size_ = capacity_ = 0; | |
| 139 | 12696258 | } | |
| 140 | |||
| 141 | |||
| 142 | 34575288 | void BlockItem::MakeStop() { | |
| 143 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 34575288 times. | 34575288 | assert(type_ == kBlockHollow); |
| 144 | 34575288 | type_ = kBlockStop; | |
| 145 | 34575288 | } | |
| 146 | |||
| 147 | |||
| 148 | 17734250 | void BlockItem::MakeData(uint32_t capacity) { | |
| 149 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 17734250 times. | 17734250 | assert(type_ == kBlockHollow); |
| 150 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 17734250 times. | 17734250 | assert(allocator_ != NULL); |
| 151 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 17734250 times. | 17734250 | assert(capacity > 0); |
| 152 | |||
| 153 | 17734250 | type_ = kBlockData; | |
| 154 | 17734250 | capacity_ = capacity; | |
| 155 | 17734250 | data_ = reinterpret_cast<unsigned char *>(allocator_->Malloc(capacity_)); | |
| 156 | 17758400 | atomic_xadd64(&managed_bytes_, static_cast<int64_t>(capacity_)); | |
| 157 | 17763460 | } | |
| 158 | |||
| 159 | |||
| 160 | /** | ||
| 161 | * Move data from one block to another. | ||
| 162 | */ | ||
| 163 | 12694832 | void BlockItem::MakeDataMove(BlockItem *other) { | |
| 164 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 12694832 times. | 12694832 | assert(type_ == kBlockHollow); |
| 165 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 12694832 times. | 12694832 | assert(other->type_ == kBlockData); |
| 166 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 12694832 times. | 12694832 | assert(other->size_ > 0); |
| 167 | |||
| 168 | 12694832 | type_ = kBlockData; | |
| 169 | 12694832 | capacity_ = size_ = other->size_; | |
| 170 | 12694832 | data_ = other->data_; | |
| 171 | 12694832 | allocator_ = other->allocator_; | |
| 172 | |||
| 173 | 12694832 | other->Discharge(); | |
| 174 | 12695844 | } | |
| 175 | |||
| 176 | |||
| 177 | /** | ||
| 178 | * Copy a piece of one block's data into a new block. | ||
| 179 | */ | ||
| 180 | 19162388 | void BlockItem::MakeDataCopy(const unsigned char *data, uint32_t size) { | |
| 181 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 19162388 times. | 19162388 | assert(type_ == kBlockHollow); |
| 182 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 19162388 times. | 19162388 | assert(allocator_ != NULL); |
| 183 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 19162388 times. | 19162388 | assert(size > 0); |
| 184 | |||
| 185 | 19162388 | type_ = kBlockData; | |
| 186 | 19162388 | capacity_ = size_ = size; | |
| 187 | 19162388 | data_ = reinterpret_cast<unsigned char *>(allocator_->Malloc(capacity_)); | |
| 188 | 19184790 | memcpy(data_, data, size); | |
| 189 | 19184790 | atomic_xadd64(&managed_bytes_, static_cast<int64_t>(capacity_)); | |
| 190 | 19183180 | } | |
| 191 | |||
| 192 | |||
| 193 | 1720032 | void BlockItem::Reset() { | |
| 194 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 1720032 times. | 1720032 | assert(type_ == kBlockData); |
| 195 | |||
| 196 | 1720032 | atomic_xadd64(&managed_bytes_, -static_cast<int64_t>(capacity_)); | |
| 197 | 1720584 | allocator_->Free(data_); | |
| 198 | 1720308 | data_ = NULL; | |
| 199 | 1720308 | size_ = capacity_ = 0; | |
| 200 | 1720308 | type_ = kBlockHollow; | |
| 201 | 1720308 | } | |
| 202 | |||
| 203 | |||
| 204 | 57995664 | void BlockItem::SetChunkItem(ChunkItem *value) { | |
| 205 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 57995664 times. | 57995664 | assert(value != NULL); |
| 206 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 57995664 times. | 57995664 | assert(chunk_item_ == NULL); |
| 207 | 57995664 | chunk_item_ = value; | |
| 208 | 57995664 | } | |
| 209 | |||
| 210 | |||
| 211 | 83316188 | void BlockItem::SetFileItem(FileItem *value) { | |
| 212 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 83316188 times. | 83316188 | assert(value != NULL); |
| 213 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 83316188 times. | 83316188 | assert(file_item_ == NULL); |
| 214 | 83316188 | file_item_ = value; | |
| 215 | 83316188 | } | |
| 216 | |||
| 217 | |||
| 218 | 23552 | uint32_t BlockItem::Write(void *buf, uint32_t count) { | |
| 219 | 1/2 ✗ Branch 0 not taken.<br>✓ Branch 1 taken 23552 times. | 23552 | assert(type_ == kBlockData); |
| 220 | |||
| 221 | 23552 | const uint32_t remaining = capacity_ - size_; | |
| 222 | 23552 | const uint32_t nbytes = std::min(remaining, count); | |
| 223 | 23552 | memcpy(data_ + size_, buf, nbytes); | |
| 224 | 23552 | size_ += nbytes; | |
| 225 | 23552 | return nbytes; | |
| 226 | } | ||
| 227 |