GCC Code Coverage Report


Directory: cvmfs/
File: cvmfs/sync_mediator.h
Date: 2026-05-03 02:36:16
Exec Total Coverage
Lines: 0 13 0.0%
Branches: 0 12 0.0%

Line Branch Exec Source
1 /**
2 * This file is part of the CernVM File System.
3 *
4 * The SyncMediator is an intermediate layer between the UnionSync
5 * implementation and the CatalogManager.
6 * It's main responsibility is to unwind file system intrinsics as
7 * deleting all files in a deleted directory. Furthermore newly
8 * created directories are recursed and all included files are
9 * added as a whole (performance improvement).
10 *
11 * Furthermore it keeps track of hard link relations. As we cannot store the
12 * transient inode of the union file system in cvmfs, we just keep track of
13 * hard link relations itself. Inodes will be assigned at run time of the CVMFS
14 * client taking these relations into account.
15 *
16 * Another responsibility of this class is the creation and destruction
17 * of nested catalogs. If a .cvmfscatalog magic file is encountered,
18 * either on delete or add, it will be treated as nested catalog change.
19 *
20 * New and modified files are piped to external processes for hashing and
21 * compression. Results come back in a pipe.
22 */
23
24 #ifndef CVMFS_SYNC_MEDIATOR_H_
25 #define CVMFS_SYNC_MEDIATOR_H_
26
27 #include <pthread.h>
28
29 #include <map>
30 #include <stack>
31 #include <string>
32 #include <vector>
33
34 #include "catalog_mgr_rw.h"
35 #include "compression/compression.h"
36 #include "file_chunk.h"
37 #include "publish/repository.h"
38 #include "statistics.h"
39 #include "swissknife_sync.h"
40 #include "sync_item.h"
41 #include "util/pointer.h"
42 #include "util/shared_ptr.h"
43 #include "xattr.h"
44
45 namespace manifest {
46 class Manifest;
47 }
48
49 namespace publish {
50
51 class SyncDiffReporter : public DiffListener {
52 public:
53 enum PrintAction {
54 kPrintDots,
55 kPrintChanges
56 };
57
58 explicit SyncDiffReporter(PrintAction print_action = kPrintChanges,
59 unsigned int processing_dot_interval = 100)
60 : print_action_(print_action)
61 , processing_dot_interval_(processing_dot_interval)
62 , changed_items_(0) { }
63
64 virtual void OnInit(const history::History::Tag &from_tag,
65 const history::History::Tag &to_tag);
66 virtual void OnStats(const catalog::DeltaCounters &delta);
67
68 virtual void OnAdd(const std::string &path,
69 const catalog::DirectoryEntry &entry);
70 virtual void OnRemove(const std::string &path,
71 const catalog::DirectoryEntry &entry);
72 virtual void OnModify(const std::string &path,
73 const catalog::DirectoryEntry &entry_from,
74 const catalog::DirectoryEntry &entry_to);
75 void CommitReport();
76
77 private:
78 void PrintDots();
79 void AddImpl(const std::string &path);
80 void RemoveImpl(const std::string &path);
81 void ModifyImpl(const std::string &path);
82
83 PrintAction print_action_;
84 unsigned int processing_dot_interval_;
85 unsigned int changed_items_;
86 };
87
88 /**
89 * If we encounter a file with linkcount > 1 it will be added to a HardlinkGroup
90 * After processing all files, the HardlinkGroups are populated with
91 * related hardlinks
92 * Assertion: linkcount == HardlinkGroup::hardlinks.size() at the end
93 */
94 struct HardlinkGroup {
95 explicit HardlinkGroup(const SharedPtr<SyncItem> &item) : master(item) {
96 hardlinks[master->GetRelativePath()] = item;
97 }
98
99 void AddHardlink(const SharedPtr<SyncItem> &entry) {
100 hardlinks[entry->GetRelativePath()] = entry;
101 }
102
103 SharedPtr<SyncItem> master;
104 SyncItemList hardlinks;
105 FileChunkList file_chunks;
106 };
107
108 class AbstractSyncMediator {
109 public:
110 virtual ~AbstractSyncMediator() = 0;
111
112 virtual void RegisterUnionEngine(SyncUnion *engine) = 0;
113
114 virtual void Add(SharedPtr<SyncItem> entry) = 0;
115 virtual void Touch(SharedPtr<SyncItem> entry) = 0;
116 virtual void Remove(SharedPtr<SyncItem> entry, bool fast_delete = false) = 0;
117 virtual void Replace(SharedPtr<SyncItem> entry) = 0;
118 virtual void Clone(const std::string from, const std::string to) = 0;
119
120 virtual void AddUnmaterializedDirectory(SharedPtr<SyncItem> entry) = 0;
121
122 virtual void EnterDirectory(SharedPtr<SyncItem> entry) = 0;
123 virtual void LeaveDirectory(SharedPtr<SyncItem> entry) = 0;
124
125 virtual bool Commit(manifest::Manifest *manifest) = 0;
126
127 virtual bool IsExternalData() const = 0;
128 virtual bool IsDirectIo() const = 0;
129 virtual zlib::Algorithms GetCompressionAlgorithm() const = 0;
130 };
131
132 /**
133 * Mapping of inode number to the related HardlinkGroup.
134 */
135 typedef std::map<uint64_t, HardlinkGroup> HardlinkGroupMap;
136
137 /**
138 * The SyncMediator refines the input received from a concrete UnionSync object.
139 * For example, it resolves the insertion and deletion of complete directories
140 * by recursing them. It works as a mediator between the union file system and
141 * forwards the correct database commands to the catalog handler to sync the
142 * changes into the repository.
143 * Furthermore it sends new and modified files to the spooler for compression
144 * and hashing.
145 */
146 class SyncMediator : public virtual AbstractSyncMediator {
147 public:
148 static const unsigned int processing_dot_interval = 100;
149
150 SyncMediator(catalog::WritableCatalogManager *catalog_manager,
151 const SyncParameters *params,
152 perf::StatisticsTemplate statistics);
153 void RegisterUnionEngine(SyncUnion *engine);
154 // Final class, it is not meant to be derived any further
155 ~SyncMediator();
156
157 void Add(SharedPtr<SyncItem> entry);
158 void Touch(SharedPtr<SyncItem> entry);
159 void Remove(SharedPtr<SyncItem> entry, bool fast_delete = false);
160 void Replace(SharedPtr<SyncItem> entry);
161 void Clone(const std::string from, const std::string to);
162
163 void AddUnmaterializedDirectory(SharedPtr<SyncItem> entry);
164
165 void EnterDirectory(SharedPtr<SyncItem> entry);
166 void LeaveDirectory(SharedPtr<SyncItem> entry);
167
168 bool Commit(manifest::Manifest *manifest);
169
170 // The sync union engine uses this information to create properly initialized
171 // sync items
172 bool IsExternalData() const { return params_->external_data; }
173 bool IsDirectIo() const { return params_->direct_io; }
174 zlib::Algorithms GetCompressionAlgorithm() const {
175 return params_->compression_alg;
176 }
177
178 private:
179 typedef std::stack<HardlinkGroupMap> HardlinkGroupMapStack;
180 typedef std::vector<HardlinkGroup> HardlinkGroupList;
181
182 void EnsureAllowed(SharedPtr<SyncItem> entry);
183
184 // Called after figuring out the type of a path (file, symlink, dir)
185 void AddFile(SharedPtr<SyncItem> entry);
186 void RemoveFile(SharedPtr<SyncItem> entry);
187
188 void AddDirectory(SharedPtr<SyncItem> entry);
189 void RemoveDirectory(SharedPtr<SyncItem> entry);
190 void TouchDirectory(SharedPtr<SyncItem> entry);
191
192 void CreateNestedCatalog(SharedPtr<SyncItem> directory);
193 void RemoveNestedCatalog(SharedPtr<SyncItem> directory);
194
195 void TouchDirectoryRecursively(SharedPtr<SyncItem> entry);
196 void TouchingFileCallback(const std::string &parent_dir,
197 const std::string &file_name);
198 void TouchingSymlinkCallback(const std::string &parent_dir,
199 const std::string &link_name);
200 void TouchDirectoryCallback(const std::string &parent_dir,
201 const std::string &dir_name);
202 void RemoveDirectoryRecursively(SharedPtr<SyncItem> entry,
203 bool fast_delete = false);
204 void RemoveFileCallback(const std::string &parent_dir,
205 const std::string &file_name);
206 void RemoveSymlinkCallback(const std::string &parent_dir,
207 const std::string &link_name);
208 void RemoveCharacterDeviceCallback(const std::string &parent_dir,
209 const std::string &link_name);
210 void RemoveBlockDeviceCallback(const std::string &parent_dir,
211 const std::string &link_name);
212 void RemoveFifoCallback(const std::string &parent_dir,
213 const std::string &link_name);
214 void RemoveSocketCallback(const std::string &parent_dir,
215 const std::string &link_name);
216 void RemoveDirectoryCallback(const std::string &parent_dir,
217 const std::string &dir_name);
218 bool IgnoreFileCallback(const std::string &parent_dir,
219 const std::string &file_name);
220 // Called by file system traversal
221 void EnterAddedDirectoryCallback(const std::string &parent_dir,
222 const std::string &dir_name);
223 void LeaveAddedDirectoryCallback(const std::string &parent_dir,
224 const std::string &dir_name);
225 void AddDirectoryRecursively(SharedPtr<SyncItem> entry);
226 bool AddDirectoryCallback(const std::string &parent_dir,
227 const std::string &dir_name);
228 void AddFileCallback(const std::string &parent_dir,
229 const std::string &file_name);
230 void AddCharacterDeviceCallback(const std::string &parent_dir,
231 const std::string &file_name);
232 void AddBlockDeviceCallback(const std::string &parent_dir,
233 const std::string &file_name);
234 void AddFifoCallback(const std::string &parent_dir,
235 const std::string &file_name);
236 void AddSocketCallback(const std::string &parent_dir,
237 const std::string &file_name);
238 void AddSymlinkCallback(const std::string &parent_dir,
239 const std::string &link_name);
240 SharedPtr<SyncItem> CreateSyncItem(const std::string &relative_parent_path,
241 const std::string &filename,
242 const SyncItemType entry_type) const;
243
244 // Called by Upload Spooler
245 void PublishFilesCallback(const upload::SpoolerResult &result);
246 void PublishHardlinksCallback(const upload::SpoolerResult &result);
247
248 // Hardlink handling
249 void CompleteHardlinks(SharedPtr<SyncItem> entry);
250 HardlinkGroupMap &GetHardlinkMap() { return hardlink_stack_.top(); }
251 void LegacyRegularHardlinkCallback(const std::string &parent_dir,
252 const std::string &file_name);
253 void LegacySymlinkHardlinkCallback(const std::string &parent_dir,
254 const std::string &file_name);
255 void LegacyCharacterDeviceHardlinkCallback(const std::string &parent_dir,
256 const std::string &file_name);
257 void LegacyBlockDeviceHardlinkCallback(const std::string &parent_dir,
258 const std::string &file_name);
259 void LegacyFifoHardlinkCallback(const std::string &parent_dir,
260 const std::string &file_name);
261 void LegacySocketHardlinkCallback(const std::string &parent_dir,
262 const std::string &file_name);
263 void InsertLegacyHardlink(SharedPtr<SyncItem> entry);
264 uint64_t GetTemporaryHardlinkGroupNumber(SharedPtr<SyncItem> entry) const;
265 void InsertHardlink(SharedPtr<SyncItem> entry);
266
267 void AddLocalHardlinkGroups(const HardlinkGroupMap &hardlinks);
268 void AddHardlinkGroup(const HardlinkGroup &group);
269
270 catalog::WritableCatalogManager *catalog_manager_;
271 SyncUnion *union_engine_;
272
273 bool handle_hardlinks_;
274
275 /**
276 * When fast_delete is requested but the target path is not a nested catalog
277 * transition point, we fall back to filesystem traversal. This flag ensures
278 * that any nested catalog transition points encountered during the traversal
279 * are still fast-deleted instead of being recursively traversed.
280 */
281 bool recursive_fast_delete_;
282
283 /**
284 * Hardlinks are supported as long as they all reside in the same directory.
285 * If a recursion enters a directory, we push an empty HardlinkGroupMap to
286 * keep track of the hardlinks of this directory.
287 * When leaving a directory (i.e. it is completely processed) the stack is
288 * popped and the HardlinkGroupMap is processed.
289 */
290 HardlinkGroupMapStack hardlink_stack_;
291
292 /**
293 * New and modified files are sent to an external spooler for hashing and
294 * compression. A spooler callback adds them to the catalogs, once processed.
295 */
296 pthread_mutex_t lock_file_queue_;
297 SyncItemList file_queue_;
298
299 HardlinkGroupList hardlink_queue_;
300
301 const SyncParameters *params_;
302 mutable unsigned int changed_items_;
303
304 /**
305 * By default, files have no extended attributes.
306 */
307 XattrList default_xattrs_;
308 UniquePtr<perf::FsCounters> counters_;
309
310 UniquePtr<SyncDiffReporter> reporter_;
311 }; // class SyncMediator
312
313 } // namespace publish
314
315 #endif // CVMFS_SYNC_MEDIATOR_H_
316