mirror of
				https://github.com/usatiuk/backup.git
				synced 2025-10-26 17:37:47 +01:00 
			
		
		
		
	draft
This commit is contained in:
		| @@ -1,6 +1,16 @@ | |||||||
| cmake_minimum_required(VERSION 3.18) | cmake_minimum_required(VERSION 3.18) | ||||||
|  |  | ||||||
| add_library(commands srcs/CommandDiff.cpp srcs/CommandList.cpp srcs/CommandListFiles.cpp srcs/CommandRestore.cpp srcs/CommandRun.cpp srcs/CommandsCommon.cpp srcs/Diff.cpp srcs/CommandMount.cpp) | add_library(commands | ||||||
|  |         srcs/CommandDiff.cpp | ||||||
|  |         srcs/CommandList.cpp | ||||||
|  |         srcs/CommandListFiles.cpp | ||||||
|  |         srcs/CommandRestore.cpp | ||||||
|  |         srcs/CommandRun.cpp | ||||||
|  |         srcs/CommandsCommon.cpp | ||||||
|  |         srcs/Diff.cpp | ||||||
|  |         srcs/CommandMount.cpp | ||||||
|  |         srcs/CommandDelete.cpp | ||||||
|  | ) | ||||||
|  |  | ||||||
| target_include_directories(commands PUBLIC includes) | target_include_directories(commands PUBLIC includes) | ||||||
|  |  | ||||||
|   | |||||||
							
								
								
									
										18
									
								
								src/commands/includes/CommandDelete.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										18
									
								
								src/commands/includes/CommandDelete.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,18 @@ | |||||||
|  | // | ||||||
|  | // Created by Stepan Usatiuk on 06.08.2023. | ||||||
|  | // | ||||||
|  |  | ||||||
|  | #ifndef BACKUP_COMMANDDELETE_H | ||||||
|  | #define BACKUP_COMMANDDELETE_H | ||||||
|  |  | ||||||
|  | #include "Command.h" | ||||||
|  |  | ||||||
|  | class CommandDelete : public Command { | ||||||
|  | public: | ||||||
|  |     CommandDelete(); | ||||||
|  |     void run(Context ctx) override; | ||||||
|  |     static constexpr std::string_view name{"delete"}; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  |  | ||||||
|  | #endif//BACKUP_COMMANDDELETE_H | ||||||
							
								
								
									
										15
									
								
								src/commands/srcs/CommandDelete.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										15
									
								
								src/commands/srcs/CommandDelete.cpp
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,15 @@ | |||||||
|  | // | ||||||
|  | // Created by Stepan Usatiuk on 06.08.2023. | ||||||
|  | // | ||||||
|  |  | ||||||
|  | #include "CommandDelete.h" | ||||||
|  |  | ||||||
|  | #include "CommandsCommon.h" | ||||||
|  |  | ||||||
|  | using namespace CommandsCommon; | ||||||
|  |  | ||||||
|  | CommandDelete::CommandDelete() {} | ||||||
|  |  | ||||||
|  | void CommandDelete::run(Context ctx) { | ||||||
|  |     ctx.repo->deleteObjects({static_cast<unsigned long long>(ctx.repo->getConfig().getInt("aid"))}); | ||||||
|  | } | ||||||
| @@ -3,6 +3,7 @@ | |||||||
|  |  | ||||||
| #include "BytesFormatter.h" | #include "BytesFormatter.h" | ||||||
| #include "Command.h" | #include "Command.h" | ||||||
|  | #include "CommandDelete.h" | ||||||
| #include "CommandDiff.h" | #include "CommandDiff.h" | ||||||
| #include "CommandList.h" | #include "CommandList.h" | ||||||
| #include "CommandListFiles.h" | #include "CommandListFiles.h" | ||||||
| @@ -109,6 +110,7 @@ int main(int argc, char *argv[]) { | |||||||
|         commands.emplace(CommandListFiles::name, std::make_unique<CommandListFiles>()); |         commands.emplace(CommandListFiles::name, std::make_unique<CommandListFiles>()); | ||||||
|         commands.emplace(CommandList::name, std::make_unique<CommandList>()); |         commands.emplace(CommandList::name, std::make_unique<CommandList>()); | ||||||
|         commands.emplace(CommandMount::name, std::make_unique<CommandMount>()); |         commands.emplace(CommandMount::name, std::make_unique<CommandMount>()); | ||||||
|  |         commands.emplace(CommandDelete::name, std::make_unique<CommandDelete>()); | ||||||
|  |  | ||||||
|         if (commands.count(opt) == 0) { |         if (commands.count(opt) == 0) { | ||||||
|             std::cerr << "Unknown argument" << std::endl; |             std::cerr << "Unknown argument" << std::endl; | ||||||
|   | |||||||
| @@ -37,7 +37,7 @@ public: | |||||||
|  |  | ||||||
|     std::vector<char> getObjectRaw(Object::idType id) const override; |     std::vector<char> getObjectRaw(Object::idType id) const override; | ||||||
|     bool putObject(const Object &obj) override; |     bool putObject(const Object &obj) override; | ||||||
|     bool deleteObject(const Object &obj) override; |     bool deleteObjects(const std::vector<Object::idType> &objs) override; | ||||||
|  |  | ||||||
|     std::vector<char> getObjectRaw(Object::ObjectType type, const std::string &key) const override; |     std::vector<char> getObjectRaw(Object::ObjectType type, const std::string &key) const override; | ||||||
|     Object::idType getObjectId(Object::ObjectType type, const std::string &key) const override; |     Object::idType getObjectId(Object::ObjectType type, const std::string &key) const override; | ||||||
| @@ -104,6 +104,8 @@ private: | |||||||
|  |  | ||||||
|     unsigned long long maxFileId = 1;                           ///< Largest ID of object storage file |     unsigned long long maxFileId = 1;                           ///< Largest ID of object storage file | ||||||
|     std::unordered_map<Object::idType, OffsetEntry> offsetIndex;///< Used to locate Object%s in the filesystem |     std::unordered_map<Object::idType, OffsetEntry> offsetIndex;///< Used to locate Object%s in the filesystem | ||||||
|  |     std::unordered_map<Object::idType, std::set<Object::idType>> | ||||||
|  |             fileToObjs;///< Used to locate Object%s in the filesystem | ||||||
|  |  | ||||||
|     std::mutex writeCacheLock;                             ///< Write cache lock |     std::mutex writeCacheLock;                             ///< Write cache lock | ||||||
|     std::map<Object::idType, std::vector<char>> writeCache;///< Write cache, map of Object ids and their serialized data |     std::map<Object::idType, std::vector<char>> writeCache;///< Write cache, map of Object ids and their serialized data | ||||||
| @@ -117,8 +119,11 @@ private: | |||||||
|     void flushWriteCache(std::unique_lock<std::mutex> &&lockW); |     void flushWriteCache(std::unique_lock<std::mutex> &&lockW); | ||||||
|  |  | ||||||
|     Object::idType largestUnusedId = 1;   ///< Largest available objectID |     Object::idType largestUnusedId = 1;   ///< Largest available objectID | ||||||
|  |     std::vector<Object::idType> unusedIds;///< Vector of unused IDs | ||||||
|     std::unordered_map<Object::ObjectType, std::unordered_map<std::string, Object::idType>> |     std::unordered_map<Object::ObjectType, std::unordered_map<std::string, Object::idType>> | ||||||
|             keyIndex;///< Maps Object%'s keys to their ID's |             keyIndex;///< Maps Object%'s keys to their ID's | ||||||
|  |  | ||||||
|  |     std::unordered_map<Object::idType, uint64_t> refCounts;///< Count of references to an object per its id | ||||||
| }; | }; | ||||||
|  |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -37,6 +37,10 @@ public: | |||||||
|     const idType id;      ///< Unique numerical of the object |     const idType id;      ///< Unique numerical of the object | ||||||
|     const ObjectType type;///< Type of the object |     const ObjectType type;///< Type of the object | ||||||
|  |  | ||||||
|  |     static std::unique_ptr<Object> deserialize(const std::vector<char> &src); | ||||||
|  |     static std::unique_ptr<Object> deserialize(std::vector<char>::const_iterator &in, | ||||||
|  |                                                const std::vector<char>::const_iterator &end); | ||||||
|  |  | ||||||
| protected: | protected: | ||||||
|     /// Default constructor |     /// Default constructor | ||||||
|     /// \param id   Object ID |     /// \param id   Object ID | ||||||
|   | |||||||
| @@ -47,6 +47,12 @@ public: | |||||||
|     /// \throws   Exception on any error or if object doesn't exist |     /// \throws   Exception on any error or if object doesn't exist | ||||||
|     virtual std::vector<char> getObjectRaw(Object::idType id) const = 0; |     virtual std::vector<char> getObjectRaw(Object::idType id) const = 0; | ||||||
|  |  | ||||||
|  |     /// Returns the Object with id \p id | ||||||
|  |     /// \param id ID of object to return | ||||||
|  |     /// \return   Serialized object | ||||||
|  |     /// \throws   Exception on any error or if object doesn't exist | ||||||
|  |     std::unique_ptr<Object> getObject(Object::idType id) const; | ||||||
|  |  | ||||||
|     /// Adds the Object \p obj to the Repository |     /// Adds the Object \p obj to the Repository | ||||||
|     /// \param obj  Constant reference to the object |     /// \param obj  Constant reference to the object | ||||||
|     /// \return     True |     /// \return     True | ||||||
| @@ -54,10 +60,10 @@ public: | |||||||
|     virtual bool putObject(const Object &obj) = 0; |     virtual bool putObject(const Object &obj) = 0; | ||||||
|  |  | ||||||
|     /// Deletes Object \p obj from the Repository |     /// Deletes Object \p obj from the Repository | ||||||
|     /// \param obj  Constant reference to the object |     /// \param obj  Constant reference to the vector with ids of objects to delete | ||||||
|     /// \return     True if successful, False if it didn't exist |     /// \return     True if successful, False if it didn't exist | ||||||
|     /// \throws     Exception on any error |     /// \throws     Exception on any error | ||||||
|     virtual bool deleteObject(const Object &obj) = 0; |     virtual bool deleteObjects(const std::vector<Object::idType> &objs) = 0; | ||||||
|  |  | ||||||
|     /// Returns the Object of type \p type and with key \p key |     /// Returns the Object of type \p type and with key \p key | ||||||
|     /// \param type Type of the object |     /// \param type Type of the object | ||||||
|   | |||||||
| @@ -5,8 +5,10 @@ | |||||||
| #include "FileRepository.h" | #include "FileRepository.h" | ||||||
|  |  | ||||||
| #include <exception> | #include <exception> | ||||||
|  | #include <iostream> | ||||||
| #include <iterator> | #include <iterator> | ||||||
| #include <mutex> | #include <mutex> | ||||||
|  | #include <queue> | ||||||
|  |  | ||||||
| #include "CheckFilter.h" | #include "CheckFilter.h" | ||||||
| #include "FilterFactory.h" | #include "FilterFactory.h" | ||||||
| @@ -45,6 +47,9 @@ bool FileRepository::open() { | |||||||
|         std::tie(keyIndex, largestUnusedId) = |         std::tie(keyIndex, largestUnusedId) = | ||||||
|                 Serialize::deserialize<std::pair<decltype(keyIndex), decltype(largestUnusedId)>>( |                 Serialize::deserialize<std::pair<decltype(keyIndex), decltype(largestUnusedId)>>( | ||||||
|                         filters.filterRead(readFile(root / "index"))); |                         filters.filterRead(readFile(root / "index"))); | ||||||
|  |         refCounts = Serialize::deserialize<decltype(refCounts)>(filters.filterRead(readFile(root / "refcounts"))); | ||||||
|  |         unusedIds = Serialize::deserialize<decltype(unusedIds)>(filters.filterRead(readFile(root / "unusedIds"))); | ||||||
|  |         fileToObjs = Serialize::deserialize<decltype(fileToObjs)>(filters.filterRead(readFile(root / "fileToObjs"))); | ||||||
|     } catch (const std::exception &e) { |     } catch (const std::exception &e) { | ||||||
|         ready = false; |         ready = false; | ||||||
|         throw; |         throw; | ||||||
| @@ -79,6 +84,9 @@ FileRepository::~FileRepository() { | |||||||
|  |  | ||||||
|         writeFile(root / "offsets", filters.filterWrite(Serialize::serialize(std::make_pair(maxFileId, offsetIndex)))); |         writeFile(root / "offsets", filters.filterWrite(Serialize::serialize(std::make_pair(maxFileId, offsetIndex)))); | ||||||
|         writeFile(root / "index", filters.filterWrite(Serialize::serialize(std::make_pair(keyIndex, largestUnusedId)))); |         writeFile(root / "index", filters.filterWrite(Serialize::serialize(std::make_pair(keyIndex, largestUnusedId)))); | ||||||
|  |         writeFile(root / "unusedIds", filters.filterWrite(Serialize::serialize(unusedIds))); | ||||||
|  |         writeFile(root / "refcounts", filters.filterWrite(Serialize::serialize(refCounts))); | ||||||
|  |         writeFile(root / "fileToObjs", filters.filterWrite(Serialize::serialize(fileToObjs))); | ||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -133,6 +141,7 @@ void FileRepository::flushWriteCache(std::unique_lock<std::mutex> &&lockW) { | |||||||
|         { |         { | ||||||
|             std::lock_guard lockI(repoLock); |             std::lock_guard lockI(repoLock); | ||||||
|             offsetIndex.emplace(i.first, OffsetEntry(currentFileId, offset, i.second.size())); |             offsetIndex.emplace(i.first, OffsetEntry(currentFileId, offset, i.second.size())); | ||||||
|  |             fileToObjs[currentFileId].emplace(i.first); | ||||||
|         } |         } | ||||||
|         offset += i.second.size(); |         offset += i.second.size(); | ||||||
|         ofstream.rdbuf()->sputn(i.second.data(), i.second.size()); |         ofstream.rdbuf()->sputn(i.second.data(), i.second.size()); | ||||||
| @@ -144,14 +153,81 @@ bool FileRepository::putObject(const Object &obj) { | |||||||
|     { |     { | ||||||
|         std::lock_guard lock(repoLock); |         std::lock_guard lock(repoLock); | ||||||
|         keyIndex[obj.type][obj.getKey()] = obj.id; |         keyIndex[obj.type][obj.getKey()] = obj.id; | ||||||
|  |         for (auto const &i: obj.getRefs()) refCounts[i]++; | ||||||
|     } |     } | ||||||
|     writeObject(obj); |     writeObject(obj); | ||||||
|     return true; |     return true; | ||||||
| } | } | ||||||
|  |  | ||||||
| bool FileRepository::deleteObject(const Object &obj) { | bool FileRepository::deleteObjects(const std::vector<Object::idType> &objs) { | ||||||
|     if (!ready) throw Exception("Tried working with uninitialized repo!"); |     if (!ready) throw Exception("Tried working with uninitialized repo!"); | ||||||
|     throw Exception("Deletion not implemented!"); |  | ||||||
|  |     std::queue<Object::idType> toVisit; | ||||||
|  |     std::set<Object::idType> toDelete; | ||||||
|  |  | ||||||
|  |     for (auto const &o: objs) { | ||||||
|  |         toVisit.emplace(o); | ||||||
|  |         toDelete.emplace(o); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     std::cout << "Scanning for objects" << std::endl; | ||||||
|  |  | ||||||
|  |     while (!toVisit.empty()) { | ||||||
|  |         auto o = toVisit.back(); | ||||||
|  |         toVisit.pop(); | ||||||
|  |  | ||||||
|  |         auto obj = getObject(o); | ||||||
|  |         for (const auto &id: obj->getRefs()) { | ||||||
|  |             std::unique_lock lock(repoLock); | ||||||
|  |             refCounts[id]--; | ||||||
|  |             if (refCounts.at(id) == 0) { | ||||||
|  |                 toDelete.emplace(id); | ||||||
|  |                 toVisit.emplace(id); | ||||||
|  |                 refCounts.erase(id); | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     std::cout << "Found " << toDelete.size() << " to delete " << std::endl; | ||||||
|  |  | ||||||
|  |  | ||||||
|  |     std::unordered_map<uint64_t, Object::idType> fileToObj; | ||||||
|  |     std::set<uint64_t> touchedFiles; | ||||||
|  |  | ||||||
|  |     for (auto const &id: toDelete) { | ||||||
|  |         fileToObj.emplace(offsetIndex.at(id).fileId, id); | ||||||
|  |         touchedFiles.emplace(offsetIndex.at(id).fileId); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     std::cout << "Will rewrite " << touchedFiles.size() << " files" << std::endl; | ||||||
|  |  | ||||||
|  |     for (auto const &f: touchedFiles) { | ||||||
|  |         std::cout << "Rewriting file " << f << std::endl; | ||||||
|  |         const auto &objs = fileToObjs.at(f); | ||||||
|  |         std::vector<std::unique_ptr<Object>> objects; | ||||||
|  |         for (auto const &o: objs) { | ||||||
|  |             auto obj = getObject(o); | ||||||
|  |             { | ||||||
|  |                 std::unique_lock lock(repoLock); | ||||||
|  |                 offsetIndex.erase(o); | ||||||
|  |             } | ||||||
|  |             if (toDelete.find(o) == toDelete.end()) putObject(*obj); | ||||||
|  |         } | ||||||
|  |         { | ||||||
|  |             std::unique_lock lock(repoLock); | ||||||
|  |             fileToObjs.erase(f); | ||||||
|  |         } | ||||||
|  |         std::filesystem::remove(root / std::to_string(f)); | ||||||
|  |     } | ||||||
|  |     { | ||||||
|  |         std::unique_lock lock(repoLock); | ||||||
|  |         for (auto const &id: toDelete) { | ||||||
|  |             unusedIds.emplace_back(id); | ||||||
|  |             // FIXME: this is a bit inefficient | ||||||
|  |             for (auto &m: keyIndex) erase_if(m.second, [&](const auto &t) { return toDelete.contains(t.second); }); | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |     return true; | ||||||
| } | } | ||||||
|  |  | ||||||
| std::vector<char> FileRepository::readFile(const std::filesystem::path &file, unsigned long long offset, | std::vector<char> FileRepository::readFile(const std::filesystem::path &file, unsigned long long offset, | ||||||
| @@ -214,6 +290,11 @@ bool FileRepository::exists(Object::ObjectType type, const std::string &key) con | |||||||
|  |  | ||||||
| Object::idType FileRepository::getId() { | Object::idType FileRepository::getId() { | ||||||
|     std::lock_guard lock(repoLock); |     std::lock_guard lock(repoLock); | ||||||
|  |     if (!unusedIds.empty()) { | ||||||
|  |         auto ret = unusedIds.back(); | ||||||
|  |         unusedIds.pop_back(); | ||||||
|  |         return ret; | ||||||
|  |     } | ||||||
|     return largestUnusedId++; |     return largestUnusedId++; | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -6,6 +6,10 @@ | |||||||
|  |  | ||||||
| #include "Serialize.h" | #include "Serialize.h" | ||||||
|  |  | ||||||
|  | #include "objects/Archive.h" | ||||||
|  | #include "objects/Chunk.h" | ||||||
|  | #include "objects/File.h" | ||||||
|  |  | ||||||
| Object::Object(idType id, ObjectType type) : id(id), type(type) {} | Object::Object(idType id, ObjectType type) : id(id), type(type) {} | ||||||
|  |  | ||||||
| Object::Object(std::vector<char>::const_iterator &in, const std::vector<char>::const_iterator &end) | Object::Object(std::vector<char>::const_iterator &in, const std::vector<char>::const_iterator &end) | ||||||
| @@ -21,3 +25,28 @@ Object::~Object() = default; | |||||||
| static std::vector<Object::idType> emptyRef{}; | static std::vector<Object::idType> emptyRef{}; | ||||||
|  |  | ||||||
| const std::vector<Object::idType> &Object::getRefs() const { return emptyRef; } | const std::vector<Object::idType> &Object::getRefs() const { return emptyRef; } | ||||||
|  |  | ||||||
|  | std::unique_ptr<Object> Object::deserialize(std::vector<char>::const_iterator &in, | ||||||
|  |                                             const std::vector<char>::const_iterator &end) { | ||||||
|  |     auto inCpy = in; | ||||||
|  |     auto id = Serialize::deserialize<idType>(in, end); | ||||||
|  |     auto type = Serialize::deserialize<ObjectType>(in, end); | ||||||
|  |  | ||||||
|  |     switch (type) { | ||||||
|  |         case ObjectType::Archive: | ||||||
|  |             return std::make_unique<Archive>(Serialize::deserialize<Archive>(inCpy, end)); | ||||||
|  |         case ObjectType::File: | ||||||
|  |             return std::make_unique<File>(Serialize::deserialize<File>(inCpy, end)); | ||||||
|  |         case ObjectType::Chunk: | ||||||
|  |             return std::make_unique<Chunk>(Serialize::deserialize<Chunk>(inCpy, end)); | ||||||
|  |         case ObjectType::END: | ||||||
|  |             break; | ||||||
|  |         default: | ||||||
|  |             throw Exception("Bad object!"); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | std::unique_ptr<Object> Object::deserialize(const std::vector<char> &src) { | ||||||
|  |     auto srcIterator = src.cbegin(); | ||||||
|  |     return deserialize(srcIterator, src.end()); | ||||||
|  | } | ||||||
|   | |||||||
| @@ -8,3 +8,7 @@ Repository::~Repository() = default; | |||||||
| Repository::Repository(Config config) : config(std::move(config)) {} | Repository::Repository(Config config) : config(std::move(config)) {} | ||||||
|  |  | ||||||
| const Config &Repository::getConfig() const { return config; } | const Config &Repository::getConfig() const { return config; } | ||||||
|  |  | ||||||
|  | std::unique_ptr<Object> Repository::getObject(Object::idType id) const { | ||||||
|  |     return Object::deserialize(this->getObjectRaw(id)); | ||||||
|  | } | ||||||
|   | |||||||
| @@ -192,7 +192,6 @@ TEST(FileRepository, Filters) { | |||||||
| } | } | ||||||
|  |  | ||||||
| TEST(FileRepository, IDsDisabled) { | TEST(FileRepository, IDsDisabled) { | ||||||
|     GTEST_SKIP(); |  | ||||||
|     Cleaner c({"IDS/testrepo"}); |     Cleaner c({"IDS/testrepo"}); | ||||||
|     { |     { | ||||||
|         Config conf; |         Config conf; | ||||||
| @@ -257,7 +256,7 @@ TEST(FileRepository, IDsDisabled) { | |||||||
|         ASSERT_EQ(repo.getObjectId(Object::ObjectType::Chunk, o2k), 2); |         ASSERT_EQ(repo.getObjectId(Object::ObjectType::Chunk, o2k), 2); | ||||||
|  |  | ||||||
|  |  | ||||||
|         repo.deleteObject(o1); |         repo.deleteObjects({o1.id}); | ||||||
|     } |     } | ||||||
|     { |     { | ||||||
|         Config conf; |         Config conf; | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user