summaryrefslogtreecommitdiff
path: root/src/buildtool/storage/target_cache_entry.cpp
diff options
context:
space:
mode:
authorOliver Reiche <oliver.reiche@huawei.com>2023-02-24 15:49:14 +0100
committerOliver Reiche <oliver.reiche@huawei.com>2023-03-13 17:28:59 +0100
commit42b452e72f536b63bac080880b8daa481099793c (patch)
tree0af1a60e5e0fefb5572df38e092def3d8ac74c05 /src/buildtool/storage/target_cache_entry.cpp
parent546bf5beebf2eb75e7b325f8f18969b4dd34a169 (diff)
downloadjustbuild-42b452e72f536b63bac080880b8daa481099793c.tar.gz
Storage: Reworked storage and garbage collection
The improved GC implementation uses refactored storage classes instead of directly accessing "unknown" file paths. The required storage class refactoring is quite substantial and outlined in the following paragraphs.

The module `buildtool/file_system` was extended by:
- `ObjectCAS`: a plain CAS implementation for reading/writing blobs and computing digests for a given `ObjectType`. Depending on that type, files written to the file system may have different properties (e.g., the x-bit set) or the digest may be computed differently (e.g., tree digests in non-compatible mode).

A new module `buildtool/storage` was introduced containing:
- `LocalCAS`: provides a common interface for the "logical CAS", which internally combines three `ObjectCAS`s, one for each `ObjectType` (file, executable, tree).
- `LocalAC`: implements the action cache, which needs the `LocalCAS` for storing cache values.
- `TargetCache`: implements the high-level target cache, which also needs the `LocalCAS` for storing cache values.
- `LocalStorage`: combines the storage classes `LocalCAS`, `LocalAC`, and `TargetCache`. Those are initialized with settings from `StorageConfig`, such as the build root base path or number of generations for the garbage collector. `LocalStorage` is templated with a Boolean parameter `kDoGlobalUplink`, which indicates that, on every read/write access, the garbage collector should be used for uplinking across all generations (global).
- `GarbageCollector`: responsible for garbage collection and the global uplinking across all generations. To do so, it employs instances of `LocalStorage` with `kDoGlobalUplink` set to false, in order to avoid endless recursion. The actual (local) uplinking between two single generations is performed by the corresponding storage class (e.g., `TargetCache` implements uplinking of target cache entries between two target cache generations etc.).
Thereby, the actual knowledge how data should be uplinked is implemented by the instance that is responsible for creating the data in the first place.
Diffstat (limited to 'src/buildtool/storage/target_cache_entry.cpp')
-rw-r--r--src/buildtool/storage/target_cache_entry.cpp106
1 files changed, 106 insertions, 0 deletions
diff --git a/src/buildtool/storage/target_cache_entry.cpp b/src/buildtool/storage/target_cache_entry.cpp
new file mode 100644
index 00000000..683b2f02
--- /dev/null
+++ b/src/buildtool/storage/target_cache_entry.cpp
@@ -0,0 +1,106 @@
+// Copyright 2022 Huawei Cloud Computing Technology Co., Ltd.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "src/buildtool/storage/target_cache_entry.hpp"
+
+#include <algorithm>
+#include <exception>
+#include <iterator>
+#include <stdexcept>
+
+#include "src/buildtool/logging/log_level.hpp"
+#include "src/buildtool/logging/logger.hpp"
+
+// Create a target cache entry from an analysed target.
+// The target's artifacts, provides map, and runfiles are bundled into a
+// TargetResult, which is then serialized by ReplaceNonKnownAndToJson() using
+// the given replacements. Returns std::nullopt if that serialization does
+// not produce a value.
+auto TargetCacheEntry::FromTarget(
+    AnalysedTargetPtr const& target,
+    std::unordered_map<ArtifactDescription, Artifact::ObjectInfo> const&
+        replacements) noexcept -> std::optional<TargetCacheEntry> {
+    auto target_result = TargetResult{
+        target->Artifacts(), target->Provides(), target->RunFiles()};
+    auto serialized = target_result.ReplaceNonKnownAndToJson(replacements);
+    if (not serialized) {
+        return std::nullopt;
+    }
+    return TargetCacheEntry{*serialized};
+}
+
+// Create a target cache entry from an already serialized description.
+// The description is taken by value and moved into the new entry.
+auto TargetCacheEntry::FromJson(nlohmann::json desc) noexcept
+    -> TargetCacheEntry {
+    TargetCacheEntry entry(std::move(desc));
+    return entry;
+}
+
+// Convert the stored description back into a TargetResult by delegating to
+// TargetResult::FromJson(); whatever that call yields is passed on as is.
+auto TargetCacheEntry::ToResult() const noexcept
+    -> std::optional<TargetResult> {
+    auto result = TargetResult::FromJson(desc_);
+    return result;
+}
+
+// Convert the JSON description of a single artifact into its object info.
+//
+// The assumption is that all artifacts mentioned in a target cache entry are
+// KNOWN to the remote side. This is verified at run time instead of relying
+// on audit-level contracts only, so that a description violating the
+// assumption never leads to dereferencing an empty optional.
+//
+// Throws std::runtime_error if the description cannot be parsed, does not
+// describe a KNOWN artifact, or if the resulting artifact has no object info.
+[[nodiscard]] auto ToObjectInfo(nlohmann::json const& json)
+    -> Artifact::ObjectInfo {
+    auto const& desc = ArtifactDescription::FromJson(json);
+    if (not desc or not desc->IsKnown()) {
+        throw std::runtime_error{
+            "artifact description in target cache entry is not a valid "
+            "KNOWN artifact"};
+    }
+    // Hold the artifact in a named local so that the info obtained from it
+    // stays valid regardless of whether Info() returns by value or by
+    // reference.
+    auto artifact = desc->ToArtifact();
+    auto const& info = artifact.Info();
+    if (not info) {
+        throw std::runtime_error{
+            "KNOWN artifact in target cache entry has no object info"};
+    }
+    return *info;
+}
+
+// Append the object info of every value of the given JSON map to infos.
+// Returns false without touching infos if json is not an object, and true
+// once all values have been converted via ToObjectInfo().
+[[nodiscard]] auto ScanArtifactMap(
+    gsl::not_null<std::vector<Artifact::ObjectInfo>*> const& infos,
+    nlohmann::json const& json) -> bool {
+    if (json.is_object()) {
+        // Make room for all entries up front to avoid repeated reallocation.
+        infos->reserve(infos->size() + json.size());
+        for (auto const& artifact : json) {
+            infos->push_back(ToObjectInfo(artifact));
+        }
+        return true;
+    }
+    return false;
+}
+
+// Append the object info of every provided artifact to infos.
+//
+// The given JSON is expected to be an object with the entries "nodes" and
+// "provided_artifacts". Each element of "provided_artifacts" is read as a
+// string and used as a key into "nodes"; the node found there is converted
+// via ToObjectInfo().
+//
+// Returns false without touching infos if json is not an object, and true
+// once all provided artifacts have been converted.
+//
+// Lookups use at() rather than operator[], because accessing a missing key
+// of a const JSON value via operator[] is undefined behavior. With at(), a
+// missing or ill-typed entry raises an exception that the caller can handle.
+[[nodiscard]] auto ScanProvidesMap(
+    gsl::not_null<std::vector<Artifact::ObjectInfo>*> const& infos,
+    nlohmann::json const& json) -> bool {
+    if (not json.is_object()) {
+        return false;
+    }
+    auto const& nodes = json.at("nodes");
+    auto const& provided_artifacts = json.at("provided_artifacts");
+    infos->reserve(infos->size() + provided_artifacts.size());
+    for (auto const& node_id : provided_artifacts) {
+        infos->push_back(
+            ToObjectInfo(nodes.at(node_id.get<std::string>())));
+    }
+    return true;
+}
+
+// Collect the object infos of all artifacts referenced by this entry.
+//
+// Scans the "artifacts" and "runfiles" maps as well as the "provides" map of
+// the stored description, in that order, and appends what is found to infos.
+// Returns true only if all three scans succeed. On failure, infos may already
+// contain the infos appended by the scans that ran before the failing one.
+//
+// The top-level entries are looked up with at() rather than operator[]:
+// desc_ is const here, and accessing a missing key of a const JSON value via
+// operator[] is undefined behavior. With at(), a malformed entry raises an
+// exception that is logged below and reported as failure.
+auto TargetCacheEntry::ToArtifacts(
+    gsl::not_null<std::vector<Artifact::ObjectInfo>*> const& infos)
+    const noexcept -> bool {
+    try {
+        return ScanArtifactMap(infos, desc_.at("artifacts")) and
+               ScanArtifactMap(infos, desc_.at("runfiles")) and
+               ScanProvidesMap(infos, desc_.at("provides"));
+    } catch (std::exception const& ex) {
+        Logger::Log(
+            LogLevel::Error,
+            "Scanning target cache entry for artifacts failed with:\n{}",
+            ex.what());
+    }
+    return false;
+}