summaryrefslogtreecommitdiff
path: root/src
diff options
context:
space:
mode:
authorMaksim Denisov <denisov.maksim@huawei.com>2024-12-11 15:30:43 +0100
committerMaksim Denisov <denisov.maksim@huawei.com>2024-12-19 16:37:59 +0100
commit6b76cc424d622dae484a218f3bf8bfc7851a97fc (patch)
tree983d22217ff76daf7112ad3d81d2a4bb296e6918 /src
parent6a1a70e6882e9ef19843cf7171fc74eee763da44 (diff)
downloadjustbuild-6b76cc424d622dae484a218f3bf8bfc7851a97fc.tar.gz
TreeStructure: Implement computation logic
Diffstat (limited to 'src')
-rw-r--r--src/buildtool/tree_structure/TARGETS24
-rw-r--r--src/buildtool/tree_structure/compute_tree_structure.cpp136
-rw-r--r--src/buildtool/tree_structure/compute_tree_structure.hpp41
3 files changed, 201 insertions, 0 deletions
diff --git a/src/buildtool/tree_structure/TARGETS b/src/buildtool/tree_structure/TARGETS
index e02f6e1c..c52f2b57 100644
--- a/src/buildtool/tree_structure/TARGETS
+++ b/src/buildtool/tree_structure/TARGETS
@@ -21,4 +21,28 @@
, ["src/utils/cpp", "expected"]
]
}
+, "compute_tree_structure":
+ { "type": ["@", "rules", "CC", "library"]
+ , "name": ["compute_tree_structure"]
+ , "hdrs": ["compute_tree_structure.hpp"]
+ , "srcs": ["compute_tree_structure.cpp"]
+ , "deps":
+ [ "tree_structure_cache"
+ , ["src/buildtool/common", "common"]
+ , ["src/buildtool/storage", "storage"]
+ , ["src/utils/cpp", "expected"]
+ ]
+ , "stage": ["src", "buildtool", "tree_structure"]
+ , "private-deps":
+ [ ["@", "fmt", "", "fmt"]
+ , ["src/buildtool/common", "artifact_digest_factory"]
+ , ["src/buildtool/common", "protocol_traits"]
+ , ["src/buildtool/crypto", "hash_function"]
+ , ["src/buildtool/file_system", "file_system_manager"]
+ , ["src/buildtool/file_system", "git_repo"]
+ , ["src/buildtool/file_system", "object_type"]
+ , ["src/utils/cpp", "hex_string"]
+ , ["src/utils/cpp", "path"]
+ ]
+ }
}
diff --git a/src/buildtool/tree_structure/compute_tree_structure.cpp b/src/buildtool/tree_structure/compute_tree_structure.cpp
new file mode 100644
index 00000000..1e1265cd
--- /dev/null
+++ b/src/buildtool/tree_structure/compute_tree_structure.cpp
@@ -0,0 +1,136 @@
+// Copyright 2024 Huawei Cloud Computing Technology Co., Ltd.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "src/buildtool/tree_structure/compute_tree_structure.hpp"
+
+#include <algorithm>
+#include <functional>
+#include <optional>
+#include <unordered_map>
+#include <utility>
+#include <vector>
+
+#include "fmt/core.h"
+#include "src/buildtool/common/artifact_digest_factory.hpp"
+#include "src/buildtool/common/protocol_traits.hpp"
+#include "src/buildtool/crypto/hash_function.hpp"
+#include "src/buildtool/file_system/file_system_manager.hpp"
+#include "src/buildtool/file_system/git_repo.hpp"
+#include "src/buildtool/file_system/object_type.hpp"
+#include "src/utils/cpp/hex_string.hpp"
+#include "src/utils/cpp/path.hpp"
+
+auto ComputeTreeStructure(ArtifactDigest const& tree,
+ Storage const& storage,
+ TreeStructureCache const& cache) noexcept
+ -> expected<ArtifactDigest, std::string> {
+ if (not tree.IsTree() or not ProtocolTraits::IsNative(tree.GetHashType())) {
+ return unexpected{fmt::format("Not a git tree: {}", tree.hash())};
+ }
+
+ if (auto result = cache.Get(tree)) {
+ return *std::move(result);
+ }
+
+ auto const tree_path = storage.CAS().TreePath(tree);
+ if (not tree_path) {
+ return unexpected{
+ fmt::format("Failed to read from the storage: {}", tree.hash())};
+ }
+
+ auto const tree_content = FileSystemManager::ReadFile(*tree_path);
+ if (not tree_content) {
+ return unexpected{
+ fmt::format("Failed to read content of: {}", tree.hash())};
+ }
+
+ auto const check_symlinks =
+ [&storage](std::vector<ArtifactDigest> const& ids) {
+ return std::all_of(
+ ids.begin(), ids.end(), [&storage](auto const& id) -> bool {
+ auto path_to_symlink =
+ storage.CAS().BlobPath(id, /*is_executable=*/false);
+ if (not path_to_symlink) {
+ return false;
+ }
+ auto const content =
+ FileSystemManager::ReadFile(*path_to_symlink);
+ return content and PathIsNonUpwards(*content);
+ });
+ };
+ auto const entries = GitRepo::ReadTreeData(
+ *tree_content, tree.hash(), check_symlinks, /*is_hex_id=*/true);
+ if (not entries) {
+ return unexpected{
+ fmt::format("Failed to parse git tree: {}", tree.hash())};
+ }
+
+ GitRepo::tree_entries_t structure_entries{};
+ for (auto const& [raw_id, es] : *entries) {
+ for (auto const& entry : es) {
+ std::optional<ArtifactDigest> structure_digest;
+ if (IsTreeObject(entry.type)) {
+ auto const git_digest =
+ ArtifactDigestFactory::Create(HashFunction::Type::GitSHA1,
+ ToHexString(raw_id),
+ /*size is unknown*/ 0,
+ /*is_tree=*/true);
+ if (not git_digest) {
+ return unexpected{git_digest.error()};
+ }
+ auto sub_tree =
+ ComputeTreeStructure(*git_digest, storage, cache);
+ if (not sub_tree) {
+ return sub_tree;
+ }
+ structure_digest = *std::move(sub_tree);
+ }
+ else {
+ structure_digest = storage.CAS().StoreBlob(
+ std::string{}, IsExecutableObject(entry.type));
+ }
+ if (not structure_digest) {
+ return unexpected{fmt::format(
+ "Failed to get structure digest for: {}", raw_id)};
+ }
+ if (auto id = FromHexString(structure_digest->hash())) {
+ structure_entries[*std::move(id)].emplace_back(entry);
+ }
+ else {
+ return unexpected{
+ fmt::format("Failed to get raw id for {}", raw_id)};
+ }
+ }
+ }
+
+ auto const structure_tree = GitRepo::CreateShallowTree(structure_entries);
+ if (not structure_tree) {
+ return unexpected{fmt::format(
+ "Failed to create structured Git tree for {}", tree.hash())};
+ }
+
+ auto tree_structure = storage.CAS().StoreTree(structure_tree->second);
+ if (not tree_structure) {
+ return unexpected{fmt::format(
+ "Failed to add tree structure to the CAS for {}", tree.hash())};
+ }
+
+ if (not cache.Set(tree, *tree_structure)) {
+ return unexpected{fmt::format(
+ "Failed to create a tree structure cache entry for\n{} => {}",
+ tree.hash(),
+ tree_structure->hash())};
+ }
+ return *std::move(tree_structure);
+}
diff --git a/src/buildtool/tree_structure/compute_tree_structure.hpp b/src/buildtool/tree_structure/compute_tree_structure.hpp
new file mode 100644
index 00000000..dc31d814
--- /dev/null
+++ b/src/buildtool/tree_structure/compute_tree_structure.hpp
@@ -0,0 +1,41 @@
+// Copyright 2024 Huawei Cloud Computing Technology Co., Ltd.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef INCLUDED_SRC_BUILDTOOL_TREE_STRUCTURE_COMPUTE_TREE_STRUCTURE_HPP
+#define INCLUDED_SRC_BUILDTOOL_TREE_STRUCTURE_COMPUTE_TREE_STRUCTURE_HPP
+
+#include <string>
+
+#include "src/buildtool/common/artifact_digest.hpp"
+#include "src/buildtool/storage/storage.hpp"
+#include "src/buildtool/tree_structure/tree_structure_cache.hpp"
+#include "src/utils/cpp/expected.hpp"
+
+/// \brief Compute the tree structure of a git tree and add corresponding
+/// coupling to the cache. Tree structure is a directory, where all blobs and
+/// symlinks are replaced with empty blobs. Every subtree gets written to the
+/// cache as well. Expects tree is present in the storage.
+/// \param tree Git tree to be analyzed. Must be present in the storage.
+/// \param storage Storage (GitSHA1) to be used for adding new tree
+/// structure artifacts
+/// \param cache Cache for storing key-value dependencies.
+/// \return Digest of the tree structure that is present in the storage on
+/// success, or an error message on failure.
+[[nodiscard]] auto ComputeTreeStructure(
+ ArtifactDigest const& tree,
+ Storage const& storage,
+ TreeStructureCache const& cache) noexcept
+ -> expected<ArtifactDigest, std::string>;
+
+#endif // INCLUDED_SRC_BUILDTOOL_TREE_STRUCTURE_COMPUTE_TREE_STRUCTURE_HPP