From 6cfd7e19bcc9b41b119398cdd78d4e7c7601a3c1 Mon Sep 17 00:00:00 2001 From: Masaya Suzuki Date: Mon, 28 Oct 2024 14:48:19 -0700 Subject: [PATCH] Add get-files command This command allows users to fetch multiple files from a specific commit hash in a Git repository. When a file is not found, the command will not return an error and the file is not in the result. --- cmd/get_files.go | 47 +++++++++++++++++++++ cmd/pipe.go | 7 ++++ get_files.go | 107 +++++++++++++++++++++++++++++++++++++++++++++++ 3 files changed, 161 insertions(+) create mode 100644 cmd/get_files.go create mode 100644 get_files.go diff --git a/cmd/get_files.go b/cmd/get_files.go new file mode 100644 index 0000000..a24d5d3 --- /dev/null +++ b/cmd/get_files.go @@ -0,0 +1,47 @@ +// Copyright 2024 Aviator Technologies, Inc. +// SPDX-License-Identifier: MIT + +package cmd + +import ( + "net/http" + + nichegit "github.com/aviator-co/niche-git" + "github.com/aviator-co/niche-git/debug" + "github.com/go-git/go-git/v5/plumbing" +) + +type GetFilesArgs struct { + RepoURL string `json:"repoURL"` + CommitHash string `json:"commitHash"` + FilePaths []string `json:"filePaths"` +} + +type getFilesOutput struct { + Files map[string]string `json:"files"` + FetchDebugInfo *debug.FetchDebugInfo `json:"fetchDebugInfo"` + BlobFetchDebugInfo *debug.FetchDebugInfo `json:"blobFetchDebugInfo"` + Error string `json:"error,omitempty"` +} + +func GetFiles(args GetFilesArgs) *getFilesOutput { + client := &http.Client{Transport: &authnRoundtripper{}} + files, fetchDebugInfo, blobFetchDebugInfo, err := nichegit.FetchFiles( + args.RepoURL, + client, + plumbing.NewHash(args.CommitHash), + args.FilePaths, + ) + if files == nil { + files = make(map[string]string) + } + output := &getFilesOutput{ + Files: files, + FetchDebugInfo: &fetchDebugInfo, + BlobFetchDebugInfo: blobFetchDebugInfo, + } + if err != nil { + output.Error = err.Error() + } + return output +} diff --git a/cmd/pipe.go b/cmd/pipe.go index 4f63195..345fbf9 100644 --- a/cmd/pipe.go +++ b/cmd/pipe.go @@ -37,6 +37,13 @@ var pipeCmd = &cobra.Command{ dec := json.NewDecoder(in) switch pipeArg.command { + case "get-files": + input := GetFilesArgs{} + if err := dec.Decode(&input); err != nil { + return err + } + output := GetFiles(input) + return writeJSON(pipeArg.outputFile, output) case "get-modified-files-regexp-matches": input := GetModifiedFilesRegexpMatchesArgs{} if err := dec.Decode(&input); err != nil { diff --git a/get_files.go b/get_files.go new file mode 100644 index 0000000..a50e6e7 --- /dev/null +++ b/get_files.go @@ -0,0 +1,107 @@ +// Copyright 2024 Aviator Technologies, Inc. +// SPDX-License-Identifier: MIT + +package nichegit + +import ( + "bytes" + "fmt" + "net/http" + "strings" + + "github.com/aviator-co/niche-git/debug" + "github.com/aviator-co/niche-git/internal/fetch" + "github.com/go-git/go-git/v5/plumbing" + "github.com/go-git/go-git/v5/plumbing/filemode" + "github.com/go-git/go-git/v5/plumbing/format/packfile" + "github.com/go-git/go-git/v5/plumbing/object" + "github.com/go-git/go-git/v5/storage/memory" +) + +func FetchFiles(repoURL string, client *http.Client, commitHash plumbing.Hash, filePaths []string) (map[string]string, debug.FetchDebugInfo, *debug.FetchDebugInfo, error) { + packfilebs, fetchDebugInfo, err := fetch.FetchBlobNonePackfile(repoURL, client, []plumbing.Hash{commitHash}) + if err != nil { + return nil, fetchDebugInfo, nil, err + } + storage := memory.NewStorage() + parser, err := packfile.NewParserWithStorage(packfile.NewScanner(bytes.NewReader(packfilebs)), storage) + if err != nil { + return nil, fetchDebugInfo, nil, fmt.Errorf("failed to parse packfile: %v", err) + } + if _, err := parser.Parse(); err != nil { + return nil, fetchDebugInfo, nil, fmt.Errorf("failed to parse packfile: %v", err) + } + + tree, err := getTreeFromCommit(storage, commitHash) + if err != nil { + return nil, fetchDebugInfo, nil, err + } + blobs := make(map[string]plumbing.Hash) + for _, filePath := range filePaths { + blobHash, err := getBlobHashFromTree(storage, tree, filePath) + if err != nil { + return nil, fetchDebugInfo, nil, fmt.Errorf("failed to get a blob hash for %s: %v", filePath, err) + } + if blobHash != plumbing.ZeroHash { + blobs[filePath] = blobHash + } + } + + if len(blobs) == 0 { + return make(map[string]string), fetchDebugInfo, nil, nil + } + + var blobHashes []plumbing.Hash + for _, blobHash := range blobs { + blobHashes = append(blobHashes, blobHash) + } + + packfilebs, fetchBlobDebugInfo, err := fetch.FetchBlobPackfile(repoURL, client, blobHashes) + blobFetchDebugInfo := &fetchBlobDebugInfo + if err != nil { + return nil, fetchDebugInfo, blobFetchDebugInfo, err + } + parser, err = packfile.NewParserWithStorage(packfile.NewScanner(bytes.NewReader(packfilebs)), storage) + if err != nil { + return nil, fetchDebugInfo, blobFetchDebugInfo, fmt.Errorf("failed to parse packfile: %v", err) + } + if _, err := parser.Parse(); err != nil { + return nil, fetchDebugInfo, blobFetchDebugInfo, fmt.Errorf("failed to parse packfile: %v", err) + } + + files := make(map[string]string) + for filePath, blobHash := range blobs { + bs, err := getBlobContent(storage, blobHash) + if err != nil { + return nil, fetchDebugInfo, blobFetchDebugInfo, fmt.Errorf("failed to get a blob content for %s: %v", filePath, err) + } + files[filePath] = string(bs) + } + return files, fetchDebugInfo, blobFetchDebugInfo, nil +} + +func getBlobHashFromTree(storage *memory.Storage, tree *object.Tree, filePath string) (plumbing.Hash, error) { + first, second, _ := strings.Cut(filePath, "/") + for _, entry := range tree.Entries { + if entry.Name == first { + if entry.Mode == filemode.Regular || entry.Mode == filemode.Executable { + if second == "" { + return entry.Hash, nil + } + // Treat this as not found. + return plumbing.ZeroHash, nil + } + if entry.Mode == filemode.Dir { + subTree, err := object.GetTree(storage, entry.Hash) + if err != nil { + return plumbing.ZeroHash, err + } + return getBlobHashFromTree(storage, subTree, second) + } + // Treat this as not found. + return plumbing.ZeroHash, nil + } + } + // The file does not exist. + return plumbing.ZeroHash, nil +}