blob: 41e3ef23180fa7f9ab1d33ed8f858b61fa110428 [file] [log] [blame]
// Copyright 2021 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
// Package gitfs presents a file tree downloaded from a remote Git repo as an in-memory fs.FS.
package gitfs
import (
"bytes"
"encoding/hex"
"fmt"
"io"
"io/fs"
"io/ioutil"
"net/http"
"strings"
)
// A Repo is a connection to a remote repository served over HTTP or HTTPS.
type Repo struct {
url string // trailing slash removed
caps map[string]string
}
// NewRepo connects to a Git repository at the given http:// or https:// URL.
func NewRepo(url string) (*Repo, error) {
r := &Repo{url: strings.TrimSuffix(url, "/")}
if err := r.handshake(); err != nil {
return nil, err
}
return r, nil
}
// handshake runs the initial Git opening handshake, learning the capabilities of the server.
// See https://git-scm.com/docs/protocol-v2#_initial_client_request.
func (r *Repo) handshake() error {
req, _ := http.NewRequest("GET", r.url+"/info/refs?service=git-upload-pack", nil)
req.Header.Set("Accept", "*/*")
req.Header.Set("Git-Protocol", "version=2")
resp, err := http.DefaultClient.Do(req)
if err != nil {
return fmt.Errorf("handshake: %v", err)
}
data, err := ioutil.ReadAll(resp.Body)
if resp.StatusCode != 200 {
return fmt.Errorf("handshake: %v\n%s", resp.Status, data)
}
if err != nil {
return fmt.Errorf("handshake: reading body: %v", err)
}
if ct := resp.Header.Get("Content-Type"); ct != "application/x-git-upload-pack-advertisement" {
return fmt.Errorf("handshake: invalid response Content-Type: %v", ct)
}
pr := newPktLineReader(bytes.NewReader(data))
lines, err := pr.Lines()
if len(lines) == 1 && lines[0] == "# service=git-upload-pack" {
lines, err = pr.Lines()
}
if err != nil {
return fmt.Errorf("handshake: parsing response: %v", err)
}
caps := make(map[string]string)
for _, line := range lines {
verb, args, _ := cut(line, "=")
caps[verb] = args
}
if _, ok := caps["version 2"]; !ok {
return fmt.Errorf("handshake: not version 2: %q", lines)
}
r.caps = caps
return nil
}
// Resolve looks up the given ref and returns the corresponding Hash.
func (r *Repo) Resolve(ref string) (Hash, error) {
if h, err := parseHash(ref); err == nil {
return h, nil
}
fail := func(err error) (Hash, error) {
return Hash{}, fmt.Errorf("resolve %s: %v", ref, err)
}
refs, err := r.refs(ref)
if err != nil {
return fail(err)
}
for _, known := range refs {
if known.name == ref {
return known.hash, nil
}
}
return fail(fmt.Errorf("unknown ref"))
}
// A ref is a single Git reference, like refs/heads/main, refs/tags/v1.0.0, or HEAD.
type ref struct {
name string // "refs/heads/main", "refs/tags/v1.0.0", "HEAD"
hash Hash // hexadecimal hash
}
// refs executes an ls-refs command on the remote server
// to look up refs with the given prefixes.
// See https://git-scm.com/docs/protocol-v2#_ls_refs.
func (r *Repo) refs(prefixes ...string) ([]ref, error) {
if _, ok := r.caps["ls-refs"]; !ok {
return nil, fmt.Errorf("refs: server does not support ls-refs")
}
var buf bytes.Buffer
pw := newPktLineWriter(&buf)
pw.WriteString("command=ls-refs")
pw.Delim()
pw.WriteString("peel")
pw.WriteString("symrefs")
for _, prefix := range prefixes {
pw.WriteString("ref-prefix " + prefix)
}
pw.Close()
postbody := buf.Bytes()
req, _ := http.NewRequest("POST", r.url+"/git-upload-pack", &buf)
req.Header.Set("Content-Type", "application/x-git-upload-pack-request")
req.Header.Set("Accept", "application/x-git-upload-pack-result")
req.Header.Set("Git-Protocol", "version=2")
resp, err := http.DefaultClient.Do(req)
if err != nil {
return nil, fmt.Errorf("refs: %v", err)
}
defer resp.Body.Close()
data, err := ioutil.ReadAll(resp.Body)
if resp.StatusCode != 200 {
return nil, fmt.Errorf("refs: %v\n%s", resp.Status, data)
}
if err != nil {
return nil, fmt.Errorf("refs: reading body: %v", err)
}
if ct := resp.Header.Get("Content-Type"); ct != "application/x-git-upload-pack-result" {
return nil, fmt.Errorf("refs: invalid response Content-Type: %v", ct)
}
var refs []ref
lines, err := newPktLineReader(bytes.NewReader(data)).Lines()
if err != nil {
return nil, fmt.Errorf("refs: parsing response: %v %d\n%s\n%s", err, len(data), hex.Dump(postbody), hex.Dump(data))
}
for _, line := range lines {
hash, rest, ok := cut(line, " ")
if !ok {
return nil, fmt.Errorf("refs: parsing response: invalid line: %q", line)
}
h, err := parseHash(hash)
if err != nil {
return nil, fmt.Errorf("refs: parsing response: invalid line: %q", line)
}
name, _, _ := cut(rest, " ")
refs = append(refs, ref{hash: h, name: name})
}
return refs, nil
}
// Clone resolves the given ref to a hash and returns the corresponding fs.FS.
func (r *Repo) Clone(ref string) (Hash, fs.FS, error) {
fail := func(err error) (Hash, fs.FS, error) {
return Hash{}, nil, fmt.Errorf("clone %s: %v", ref, err)
}
h, err := r.Resolve(ref)
if err != nil {
return fail(err)
}
tfs, err := r.fetch(h)
if err != nil {
return fail(err)
}
return h, tfs, nil
}
// CloneHash returns the fs.FS for the given hash.
func (r *Repo) CloneHash(h Hash) (fs.FS, error) {
tfs, err := r.fetch(h)
if err != nil {
return nil, fmt.Errorf("clone %s: %v", h, err)
}
return tfs, nil
}
// fetch returns the fs.FS for a given hash.
func (r *Repo) fetch(h Hash) (fs.FS, error) {
// Fetch a shallow packfile from the remote server.
// Shallow means it only contains the tree at that one commit,
// not the entire history of the repo.
// See https://git-scm.com/docs/protocol-v2#_fetch.
opts, ok := r.caps["fetch"]
if !ok {
return nil, fmt.Errorf("fetch: server does not support fetch")
}
if !strings.Contains(" "+opts+" ", " shallow ") {
return nil, fmt.Errorf("fetch: server does not support shallow fetch")
}
// Prepare and send request for pack file.
var buf bytes.Buffer
pw := newPktLineWriter(&buf)
pw.WriteString("command=fetch")
pw.Delim()
pw.WriteString("deepen 1")
pw.WriteString("want " + h.String())
pw.WriteString("done")
pw.Close()
postbody := buf.Bytes()
req, _ := http.NewRequest("POST", r.url+"/git-upload-pack", &buf)
req.Header.Set("Content-Type", "application/x-git-upload-pack-request")
req.Header.Set("Accept", "application/x-git-upload-pack-result")
req.Header.Set("Git-Protocol", "version=2")
resp, err := http.DefaultClient.Do(req)
if err != nil {
return nil, fmt.Errorf("fetch: %v", err)
}
defer resp.Body.Close()
if resp.StatusCode != 200 {
data, _ := ioutil.ReadAll(resp.Body)
return nil, fmt.Errorf("fetch: %v\n%s\n%s", resp.Status, data, hex.Dump(postbody))
}
if ct := resp.Header.Get("Content-Type"); ct != "application/x-git-upload-pack-result" {
return nil, fmt.Errorf("fetch: invalid response Content-Type: %v", ct)
}
// Response is sequence of pkt-line packets.
// It is plain text output (printed by git) until we find "packfile".
// Then it switches to packets with a single prefix byte saying
// what kind of data is in that packet:
// 1 for pack file data, 2 for text output, 3 for errors.
var data []byte
pr := newPktLineReader(resp.Body)
sawPackfile := false
for {
line, err := pr.Next()
if err != nil {
if err == io.EOF {
break
}
return nil, fmt.Errorf("fetch: parsing response: %v", err)
}
if line == nil { // ignore delimiter
continue
}
if !sawPackfile {
// Discard response lines until we get to packfile start.
if strings.TrimSuffix(string(line), "\n") == "packfile" {
sawPackfile = true
}
continue
}
if len(line) == 0 || line[0] == 0 || line[0] > 3 {
fmt.Printf("%q\n", line)
continue
return nil, fmt.Errorf("fetch: malformed response: invalid sideband: %q", line)
}
switch line[0] {
case 1:
data = append(data, line[1:]...)
case 2:
fmt.Printf("%s\n", line[1:])
case 3:
return nil, fmt.Errorf("fetch: server error: %s", line[1:])
}
}
if !bytes.HasPrefix(data, []byte("PACK")) {
return nil, fmt.Errorf("fetch: malformed response: not packfile")
}
// Unpack pack file and return fs.FS for the commit we downloaded.
var s store
if err := unpack(&s, data); err != nil {
return nil, fmt.Errorf("fetch: %v", err)
}
tfs, err := s.commit(h)
if err != nil {
return nil, fmt.Errorf("fetch: %v", err)
}
return tfs, nil
}