123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382 |
- package gig
- import (
- "bytes"
- "encoding/binary"
- "fmt"
- "os"
- "strings"
- )
- // Resources:
- // https://github.com/git/git/blob/master/Documentation/technical/pack-format.txt
- // http://schacon.github.io/gitbook/7_the_packfile.html
// PackHeader is the fixed-size header read from the start of a pack
// file: a four byte signature, followed by the pack format version and
// the number of objects stored in the pack.
// All fields are stored in network byte order (big-endian).
type PackHeader struct {
	Sig              [4]byte
	Version, Objects uint32
}
// FanOut is the 256-entry fan-out table of a pack index. As described
// in the git pack format documentation, the N-th entry records the
// number of objects in the corresponding pack whose object name starts
// with a byte that is less than or equal to N.
type FanOut [256]uint32

// Bounds returns the two fan-out counts that enclose the first byte b:
// s is the table entry for b-1 (zero when b is 0) and e is the entry
// for b itself.
func (fo FanOut) Bounds(b byte) (s, e int) {
	if b == 0 {
		return 0, int(fo[0])
	}
	return int(fo[b-1]), int(fo[b])
}
- //PackIndex represents the git pack file
- //index. It is the main object to use for
- //opening objects contained in packfiles
- //vai OpenObject
- type PackIndex struct {
- *os.File
- Version uint32
- FO FanOut
- shaBase int64
- }
// PackFile is an open git pack file holding the actual object data.
// It should normally not be used directly.
type PackFile struct {
	// File is the underlying pack file; its methods are promoted.
	*os.File

	// Version is the pack format version taken from the pack header.
	Version uint32
	// ObjCount is the number of objects announced by the pack header.
	ObjCount uint32
}
- //PackIndexOpen opens the git pack file with the given
- //path. The ".idx" if missing will be appended.
- func PackIndexOpen(path string) (*PackIndex, error) {
- if !strings.HasSuffix(path, ".idx") {
- path += ".idx"
- }
- fd, err := os.Open(path)
- if err != nil {
- return nil, fmt.Errorf("git: could not read pack index: %v", err)
- }
- idx := &PackIndex{File: fd, Version: 1}
- var peek [4]byte
- err = binary.Read(fd, binary.BigEndian, &peek)
- if err != nil {
- fd.Close()
- return nil, fmt.Errorf("git: could not read pack index: %v", err)
- }
- if bytes.Equal(peek[:], []byte("\377tOc")) {
- binary.Read(fd, binary.BigEndian, &idx.Version)
- }
- if idx.Version == 1 {
- _, err = idx.Seek(0, 0)
- if err != nil {
- fd.Close()
- return nil, fmt.Errorf("git: io error: %v", err)
- }
- } else if idx.Version > 2 {
- fd.Close()
- return nil, fmt.Errorf("git: unsupported pack index version: %d", idx.Version)
- }
- err = binary.Read(idx, binary.BigEndian, &idx.FO)
- if err != nil {
- idx.Close()
- return nil, fmt.Errorf("git: io error: %v", err)
- }
- idx.shaBase = int64((idx.Version-1)*8) + int64(binary.Size(idx.FO))
- return idx, nil
- }
- //ReadSHA1 reads the SHA1 stared at position pos (in the FanOut table).
- func (pi *PackIndex) ReadSHA1(chksum *SHA1, pos int) error {
- if version := pi.Version; version != 2 {
- return fmt.Errorf("git: v%d version support incomplete", version)
- }
- start := pi.shaBase
- _, err := pi.ReadAt(chksum[0:20], start+int64(pos)*int64(20))
- if err != nil {
- return err
- }
- return nil
- }
- //ReadOffset returns the offset in the pack file of the object
- //at position pos in the FanOut table.
- func (pi *PackIndex) ReadOffset(pos int) (int64, error) {
- if version := pi.Version; version != 2 {
- return -1, fmt.Errorf("git: v%d version incomplete", version)
- }
- //header[2*4] + FanOut[256*4] + n * (sha1[20]+crc[4])
- start := int64(2*4+256*4) + int64(pi.FO[255]*24) + int64(pos*4)
- var offset uint32
- _, err := pi.Seek(start, 0)
- if err != nil {
- return -1, fmt.Errorf("git: io error: %v", err)
- }
- err = binary.Read(pi, binary.BigEndian, &offset)
- if err != nil {
- return -1, err
- }
- //see if msb is set, if so this is an
- // offset into the 64b_offset table
- if val := uint32(1<<31) & offset; val != 0 {
- return -1, fmt.Errorf("git: > 31 bit offests not implemented. Meh")
- }
- return int64(offset), nil
- }
- func (pi *PackIndex) findSHA1(target SHA1) (int, error) {
- //s, e and midpoint are one-based indices,
- //where s is the index before interval and
- //e is the index of the last element in it
- //-> search interval is: (s | 1, 2, ... e]
- s, e := pi.FO.Bounds(target[0])
- //invariant: object is, if present, in the interval, (s, e]
- for s < e {
- midpoint := s + (e-s+1)/2
- var sha SHA1
- err := pi.ReadSHA1(&sha, midpoint-1)
- if err != nil {
- return 0, fmt.Errorf("git: io error: %v", err)
- }
- switch bytes.Compare(target[:], sha[:]) {
- case -1: // target < sha1, new interval (s, m-1]
- e = midpoint - 1
- case +1: //taget > sha1, new interval (m, e]
- s = midpoint
- default:
- return midpoint - 1, nil
- }
- }
- return 0, fmt.Errorf("git: sha1 not found in index")
- }
- //FindOffset tries to find object with the id target and if
- //if found returns the offset of the object in the pack file.
- //Returns an error that can be detected by os.IsNotExist if
- //the object could not be found.
- func (pi *PackIndex) FindOffset(target SHA1) (int64, error) {
- pos, err := pi.findSHA1(target)
- if err != nil {
- return 0, err
- }
- off, err := pi.ReadOffset(pos)
- if err != nil {
- return 0, err
- }
- return off, nil
- }
- //OpenPackFile opens the corresponding pack file.
- func (pi *PackIndex) OpenPackFile() (*PackFile, error) {
- f := pi.Name()
- pf, err := OpenPackFile(f[:len(f)-4] + ".pack")
- if err != nil {
- return nil, err
- }
- return pf, nil
- }
- //OpenObject will try to find the object with the given id
- //in it is index and then reach out to its corresponding
- //pack file to open the actual git Object.
- //If the object cannot be found it will return an error
- //the can be detected via os.IsNotExist()
- //Delta objects will returned as such and not be resolved.
- func (pi *PackIndex) OpenObject(id SHA1) (Object, error) {
- off, err := pi.FindOffset(id)
- if err != nil {
- return nil, err
- }
- pf, err := pi.OpenPackFile()
- if err != nil {
- return nil, err
- }
- obj, err := pf.readRawObject(off)
- if err != nil {
- return nil, err
- }
- if IsStandardObject(obj.otype) {
- return parseObject(obj)
- }
- if !IsDeltaObject(obj.otype) {
- return nil, fmt.Errorf("git: unsupported object")
- }
- //This is a delta object
- delta, err := parseDelta(obj)
- return delta, err
- }
- //OpenPackFile opens the git pack file at the given path
- //It will check the pack file header and version.
- //Currently only version 2 is supported.
- //NB: This is low-level API and should most likely
- //not be used directly.
- func OpenPackFile(path string) (*PackFile, error) {
- osfd, err := os.Open(path)
- if err != nil {
- return nil, err
- }
- var header PackHeader
- err = binary.Read(osfd, binary.BigEndian, &header)
- if err != nil {
- return nil, fmt.Errorf("git: could not read header: %v", err)
- }
- if string(header.Sig[:]) != "PACK" {
- return nil, fmt.Errorf("git: packfile signature error")
- }
- if header.Version != 2 {
- return nil, fmt.Errorf("git: unsupported packfile version")
- }
- fd := &PackFile{File: osfd,
- Version: header.Version,
- ObjCount: header.Objects}
- return fd, nil
- }
- func (pf *PackFile) readRawObject(offset int64) (gitObject, error) {
- r := newPackReader(pf, offset)
- b, err := r.ReadByte()
- if err != nil {
- return gitObject{}, fmt.Errorf("git: io error: %v", err)
- }
- //object header format:
- //[mxxx tttt] (byte)
- // tttt -> type [4 bit]
- otype := ObjectType((b & 0x70) >> 4)
- // xxx -> size [3 bit]
- size := int64(b & 0xF)
- // m -> 1, if size > 2^3 (n-byte encoding)
- if b&0x80 != 0 {
- s, err := readVarSize(r, 4)
- if err != nil {
- return gitObject{}, err
- }
- size += s
- }
- obj := gitObject{otype, size, r}
- if IsStandardObject(otype) {
- err = obj.wrapSourceWithDeflate()
- if err != nil {
- return gitObject{}, err
- }
- }
- return obj, nil
- }
- //OpenObject reads the git object header at offset and
- //then parses the data as the corresponding object type.
- func (pf *PackFile) OpenObject(offset int64) (Object, error) {
- obj, err := pf.readRawObject(offset)
- if err != nil {
- return nil, err
- }
- switch obj.otype {
- case ObjCommit:
- return parseCommit(obj)
- case ObjTree:
- return parseTree(obj)
- case ObjBlob:
- return parseBlob(obj)
- case ObjTag:
- return parseTag(obj)
- case ObjOFSDelta:
- fallthrough
- case ObjRefDelta:
- return parseDelta(obj)
- default:
- return nil, fmt.Errorf("git: unknown object type")
- }
- }
- type packReader struct {
- fd *PackFile
- start int64
- off int64
- }
- func newPackReader(fd *PackFile, offset int64) *packReader {
- return &packReader{fd: fd, start: offset, off: offset}
- }
- func (p *packReader) Read(d []byte) (n int, err error) {
- n, err = p.fd.ReadAt(d, p.off)
- p.off += int64(n)
- return
- }
- func (p *packReader) ReadByte() (c byte, err error) {
- var b [1]byte
- _, err = p.Read(b[:])
- c = b[0]
- return
- }
- func (p *packReader) Close() (err error) {
- return //noop
- }
|