summaryrefslogtreecommitdiff
path: root/internal/git/pack.go
blob: 02033d663465303850c19d89dcfb55c9e87ab1d4 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
package git

import (
	"bytes"
	"compress/zlib"
	"context"
	"crypto/sha1"
	"encoding/binary"
	"fmt"
	"io"
)

// GitStorage is the interface for storage backends that can provide Git objects.
type GitStorage interface {
	// GetObject returns the stored bytes of the object identified by objectID
	// in repo. GeneratePack hands the result to ParseGitObject together with
	// the same object ID.
	GetObject(ctx context.Context, repo, objectID string) ([]byte, error)
	// GetReachableObjects returns the IDs of the objects that should go into
	// a pack for the given wants and haves.
	// NOTE(review): presumably "reachable from wants but not from haves";
	// confirm against the implementations.
	GetReachableObjects(ctx context.Context, repo string, wants []string, haves []string) ([]string, error)
}

// PackGenerator builds Git packfiles from objects obtained through a
// GitStorage backend.
type PackGenerator struct {
	// storage is queried for the object IDs to pack and for each object's data.
	storage GitStorage
}

// NewPackGenerator returns a PackGenerator that reads its objects from storage.
func NewPackGenerator(storage GitStorage) *PackGenerator {
	pg := new(PackGenerator)
	pg.storage = storage
	return pg
}

// GeneratePack builds a packfile for repo out of the objects the storage
// backend reports for the given wants and haves.
//
// When the backend reports no objects, a pack with an object count of zero is
// returned. A failure to list, read or parse any object aborts generation and
// is returned wrapped; no partial pack is produced.
func (pg *PackGenerator) GeneratePack(ctx context.Context, repo string, wants []string, haves []string) ([]byte, error) {
	ids, err := pg.storage.GetReachableObjects(ctx, repo, wants, haves)
	switch {
	case err != nil:
		return nil, fmt.Errorf("failed to get reachable objects: %w", err)
	case len(ids) == 0:
		// Nothing to send: hand back a header-only pack.
		return pg.generateEmptyPack(), nil
	}

	// Load and parse every listed object, preserving the backend's order.
	parsed := make([]*GitObject, 0, len(ids))
	for i := range ids {
		id := ids[i]

		raw, readErr := pg.storage.GetObject(ctx, repo, id)
		if readErr != nil {
			return nil, fmt.Errorf("failed to read required object %s: %w", id, readErr)
		}

		obj, parseErr := ParseGitObject(raw, id)
		if parseErr != nil {
			return nil, fmt.Errorf("failed to parse required object %s: %w", id, parseErr)
		}

		parsed = append(parsed, obj)
	}

	return pg.generatePackFromObjects(parsed)
}

// generateEmptyPack returns a version-2 packfile that contains no objects:
// the 12-byte header followed by the SHA-1 of that header.
func (pg *PackGenerator) generateEmptyPack() []byte {
	pack := []byte{
		// Signature.
		'P', 'A', 'C', 'K',
		// Version 2 as a big-endian uint32.
		0, 0, 0, 2,
		// Object count 0 as a big-endian uint32.
		0, 0, 0, 0,
	}

	// The trailer is the SHA-1 of everything written so far; Sum appends the
	// digest to the slice it is given.
	digest := sha1.New()
	digest.Write(pack)
	return digest.Sum(pack)
}

// generatePackFromObjects serializes objects into a version-2 packfile:
// a 12-byte header ("PACK", version, object count), one entry per object in
// slice order, and a trailing SHA-1 over all preceding bytes.
//
// It returns a wrapped error naming the object's SHA if an entry cannot be
// written.
func (pg *PackGenerator) generatePackFromObjects(objects []*GitObject) ([]byte, error) {
	var header [12]byte
	copy(header[:4], "PACK")
	binary.BigEndian.PutUint32(header[4:8], 2)
	binary.BigEndian.PutUint32(header[8:12], uint32(len(objects)))

	var pack bytes.Buffer
	pack.Write(header[:])

	for _, o := range objects {
		if err := pg.writePackObject(&pack, o); err != nil {
			return nil, fmt.Errorf("failed to write object %s: %w", o.SHA, err)
		}
	}

	// The trailer is the SHA-1 of the header plus all entries; Sum appends
	// the digest to the slice it is given.
	digest := sha1.New()
	digest.Write(pack.Bytes())
	return digest.Sum(pack.Bytes()), nil
}

// writePackObject appends one undeltified pack entry for obj to buf.
//
// A pack entry consists of the variable-length type/size header followed by
// the zlib-deflated object content. Unlike a loose object, the deflated
// stream must NOT start with the "<type> <size>\x00" prefix, and the size in
// the entry header is the inflated length of the content alone. Including
// the loose-object prefix makes readers see a wrong size and hash a wrong
// payload.
//
// The header size is taken from len(obj.Data) so that it always matches the
// bytes that are actually deflated; obj.Size is not consulted.
//
// An error is returned if compression fails or obj.Type is not a type that
// writePackObjectHeader can encode. On error nothing is appended to buf.
func (pg *PackGenerator) writePackObject(buf *bytes.Buffer, obj *GitObject) error {
	// Deflate into a scratch buffer first so that a failure cannot leave a
	// half-written entry in buf.
	var deflated bytes.Buffer
	zw := zlib.NewWriter(&deflated)
	if _, err := zw.Write(obj.Data); err != nil {
		return err
	}
	// Close flushes the remaining compressed bytes and the zlib checksum.
	if err := zw.Close(); err != nil {
		return err
	}

	// Entry header: object type plus the uncompressed content length.
	if err := pg.writePackObjectHeader(buf, obj.Type, int64(len(obj.Data))); err != nil {
		return err
	}

	buf.Write(deflated.Bytes())
	return nil
}

// writePackObjectHeader appends the variable-length entry header for an
// object of the given type and size to buf.
//
// Layout:
//
//	first byte:      M TTT SSSS  (M = continuation flag, TTT = type code,
//	                              SSSS = lowest 4 bits of size)
//	following bytes: M SSSSSSS   (next 7 bits of size each, least
//	                              significant group first)
//
// It returns an error, without writing anything, when objType is not commit,
// tree, blob or tag.
func (pg *PackGenerator) writePackObjectHeader(buf *bytes.Buffer, objType ObjectType, size int64) error {
	var code uint8
	switch objType {
	case ObjectTypeCommit:
		code = 1
	case ObjectTypeTree:
		code = 2
	case ObjectTypeBlob:
		code = 3
	case ObjectTypeTag:
		code = 4
	default:
		return fmt.Errorf("unsupported object type: %s", objType)
	}

	// Assemble the header in a scratch slice and emit it in one write.
	// 4 + 9*7 bits cover every positive int64, hence at most 10 bytes.
	header := make([]byte, 0, 10)

	lead := (code << 4) | uint8(size&0x0F)
	remaining := size >> 4
	if remaining > 0 {
		lead |= 0x80 // more size bytes follow
	}
	header = append(header, lead)

	for remaining > 0 {
		group := uint8(remaining & 0x7F)
		remaining >>= 7
		if remaining > 0 {
			group |= 0x80 // more size bytes follow
		}
		header = append(header, group)
	}

	buf.Write(header)
	return nil
}

// PackWriter writes pack data and control lines to an underlying io.Writer
// using Git pkt-line framing.
type PackWriter struct {
	writer io.Writer
}

// NewPackWriter returns a PackWriter that writes to w.
func NewPackWriter(w io.Writer) *PackWriter {
	return &PackWriter{writer: w}
}

// WritePacketLine writes data as one pkt-line: a four-digit lowercase hex
// length (payload length plus the four prefix bytes) followed by the payload.
//
// A pkt-line may be at most 65520 bytes including its prefix, and the prefix
// is exactly four hex digits wide. A larger payload would produce a wider
// prefix and desynchronize the reader, so it is rejected with an error and
// nothing is written.
func (pw *PackWriter) WritePacketLine(data string) error {
	const (
		prefixLen  = 4
		maxPktLine = 65520
		maxPayload = maxPktLine - prefixLen
	)

	if len(data) > maxPayload {
		return fmt.Errorf("pkt-line payload too large: %d bytes (max %d)", len(data), maxPayload)
	}

	_, err := fmt.Fprintf(pw.writer, "%04x%s", len(data)+prefixLen, data)
	return err
}

// WriteFlush writes the flush packet "0000".
func (pw *PackWriter) WriteFlush() error {
	_, err := pw.writer.Write([]byte("0000"))
	return err
}

// WritePack writes packData as a sequence of side-band packets on band 1.
//
// Each packet is a four-digit hex length, the band byte 0x01 and up to 65515
// bytes of pack data, so that no packet exceeds 65520 bytes in total. Empty
// packData writes nothing. The first write error stops the transfer and is
// returned; packets already written are not rolled back.
func (pw *PackWriter) WritePack(packData []byte) error {
	// Largest payload that fits next to the 4-byte length and 1-byte band.
	const maxPacketSize = 65515

	for len(packData) > 0 {
		chunkSize := len(packData)
		if chunkSize > maxPacketSize {
			chunkSize = maxPacketSize
		}

		chunk := packData[:chunkSize]
		packData = packData[chunkSize:]

		// Length covers the prefix itself, the band byte and the payload.
		length := len(chunk) + 5
		if _, err := fmt.Fprintf(pw.writer, "%04x\x01", length); err != nil {
			return err
		}

		if _, err := pw.writer.Write(chunk); err != nil {
			return err
		}
	}

	return nil
}