1 const std = @import("std");
3 const Alloc = std.mem.Allocator;
4 const Reader = std.io.AnyReader;
5 const Writer = std.io.AnyWriter;
// Presumably a file-size cap in bytes (1024 * 1024); no use of it is visible in this excerpt.
7 const MaxFileSize = 1024 * 1024;
// Parsed commit object. `Object.parse` fills `tree`, `parent`, `author`, `committer` and
// `message`; the field declarations themselves are not visible in this excerpt.
10 const Commit = struct {
// One row of a tree object. `Object.parse` fills `permissions`, `name` and `id`;
// the field declarations themselves are not visible in this excerpt.
17 const TreeEntry = struct {
// A tree is a growable list of entries backed by an allocator.
// NOTE(review): whoever receives a `Tree` presumably has to `deinit` it — confirm against callers.
22 const Tree = std.ArrayList(TreeEntry);
// A git object as read from a pack: a 3-bit `kind` and the payload bytes in `data`
// (both are read by `parse` and by the tests). Field declarations are not visible here.
26 const Object = struct {
// Builds an `Object` from a kind and its payload bytes. The body is not visible in this
// excerpt. NOTE(review): presumably stores `data` without copying — confirm.
30 pub fn init(kind: u3, data: []u8) Object {
// Interprets `self.data` according to the object kind and returns a commit, a tree or a blob.
//
// The `switch` head and its arm labels are not visible in this excerpt, so which kind value
// selects which branch cannot be confirmed from here.
//
// All text fields of the result (`author`, `committer`, `message`, `permissions`, `name`, blob
// `data`) are slices into `self.data`; they are only valid while that buffer is alive.
//
// Errors visible here: `error.InvalidCommitFormat`, `error.InvalidTreeFormat`,
// `error.TagNotImplemented`, `error.UnknownGitObjectType`, plus `std.fmt.parseUnsigned` errors.
36 pub fn parse(self: Object, alloc: Alloc) !union(enum) { c: Commit, t: Tree, b: Blob } {
// Commit: find the first "author " / "committer " text and the newline ending each line.
39 const authorOffset = std.mem.indexOf(u8, self.data, "author ") orelse return error.InvalidCommitFormat;
40 const authorNewline = std.mem.indexOfScalarPos(u8, self.data, authorOffset, '\n') orelse return error.InvalidCommitFormat;
41 const committerOffset = std.mem.indexOf(u8, self.data, "committer ") orelse return error.InvalidCommitFormat;
42 const committerNewline = std.mem.indexOfScalarPos(u8, self.data, committerOffset, '\n') orelse return error.InvalidCommitFormat;
// Bytes 5..45 are read as the 40 hex digits that follow a 5-byte prefix (presumably "tree ").
46 .tree = try std.fmt.parseUnsigned(Id, self.data[5..45], 16),
// NOTE(review): the parent id is taken from the fixed range 53..93. That only lines up when
// the second line is exactly one "parent <40 hex>" line; a commit with no parent line or with
// a payload shorter than 93 bytes would parse the wrong bytes or slice out of bounds — confirm.
47 .parent = try std.fmt.parseUnsigned(Id, self.data[53..93], 16),
// Both slices start at the keyword itself, so they include the leading "author " / "committer ".
48 .author = self.data[authorOffset..authorNewline],
49 .committer = self.data[committerOffset..committerNewline],
// Everything after the committer line's newline, up to the end of the payload.
50 .message = self.data[committerNewline + 1 .. self.data.len],
// Tree: entries are appended to a list allocated from `alloc`.
// NOTE(review): no `errdefer t.deinit()` is visible; if one of the error returns below fires
// after entries were appended, the list would leak — check the lines omitted from this excerpt.
55 var t = Tree.init(alloc);
57 var offset: usize = 0;
// NOTE(review): `self.data.len - 1` is unsigned arithmetic and underflows when `data` is empty.
59 while (offset < self.data.len - 1) {
// Each entry is read as: text up to a space, text up to a zero byte, then 20 raw id bytes.
60 const spaceOffset = std.mem.indexOfScalarPos(u8, self.data, offset, ' ') orelse return error.InvalidTreeFormat;
61 const zeroOffset = std.mem.indexOfScalarPos(u8, self.data, spaceOffset, 0) orelse return error.InvalidTreeFormat;
64 .permissions = self.data[offset..spaceOffset],
65 .name = self.data[spaceOffset + 1 .. zeroOffset],
// The 20 bytes after the terminator are read as one big-endian integer.
// NOTE(review): nothing visible checks that `zeroOffset + 21 <= self.data.len` before slicing.
66 .id = std.mem.readVarInt(Id, self.data[zeroOffset + 1 .. zeroOffset + 21], .big),
// Skip the terminator plus the 20 id bytes to reach the next entry.
69 offset = zeroOffset + 21;
// Blob: the payload is handed through unchanged (not copied).
76 .b = Blob{ .data = self.data },
80 return error.TagNotImplemented;
82 else => return error.UnknownGitObjectType,
85 // pub fn getCommit(self: *Object) Commit {}
86 // pub fn getBlob(self: *Object) Blob {}
/// Inflates the zlib stream read from `r` and returns the decompressed bytes.
///
/// The returned slice is allocated with `alloc`; the caller owns it and must free it
/// with the same allocator. On any error the intermediate buffer is released before
/// the error is returned, so nothing leaks on a corrupt or truncated stream.
fn decompress(alloc: Alloc, r: Reader) ![]u8 {
    var buffer = std.ArrayList(u8).init(alloc);
    // Without this, a decompression failure (or a failed shrink below) would leak
    // everything inflated so far.
    errdefer buffer.deinit();

    // Keep the writer in a named local: the type-erased writer refers back to it,
    // so it has to stay alive for the duration of the call.
    const buffer_writer = buffer.writer();
    try std.compress.zlib.decompress(r, buffer_writer.any());

    // Shrinks the allocation to the used length and transfers ownership to the caller.
    return buffer.toOwnedSlice();
}
// One pack (`.pack`) together with its index (`.idx`). Other fields used by the methods
// (`alloc`, `idxFile`) are declared on lines not visible in this excerpt.
97 const PackFile = struct {
// Handle to the pack data file; opened in `open`, closed in `close`.
100 pckFile: std.fs.File,
// Object id -> byte offset of that object inside the pack file. Filled by `parseIndex`.
// NOTE(review): offsets are stored as u32 — confirm packs beyond that range are out of scope.
101 objectOffsets: std.AutoArrayHashMap(Id, u32),
// Looks for an index file in `objects/pack` below `dir`, opens it together with the
// matching pack file and loads the index into `objectOffsets`.
//
// Returns an optional; the statements that produce the final value (including the `null`
// case) are not visible in this excerpt.
// Errors: anything from opening/iterating the directory, opening the files, or `parseIndex`.
103 pub fn open(alloc: Alloc, dir: std.fs.Dir) !?PackFile {
// File handles start out undefined and are only assigned once an index file is found.
106 .idxFile = undefined,
107 .pckFile = undefined,
108 .objectOffsets = std.AutoArrayHashMap(Id, u32).init(alloc),
111 var packDir = try dir.openDir("objects/pack", .{ .iterate = true });
112 defer packDir.close();
114 var packFileFound = false;
116 var packIt = packDir.iterate();
117 while (try packIt.next()) |f| {
118 if (std.mem.endsWith(u8, f.name, ".idx")) {
119 const idxFilename = f.name;
// Stack buffer for the pack file name, which is derived from the index name with its
// last four bytes (".idx") removed. The format string itself is on an omitted line.
120 var pckFilename = try std.BoundedArray(u8, std.fs.max_path_bytes).init(0);
122 pckFilename.writer(),
124 .{idxFilename[0 .. idxFilename.len - 4]},
// NOTE(review): if the directory holds more than one `.idx` and the loop does not stop
// after the first match, these assignments overwrite handles that were never closed.
// NOTE(review): no `errdefer` is visible; a failure in the second `openFile` or in
// `parseIndex` would leave already-opened files and the map unreleased — confirm.
127 self.idxFile = try packDir.openFile(idxFilename, .{});
128 self.pckFile = try packDir.openFile(pckFilename.constSlice(), .{});
130 try self.parseIndex();
132 packFileFound = true;
// Releases the offset map and closes both file handles. The `PackFile` must not be
// used afterwards.
142 pub fn close(self: *PackFile) void {
143 self.objectOffsets.deinit();
144 self.idxFile.close();
145 self.pckFile.close();
// Reads the index file and fills `objectOffsets` with every object id and its pack offset.
//
// The byte positions used below (8-byte header, 256 four-byte fan-out entries, then 20-byte
// ids, then a further 4 bytes per object, then 4-byte offsets) are consistent with the
// version-2 pack index layout. NOTE(review): no header or version check is visible — confirm.
// Several loop heads are on lines omitted from this excerpt.
148 pub fn parseIndex(self: *PackFile) !void {
// NOTE(review): `.any()` is called on the temporary returned by `reader()`; confirm the
// type-erased reader does not keep a pointer into that temporary.
149 const idxReader = self.idxFile.reader().any();
151 var fanoutTable: [256]u32 = undefined;
// Fan-out entry `i` lives at byte 8 + i * 4 and is a big-endian u32.
154 try self.idxFile.seekTo(8 + i * 4);
155 fanoutTable[i] = try idxReader.readVarInt(u32, .big, 4);
// Fan-out entries are cumulative, so the count for bucket `i` is the difference
// from the previous entry.
158 if (i > 0) fanoutTable[i] - fanoutTable[i - 1] else fanoutTable[i];
160 for (0..numObjects) |j| {
// Position of the id: header + fan-out table + 20 bytes per preceding id.
162 4 + 4 + 4 * 256 + (j + if (i > 0) fanoutTable[i - 1] else 0) * 20;
163 try self.idxFile.seekTo(idOffset);
164 const id = try idxReader.readVarInt(Id, .big, 20);
// Insert with a placeholder offset; the real value is written in the second pass below.
166 try self.objectOffsets.put(id, 0);
170 const numObjects = self.objectOffsets.keys().len;
171 for (0..numObjects) |i| {
// Offsets start after the ids (20 bytes each) and one more 4-byte value per object.
173 4 + 4 + 4 * 256 + numObjects * (20 + 4) + i * 4;
174 try self.idxFile.seekTo(offsetOffset);
// NOTE(review): the value is stored as read; in a version-2 index a set top bit marks an
// entry in a separate 8-byte offset table — confirm large packs are out of scope.
175 const offset = try idxReader.readVarInt(u32, .big, 4);
// Relies on the map's value slot `i` belonging to the i-th inserted id, i.e. on ids
// having been inserted in index order above.
177 self.objectOffsets.values()[i] = offset;
// Decodes a variable-length size from `reader`, one byte at a time, stopping at the first
// byte whose top bit is clear. Returns the decoded `size` and the number of bytes consumed
// (`bytelen`).
//
// With `ignoreTypeBits` set, only the low 4 bits of one byte are used (the branch structure
// suggests this is the first byte) and later bytes are shifted by an extra 4 bits; otherwise
// every byte contributes 7 bits. The loop head, the declarations of `size` and `counter`,
// and the return statement are on lines omitted from this excerpt.
181 fn getSize(reader: Reader, ignoreTypeBits: bool) !struct { size: u64, bytelen: u64 } {
185 const byte = try reader.readByte();
188 if (ignoreTypeBits) {
// Low nibble only: the upper bits of this byte are not part of the size.
189 const bits: u4 = @truncate(byte);
192 const bits: u7 = @truncate(byte);
196 if (ignoreTypeBits) {
197 const bits: u7 = @truncate(byte);
// 4 bits came from the first byte, 7 from each byte after it.
198 size += @as(u64, bits) << (7 * (counter - 1) + 4);
200 const bits: u7 = @truncate(byte);
201 size += @as(u64, bits) << (7 * (counter));
// A clear top bit marks the last byte of the encoding.
205 if (byte & 0b10000000 == 0) {
212 const nBytes = counter + 1;
// Decodes a variable-length offset from `reader`: the low 7 bits of each byte are
// accumulated until a byte with a clear top bit is read. Returns the decoded `offset`
// and the number of bytes consumed (`bytelen`).
//
// The loop head, the declarations of `offset` and `counter`, any shifting of `offset`
// between bytes, and the return statement are on lines omitted from this excerpt.
220 fn getOffset(reader: Reader) !struct { offset: u64, bytelen: u64 } {
224 const byte = try reader.readByte();
226 const bits: u7 = @truncate(byte);
228 offset += @as(u64, bits);
// A clear top bit marks the last byte of the encoding.
230 if (byte & 0b10000000 == 0) {
237 const nBytes = counter + 1;
// Adds 2^(7*i) for every byte after the first. NOTE(review): this looks like the bias
// git's offset encoding applies per continuation byte — confirm against the pack format.
240 for (1..nBytes) |i| {
241 offset += std.math.pow(u64, 2, 7 * i);
// Rebuilds an object from `baseData` and the delta instructions in `deltData`.
//
// `deltData` starts with two variable-length sizes (base size, result size) followed by
// instructions. An instruction byte with the top bit set copies a range out of `baseData`;
// otherwise its low 7 bits give the number of literal bytes that follow in `deltData`.
// The result buffer is allocated from `alloc`. NOTE(review): presumably returned to the
// caller, who then owns it — the return statement is not visible here.
//
// The main loop head and the `bitsSet` / `counter` bookkeeping are on omitted lines.
// NOTE(review): no `errdefer alloc.free(result)` is visible, and the decoded base size is
// not compared with `baseData.len` anywhere in the visible lines — confirm.
250 fn applyDelta(alloc: Alloc, baseData: []const u8, deltData: []const u8) ![]u8 {
251 var fbs = std.io.fixedBufferStream(deltData);
252 const deltDataReader = fbs.reader().any();
253 const baseObjectSize = try getSize(deltDataReader, false);
254 const resultObjectSize = try getSize(deltDataReader, false);
// Instructions begin right after the two size headers.
255 const deltaDataOffset = baseObjectSize.bytelen + resultObjectSize.bytelen;
257 const result = try alloc.alloc(u8, resultObjectSize.size);
258 var resultCounter: u64 = 0;
260 var counter: u64 = 0;
262 const b = deltData[deltaDataOffset + counter];
// Top bit set: copy-from-base instruction.
264 if (b & 0b10000000 != 0) {
265 var dataOffset: u64 = 0;
266 var dataSize: u64 = 0;
// Bits 0..3 of `b` each announce one following byte of the little-endian base offset.
// The `@min` calls cap the loop index at its largest possible value and do not change
// the result.
268 for (0..4) |i| { // offset bits
269 if (b & (@as(u64, 1) << @min(3, i)) != 0) {
270 dataOffset += @as(u64, deltData[deltaDataOffset + counter + 1 + bitsSet]) << @min(3 * 8, i * 8);
// Bits 4..6 of `b` each announce one following byte of the little-endian copy length.
// NOTE(review): in git's delta format a copy length of zero stands for 0x10000; no such
// handling is visible here — confirm on the omitted lines.
274 for (4..7) |i| { // size bits
275 if (b & (@as(u64, 1) << @min(6, i)) != 0) {
276 dataSize += @as(u64, deltData[deltaDataOffset + counter + 1 + bitsSet]) << @min(6 * 8, (i - 4) * 8);
282 std.mem.copyForwards(
284 result[resultCounter..result.len],
285 baseData[dataOffset .. dataOffset + dataSize],
288 resultCounter += dataSize;
// Top bit clear: the low 7 bits are the count of literal bytes to append.
290 const dataSize: u7 = @truncate(b);
292 std.mem.copyForwards(
294 result[resultCounter..result.len],
295 deltData[deltaDataOffset + counter + 1 .. deltaDataOffset + counter + 1 + dataSize],
297 resultCounter += dataSize;
// End-of-instructions check (the statement it guards is on an omitted line).
302 if (deltaDataOffset + counter >= deltData.len)
// Resolves an offset-delta object. The pack file position must be at the start of the
// compressed delta data when this is called; `offset` is how far to seek backwards from
// that position to reach the base object.
//
// Steps: remember the current position, seek back and read the base object (which may
// itself be a delta), return to the remembered position, inflate the delta and apply it.
// The result keeps the base object's kind. The caller owns `data` of the returned object;
// the base object's data and the inflated delta are freed here.
309 fn ofsDelta(self: *PackFile, offset: i64) anyerror!Object {
// NOTE(review): `.any()` is called on the temporary returned by `reader()`; confirm the
// type-erased reader does not keep a pointer into that temporary.
310 const pckReader = self.pckFile.reader().any();
312 const pos = try self.pckFile.getPos();
314 try self.pckFile.seekBy(-offset);
315 const baseObject = try self.readObject(pckReader);
316 defer self.alloc.free(baseObject.data);
// Reading the base moved the file position; go back to the delta data.
318 try self.pckFile.seekTo(pos);
319 const deltaData = try decompress(self.alloc, pckReader);
320 defer self.alloc.free(deltaData);
322 const objectData = try applyDelta(self.alloc, baseObject.data, deltaData);
323 return Object.init(baseObject.kind, objectData);
// Reads one object starting at the pack file's current position.
//
// The object kind is taken from bits 4..6 of the first byte. Kind 6 is resolved as an
// offset delta via `ofsDelta`; every other kind is inflated directly. The caller owns
// `data` of the returned object.
// NOTE(review): `reader` is expected to read from `self.pckFile` — the `seekBy(-1)` below
// only rewinds it in that case.
// NOTE(review): git's pack format also defines kind 7 (delta addressed by base id); here
// it would reach the plain `decompress` path — confirm whether that is intended.
326 fn readObject(self: *PackFile, reader: Reader) anyerror!Object {
327 const firstByte = try reader.readByte();
328 const objectKind: u3 = @truncate(firstByte >> 4);
// Un-read the first byte so `getSize` sees the whole header.
329 try self.pckFile.seekBy(-1);
330 const objectSize = try getSize(reader, true);
332 if (objectKind == 6) {
333 const offset = try getOffset(reader);
334 return try self.ofsDelta(
// The encoded distance is measured from the start of this object's header, but the file
// position is now past the size and offset bytes, so their lengths are added.
335 @intCast(offset.offset + objectSize.bytelen + offset.bytelen),
338 const objectData = try decompress(self.alloc, reader);
339 return Object.init(objectKind, objectData);
// Looks `id` up in the loaded index and, when present, seeks to its offset in the pack
// file and reads the object there. The caller owns `data` of the returned object.
// The path taken when `id` is not in the index is on lines omitted from this excerpt.
343 pub fn getObject(self: *PackFile, id: Id) !?Object {
344 if (self.objectOffsets.get(id)) |offset| {
345 const pckReader = self.pckFile.reader().any();
346 try self.pckFile.seekTo(offset);
348 return try self.readObject(pckReader);
// A git repository opened from its git directory. Fields used by the methods (`alloc`,
// `dir`, `packfile`) are declared on lines not visible in this excerpt.
354 const Repo = struct {
// Opens the directory at `path` (relative to the current working directory) and tries to
// open a pack file inside it. `packfile` is optional, so a repository may have none.
// NOTE(review): no `errdefer` closing `dir` is visible; if `PackFile.open` fails the
// directory handle may stay open — check the omitted lines.
359 pub fn open(alloc: Alloc, path: []const u8) !Repo {
360 const dir = try std.fs.cwd().openDir(path, .{});
362 const packfile = try PackFile.open(alloc, dir);
367 .packfile = packfile,
// Releases the repository's resources. Only the pack file part is visible in this
// excerpt: it is closed when one was opened.
371 pub fn close(self: *Repo) void {
373 if (self.packfile != null) {
374 self.packfile.?.close();
/// Resolves `HEAD` to the object id it currently names.
///
/// `HEAD` is read from `self.dir`. When it holds a symbolic ref (`ref: <path>`), the file
/// at `<path>` is read and its contents are parsed as a hexadecimal id. Otherwise the
/// contents of `HEAD` itself are parsed as a hexadecimal id (detached HEAD).
///
/// Errors: any error from reading the files, `error.InvalidHead` when a symbolic ref has
/// an empty target, and the `std.fmt.parseUnsigned` errors for malformed ids. Only the
/// ref's own file is consulted; no other ref storage is read.
pub fn getHead(self: *Repo) !Id {
    // read HEAD
    const head = try self.dir.readFileAlloc(self.alloc, "HEAD", 1024);
    defer self.alloc.free(head);

    // Trim surrounding whitespace instead of assuming exactly one trailing byte, so an
    // empty, short or CRLF-terminated file cannot slice out of bounds.
    const trimmed = std.mem.trim(u8, head, " \t\r\n");

    const ref_prefix = "ref: ";
    if (!std.mem.startsWith(u8, trimmed, ref_prefix)) {
        // Detached HEAD: the file holds the id itself.
        return try std.fmt.parseUnsigned(u160, trimmed, 16);
    }

    // read file pointed at by HEAD
    const headPath = std.mem.trim(u8, trimmed[ref_prefix.len..], " \t");
    if (headPath.len == 0) return error.InvalidHead;

    // Sized for the 40 hex digits of an id; a trailing newline is simply not read.
    var idBuffer: [40]u8 = undefined;
    const idStr = try self.dir.readFile(headPath, &idBuffer);

    // parse id from file
    return try std.fmt.parseUnsigned(u160, std.mem.trim(u8, idStr, " \t\r\n"), 16);
}
// Fetches the object with the given id. When a pack file is open the lookup is delegated
// to it; what happens otherwise is on lines omitted from this excerpt.
// The caller owns `data` of a returned object.
392 pub fn getObject(self: *Repo, id: Id) !?Object {
393 if (self.packfile) |*packfile| {
394 return packfile.getObject(id);
// Test body (its `test` header is not visible in this excerpt): resolves HEAD and prints it.
// Needs a git directory at ../imgui/.git relative to the working directory; the `try`
// fails the test when it is absent.
401 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
404 const head = try repo.getHead();
406 std.debug.print("HEAD: {}\n", .{head});
// Test body (its `test` header is not visible in this excerpt): prints how many ids and how
// many offsets were loaded from the pack index. Needs a git directory at ../imgui/.git.
410 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
413 if (repo.packfile) |packfile| {
414 std.debug.print("{}\n", .{packfile.objectOffsets.keys().len});
415 std.debug.print("{}\n", .{packfile.objectOffsets.values().len});
// Test body (its `test` header is not visible in this excerpt): fetches the object HEAD
// points at and prints its kind and raw payload. Needs a git directory at ../imgui/.git.
420 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
423 const head = try repo.getHead();
425 if (try repo.getObject(head)) |o| {
// The object's payload is owned by the caller and freed with the allocator given to `Repo.open`.
426 defer std.testing.allocator.free(o.data);
428 std.debug.print("object({}): {s}\n", .{ o.kind, o.data });
// Fetches the object HEAD points at, parses it and prints the commit's fields.
// Needs a git directory at ../imgui/.git relative to the working directory.
432 test "parse commit" {
433 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
436 const head = try repo.getHead();
438 if (try repo.getObject(head)) |o| {
// The parsed commit borrows from `o.data`, so it must be used before this free runs.
439 defer std.testing.allocator.free(o.data);
441 switch (try o.parse(std.testing.allocator)) {
443 std.debug.print("commit:\n tree: {x}\n parent: {x}\n author: {s}\n committer: {s}\n message: {s}\n", .{ c.tree, c.parent, c.author, c.committer, c.message });
// Test body (its `test` header is not visible in this excerpt): fetches one object by a
// hard-coded id. The id only exists in one particular repository, so this depends on the
// exact contents of ../imgui/.git.
451 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
454 if (try repo.getObject(0xceb2b2c62d6f8f3686dcacecd5be931839b02c77)) |o| {
455 defer std.testing.allocator.free(o.data);
457 // std.debug.print("tree({}): {any}\n", .{ o.kind, o.data });
// Test body (its `test` header is not visible in this excerpt): fetches one object by a
// hard-coded id, parses it and prints every tree entry. Depends on the exact contents of
// ../imgui/.git.
462 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
465 if (try repo.getObject(0xceb2b2c62d6f8f3686dcacecd5be931839b02c77)) |o| {
466 defer std.testing.allocator.free(o.data);
// NOTE(review): a parsed tree is an allocator-backed list; confirm it is released on the
// lines omitted here, otherwise the testing allocator would report a leak.
468 switch (try o.parse(std.testing.allocator)) {
471 for (t.items) |treeEntry| {
472 std.debug.print("{s} {s} {x}\n", .{ treeEntry.permissions, treeEntry.name, treeEntry.id });
// Starting from HEAD, fetches and prints commits. How `id` advances from one commit to the
// next is on lines omitted from this excerpt.
// Needs a git directory at ../imgui/.git relative to the working directory.
480 test "list commits" {
481 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
484 const head = try repo.getHead();
489 if (try repo.getObject(id)) |o| {
// The parsed commit borrows from `o.data`, so it must be used before this free runs.
490 defer std.testing.allocator.free(o.data);
492 switch (try o.parse(std.testing.allocator)) {
494 std.debug.print("commit {x}:\n tree: {x}\n parent: {x}\n author: {s}\n committer: {s}\n message: {s}\n", .{ id, c.tree, c.parent, c.author, c.committer, c.message });
// Test body (its `test` header is not visible in this excerpt): parses one hard-coded
// object as a tree, fetches the object behind every entry and prints either the start of
// its contents or just its name. Depends on the exact contents of ../imgui/.git.
504 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
507 if (try repo.getObject(0xceb2b2c62d6f8f3686dcacecd5be931839b02c77)) |o| {
508 defer std.testing.allocator.free(o.data);
// NOTE(review): a parsed tree is an allocator-backed list; confirm it is released on the
// lines omitted here, otherwise the testing allocator would report a leak.
510 switch (try o.parse(std.testing.allocator)) {
513 for (t.items) |treeEntry| {
514 if (try repo.getObject(treeEntry.id)) |bo| {
515 defer std.testing.allocator.free(bo.data);
// Entries whose mode text is six characters long get their contents printed; all others
// are printed as a bracketed name. NOTE(review): presumably files versus directories.
517 if (treeEntry.permissions.len == 6) {
// NOTE(review): `bo.data[0..50]` slices out of bounds for any object shorter than 50 bytes.
518 std.debug.print("{s}: {s}\n", .{ treeEntry.name, bo.data[0..50] });
520 std.debug.print("[{s}]\n", .{treeEntry.name});