1 const std = @import("std");
3 const Alloc = std.mem.Allocator;
4 const Reader = std.io.AnyReader;
5 const Writer = std.io.AnyWriter;
// Size constant equal to 1024 * 1024 bytes (1 MiB); the name suggests an upper bound for file reads.
// NOTE(review): nothing in the visible part of this file references it — confirm it is still used.
7 const MaxFileSize = 1024 * 1024;
// A parsed commit object. The field declarations are not visible in this excerpt;
// Object.parse populates .tree, .parent, .author, .committer and .message.
// NOTE(review): .author, .committer and .message are assigned sub-slices of the object's
// data buffer, so a Commit presumably must not outlive that buffer — confirm ownership.
10 const Commit = struct {
// One entry of a tree object. The field declarations are not visible in this excerpt;
// Object.parse fills .permissions and .name (both slices into the object data) and .id.
17 const TreeEntry = struct {
// Growable list of tree entries; Object.parse creates one with Tree.init(alloc).
22 const Tree = std.ArrayList(TreeEntry);
// A git object as read from storage. Code elsewhere in this file reads its `.kind` and
// `.data` members (the field declarations themselves are not visible in this excerpt).
26 const Object = struct {
// Builds an Object from a 3-bit kind and its data bytes (body not visible here).
30 pub fn init(kind: u3, data: []u8) Object {
// Interprets the object's data and returns a tagged union: .c (commit), .t (tree) or .b (blob).
// The dispatch on the object kind happens in lines not shown here. Visible error exits:
// InvalidCommitFormat, InvalidTreeFormat, TagNotImplemented, UnknownGitObjectType, plus
// whatever std.fmt.parseUnsigned returns for malformed hex.
// `alloc` is used for the Tree list in the tree case.
36 pub fn parse(self: Object, alloc: Alloc) !union(enum) { c: Commit, t: Tree, b: Blob } {
// --- commit case ---
// Find the "author " and "committer " headers and the newline that ends each of them.
// indexOf returns the first occurrence anywhere in the data; it is not anchored to a line start.
39 const authorOffset = std.mem.indexOf(u8, self.data, "author ") orelse return error.InvalidCommitFormat;
40 const authorNewline = std.mem.indexOfScalarPos(u8, self.data, authorOffset, '\n') orelse return error.InvalidCommitFormat;
41 const committerOffset = std.mem.indexOf(u8, self.data, "committer ") orelse return error.InvalidCommitFormat;
42 const committerNewline = std.mem.indexOfScalarPos(u8, self.data, committerOffset, '\n') orelse return error.InvalidCommitFormat;
// Tree id: 40 hex digits at bytes 5..45, i.e. after a 5-byte prefix (presumably "tree ").
46 .tree = try std.fmt.parseUnsigned(Id, self.data[5..45], 16),
// NOTE(review): the parent id is read from the fixed byte range 53..93. That only holds when
// the second line is a single "parent <40 hex>" line; a commit without a parent line would
// presumably make parseUnsigned fail, and data shorter than 93 bytes makes the slice
// out of bounds — confirm how such commits should be handled.
47 .parent = try std.fmt.parseUnsigned(Id, self.data[53..93], 16),
// Both slices start at the keyword itself, so they include the "author " / "committer " prefix.
48 .author = self.data[authorOffset..authorNewline],
49 .committer = self.data[committerOffset..committerNewline],
// Everything after the newline that ends the committer line.
50 .message = self.data[committerNewline + 1 .. self.data.len],
// --- tree case ---
// NOTE(review): no deinit/errdefer for `t` is visible; if an error is returned part-way
// through the loop the list's memory may leak — confirm against the elided lines.
55 var t = Tree.init(alloc);
57 var offset: usize = 0;
// NOTE(review): `self.data.len - 1` is an unsigned subtraction; with empty data it
// underflows (a trap in safety-checked builds) — confirm empty trees cannot reach this.
59 while (offset < self.data.len - 1) {
// Each entry is laid out as: <permissions> ' ' <name> 0x00 <20-byte id>.
60 const spaceOffset = std.mem.indexOfScalarPos(u8, self.data, offset, ' ') orelse return error.InvalidTreeFormat;
61 const zeroOffset = std.mem.indexOfScalarPos(u8, self.data, spaceOffset, 0) orelse return error.InvalidTreeFormat;
64 .permissions = self.data[offset..spaceOffset],
65 .name = self.data[spaceOffset + 1 .. zeroOffset],
// The 20 bytes after the NUL are read as one big-endian integer.
// NOTE(review): a truncated final entry would make this slice out of bounds — no length check is visible.
66 .id = std.mem.readVarInt(Id, self.data[zeroOffset + 1 .. zeroOffset + 21], .big),
// Advance past the NUL byte and the 20 id bytes to the next entry.
69 offset = zeroOffset + 21;
// --- blob case --- the blob refers to the object's data directly; nothing is copied.
76 .b = Blob{ .data = self.data },
// --- tag case --- not supported.
80 return error.TagNotImplemented;
82 else => return error.UnknownGitObjectType,
85 // pub fn getCommit(self: *Object) Commit {}
86 // pub fn getBlob(self: *Object) Blob {}
// Inflates a zlib stream read from `r` and returns the decompressed bytes.
// The returned slice is allocated with `alloc`; callers in this file release it with alloc.free.
89 fn decompress(alloc: Alloc, r: Reader) ![]u8 {
// Decompressed output accumulates in a growable list.
90 var buffer = std.ArrayList(u8).init(alloc);
// NOTE(review): no errdefer/deinit for `buffer` is visible; if decompression fails the
// list's memory may leak — confirm against the elided lines.
92 try std.compress.zlib.decompress(r, buffer.writer().any());
// Shrink the list's whole allocation to exactly the number of bytes written and hand it to the caller.
94 return alloc.realloc(buffer.allocatedSlice(), buffer.items.len);
// Access to one git pack: an index file handle (`idxFile`), a pack data file handle
// (`pckFile`) and a map from object id to that object's offset in the pack data file.
// Methods also use `self.alloc` and `self.idxFile`; those declarations are not visible here.
97 const PackFile = struct {
// Handle to the pack data file; getObject/readObject/ofsDelta seek and read through it.
100 pckFile: std.fs.File,
// Object id -> offset into pckFile, filled by parseIndex. Insertion order is relied upon there.
// NOTE(review): offsets are stored as u32; presumably packs that need larger offsets are
// not supported — confirm.
101 objectOffsets: std.AutoArrayHashMap(Id, u32),
// Scans `objects/pack` under `dir` for a file ending in ".idx", opens it together with the
// matching pack data file, and loads the index via parseIndex.
// Returns an optional; presumably null when no index file was found (that return is not visible here).
103 pub fn open(alloc: Alloc, dir: std.fs.Dir) !?PackFile {
// File handles start out undefined and are only assigned once an index file is found.
106 .idxFile = undefined,
107 .pckFile = undefined,
108 .objectOffsets = std.AutoArrayHashMap(Id, u32).init(alloc),
// The directory is opened iterable so its entries can be listed; it is closed on every exit.
111 var packDir = try dir.openDir("objects/pack", .{ .iterate = true });
112 defer packDir.close();
114 var packFileFound = false;
116 var packIt = packDir.iterate();
117 while (try packIt.next()) |f| {
118 if (std.mem.endsWith(u8, f.name, ".idx")) {
119 const idxFilename = f.name;
// The pack data file name is built from the index name without its 4-character ".idx"
// suffix; the format string that supplies the new suffix is in a line not shown here.
120 var pckFilename = try std.BoundedArray(u8, std.fs.max_path_bytes).init(0);
122 pckFilename.writer(),
124 .{idxFilename[0 .. idxFilename.len - 4]},
// NOTE(review): if the second openFile or parseIndex fails, no visible errdefer closes the
// already-opened handle(s) or frees objectOffsets — confirm against the elided lines.
127 self.idxFile = try packDir.openFile(idxFilename, .{});
128 self.pckFile = try packDir.openFile(pckFilename.constSlice(), .{});
130 try self.parseIndex();
// NOTE(review): whether the loop stops after the first match is not visible; if it keeps
// going, a second ".idx" would overwrite the handles without closing the first pair.
132 packFileFound = true;
// Releases everything the PackFile holds: the id -> offset map and both file handles.
142 pub fn close(self: *PackFile) void {
143 self.objectOffsets.deinit();
144 self.idxFile.close();
145 self.pckFile.close();
// Reads the pack index file and fills `objectOffsets` with one (id, offset) pair per object.
// Pass 1 walks the 256-entry fanout table and inserts every id with a placeholder offset of 0;
// pass 2 reads the offset table and patches each entry by position.
// NOTE(review): no validation of the 8 header bytes is visible — confirm the index version is checked.
148 pub fn parseIndex(self: *PackFile) !void {
149 const idxReader = self.idxFile.reader().any();
151 var fanoutTable: [256]u32 = undefined;
// Fanout entry i is a big-endian u32 located at byte 8 + i * 4 (after an 8-byte header).
154 try self.idxFile.seekTo(8 + i * 4);
155 fanoutTable[i] = try idxReader.readVarInt(u32, .big, 4);
// Fanout entries are treated as running totals: the number of ids in bucket i is the
// difference to the previous entry (or the entry itself for bucket 0).
158 if (i > 0) fanoutTable[i] - fanoutTable[i - 1] else fanoutTable[i];
160 for (0..numObjects) |j| {
// The id table starts after the header (4 + 4) and the fanout table (4 * 256); ids are
// 20 bytes each, and this bucket's first id sits at index fanoutTable[i - 1].
162 4 + 4 + 4 * 256 + (j + if (i > 0) fanoutTable[i - 1] else 0) * 20;
163 try self.idxFile.seekTo(idOffset);
164 const id = try idxReader.readVarInt(Id, .big, 20);
// Insert with a placeholder offset; the real value is written in the second pass.
166 try self.objectOffsets.put(id, 0);
170 const numObjects = self.objectOffsets.keys().len;
171 for (0..numObjects) |i| {
// The offset table follows numObjects ids (20 bytes each) and numObjects 4-byte entries
// (presumably per-object checksums — confirm against the index format); entries are 4 bytes.
173 4 + 4 + 4 * 256 + numObjects * (20 + 4) + i * 4;
174 try self.idxFile.seekTo(offsetOffset);
175 const offset = try idxReader.readVarInt(u32, .big, 4);
// Patching by position assumes values() is in the same order the ids were inserted above.
// NOTE(review): a duplicate id in the file would collapse into one map entry and shift this
// positional pairing — presumably impossible for a well-formed index; confirm.
177 self.objectOffsets.values()[i] = offset;
// Decodes a variable-length size from `reader`: each byte contributes its low bits, least
// significant group first, and a set top bit (0x80) means another byte follows.
// With `ignoreTypeBits` the first byte contributes only its low 4 bits (its upper bits carry
// the object kind, see readObject), and later bytes are shifted by 4 + 7 * (counter - 1).
// Returns the decoded size and the number of bytes consumed (`bytelen`).
// NOTE(review): no upper bound on the number of continuation bytes is visible; malformed
// input could push the shift amount past 63 bits — confirm.
181 fn getSize(reader: Reader, ignoreTypeBits: bool) !struct { size: u64, bytelen: u64 } {
185 const byte = try reader.readByte();
// First byte: 4 payload bits when the kind bits are skipped, otherwise 7.
188 if (ignoreTypeBits) {
189 const bits: u4 = @truncate(byte);
192 const bits: u7 = @truncate(byte);
// Following bytes: always 7 payload bits, placed above the bits already decoded.
196 if (ignoreTypeBits) {
197 const bits: u7 = @truncate(byte);
198 size += @as(u64, bits) << (7 * (counter - 1) + 4);
200 const bits: u7 = @truncate(byte);
201 size += @as(u64, bits) << (7 * (counter));
// A clear top bit marks the last byte of the encoding.
205 if (byte & 0b10000000 == 0) {
// `counter` is the zero-based index of the last byte read, so the encoding was counter + 1 bytes long.
212 const nBytes = counter + 1;
// Decodes the variable-length backwards offset of an offset-delta object from `reader`.
// Each byte contributes its low 7 bits and a set top bit (0x80) means another byte follows;
// how earlier bits are shifted between bytes is in lines not shown here.
// Returns the decoded offset and the number of bytes consumed (`bytelen`).
220 fn getOffset(reader: Reader) !struct { offset: u64, bytelen: u64 } {
224 const byte = try reader.readByte();
226 const bits: u7 = @truncate(byte);
228 offset += @as(u64, bits);
// A clear top bit marks the last byte of the encoding.
230 if (byte & 0b10000000 == 0) {
237 const nBytes = counter + 1;
// For every byte after the first, add 2^(7 * i). Presumably this is the bias git's offset
// encoding applies per continuation byte — confirm against the pack format documentation.
240 for (1..nBytes) |i| {
241 offset += std.math.pow(u64, 2, 7 * i);
// Reconstructs an object by applying the delta instructions in `deltData` to `baseData`.
// The delta starts with two variable-length sizes (base size, result size) followed by a
// stream of instructions: "copy a range from the base" or "insert literal bytes".
// Returns a newly allocated buffer of the result size; the caller owns it.
250 fn applyDelta(alloc: Alloc, baseData: []const u8, deltData: []const u8) ![]u8 {
251 var fbs = std.io.fixedBufferStream(deltData);
252 const deltDataReader = fbs.reader().any();
// NOTE(review): baseObjectSize.size is not compared with baseData.len in the visible lines — confirm.
253 const baseObjectSize = try getSize(deltDataReader, false);
254 const resultObjectSize = try getSize(deltDataReader, false);
// Instructions begin right after the two size headers; from here on deltData is indexed directly.
255 const deltaDataOffset = baseObjectSize.bytelen + resultObjectSize.bytelen;
257 const result = try alloc.alloc(u8, resultObjectSize.size);
// Write position in `result`.
258 var resultCounter: u64 = 0;
// Read position within the instruction stream, relative to deltaDataOffset.
260 var counter: u64 = 0;
262 const b = deltData[deltaDataOffset + counter];
// Top bit set: copy-from-base instruction. The low 7 bits flag which offset/size bytes follow.
264 if (b & 0b10000000 != 0) {
265 var dataOffset: u64 = 0;
266 var dataSize: u64 = 0;
// Bits 0..3 each flag one byte of the little-endian base offset. `bitsSet` (declared in a
// line not shown) appears to count the operand bytes consumed so far. @min(3, i) leaves the
// value unchanged for i in 0..4; presumably it only narrows the shift-amount type.
268 for (0..4) |i| { // offset bits
269 if (b & (@as(u64, 1) << @min(3, i)) != 0) {
270 dataOffset += @as(u64, deltData[deltaDataOffset + counter + 1 + bitsSet]) << @min(3 * 8, i * 8);
// Bits 4..6 each flag one byte of the little-endian copy length.
// NOTE(review): git's delta format treats an encoded copy size of 0 as 0x10000; no such
// handling is visible here — confirm against the elided lines.
274 for (4..7) |i| { // size bits
275 if (b & (@as(u64, 1) << @min(6, i)) != 0) {
276 dataSize += @as(u64, deltData[deltaDataOffset + counter + 1 + bitsSet]) << @min(6 * 8, (i - 4) * 8);
// Copy the selected base range to the current write position.
// NOTE(review): the slice bounds come straight from the delta; a malformed delta traps on
// the bounds check rather than returning an error.
285 std.mem.copyForwards(
287 result[resultCounter..result.len],
288 baseData[dataOffset .. dataOffset + dataSize],
291 resultCounter += dataSize;
// Top bit clear: insert instruction. The low 7 bits give the number of literal bytes that follow.
293 const dataSize: u7 = @truncate(b);
295 std.mem.copyForwards(
297 result[resultCounter..result.len],
298 deltData[deltaDataOffset + counter + 1 .. deltaDataOffset + counter + 1 + dataSize],
301 resultCounter += dataSize;
// Stop once the read position has reached the end of the delta data.
306 if (deltaDataOffset + counter >= deltData.len)
// Resolves an offset-delta object: reads the base object located `offset` bytes before the
// current pack file position, then inflates the delta data at the current position and
// applies it to the base. The result keeps the base object's kind; its data is newly
// allocated with self.alloc and owned by the caller.
// Mutually recursive with readObject (the base may itself be a delta), which is presumably
// why the error set is spelled out as anyerror.
313 fn ofsDelta(self: *PackFile, offset: i64) anyerror!Object {
314 const pckReader = self.pckFile.reader().any();
// Remember where the compressed delta data starts; reading the base moves the file position.
316 const pos = try self.pckFile.getPos();
318 try self.pckFile.seekBy(-offset);
319 const baseObject = try self.readObject(pckReader);
320 defer self.alloc.free(baseObject.data);
// Return to the delta data and inflate it.
322 try self.pckFile.seekTo(pos);
323 const deltaData = try decompress(self.alloc, pckReader);
324 defer self.alloc.free(deltaData);
326 const objectData = try applyDelta(self.alloc, baseObject.data, deltaData);
327 return Object.init(baseObject.kind, objectData);
// Reads one object starting at the current pack file position and returns it with its
// data inflated (and delta-resolved for kind 6). The returned data is allocated with self.alloc.
// Assumes `reader` reads from self.pckFile, because the file position is adjusted directly.
330 fn readObject(self: *PackFile, reader: Reader) anyerror!Object {
// The object kind is held in bits 4..6 of the first header byte.
331 const firstByte = try reader.readByte();
332 const objectKind: u3 = @truncate(firstByte >> 4);
// Step back one byte so getSize can decode the size starting from the same header byte.
333 try self.pckFile.seekBy(-1);
// NOTE(review): objectSize.size is not checked against the inflated length in the visible lines.
334 const objectSize = try getSize(reader, true);
// Kind 6 is handled as an offset delta: its base lives earlier in the same pack file.
// NOTE(review): no branch for kind 7 is visible; such an object would fall through to the
// plain decompress path below — confirm against the elided lines.
336 if (objectKind == 6) {
337 const offset = try getOffset(reader);
// The encoded offset is extended by the header bytes just consumed (size + offset encoding),
// so that seeking back from the current position lands on the base object's first byte.
339 return try self.ofsDelta(
340 @intCast(offset.offset + objectSize.bytelen + offset.bytelen),
343 const objectData = try decompress(self.alloc, reader);
344 return Object.init(objectKind, objectData);
// Looks up `id` in the index map and, when present, seeks to its offset in the pack file
// and reads the object. Presumably returns null for an unknown id (that path is not visible
// here). Callers in this file free the returned object's `.data` with the same allocator.
348 pub fn getObject(self: *PackFile, id: Id) !?Object {
349 if (self.objectOffsets.get(id)) |offset| {
350 const pckReader = self.pckFile.reader().any();
351 try self.pckFile.seekTo(offset);
353 return try self.readObject(pckReader);
// A handle on a git directory. Methods use `self.dir`, `self.alloc` and the optional
// `self.packfile`; the field declarations are not visible in this excerpt.
359 const Repo = struct {
// Opens the git directory at `path` (resolved against the current working directory) and
// tries to open a pack file inside it.
// NOTE(review): if PackFile.open fails, no visible errdefer closes `dir` — confirm.
364 pub fn open(alloc: Alloc, path: []const u8) !Repo {
365 const dir = try std.fs.cwd().openDir(path, .{});
367 const packfile = try PackFile.open(alloc, dir);
372 .packfile = packfile,
// Closes the pack file if one was opened; other cleanup is in lines not shown here.
376 pub fn close(self: *Repo) void {
378 if (self.packfile != null) {
379 self.packfile.?.close();
// Returns the object id that HEAD currently resolves to.
// NOTE(review): this assumes HEAD holds a 5-byte prefix (presumably "ref: "), a path, and one
// trailing byte (presumably a newline). A HEAD that contains an id directly, or a ref that
// is not stored as its own file, would not resolve — confirm which layouts must be supported.
383 pub fn getHead(self: *Repo) !Id {
385 const head = try self.dir.readFileAlloc(self.alloc, "HEAD", 1024);
386 defer self.alloc.free(head);
388 // read file pointed at by HEAD
// Drops the first 5 bytes and the last byte; a HEAD shorter than 6 bytes makes this slice invalid.
389 const headPath = head[5 .. head.len - 1];
// The buffer holds exactly 40 bytes, so only the 40 hex digits are read and anything after them is ignored.
390 var idBuffer: [40]u8 = undefined;
391 const idStr = try self.dir.readFile(headPath, &idBuffer);
393 // parse id from file
394 return try std.fmt.parseUnsigned(u160, idStr, 16);
// Fetches an object by id from the pack file, if there is one. What happens when no pack
// file is open is in lines not shown here.
397 pub fn getObject(self: *Repo, id: Id) !?Object {
398 if (self.packfile) |*packfile| {
399 return packfile.getObject(id);
// Test body (its `test` header is not visible here): opens a repository and prints HEAD's id.
// Depends on a git checkout at "../imgui/.git" relative to the working directory; the
// visible lines only print and make no assertions.
406 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
409 const head = try repo.getHead();
411 std.debug.print("HEAD: {}\n", .{head});
// Test body (its `test` header is not visible here): prints how many keys and values the
// pack index map holds. Depends on a git checkout at "../imgui/.git".
415 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
418 if (repo.packfile) |packfile| {
419 std.debug.print("{}\n", .{packfile.objectOffsets.keys().len});
420 std.debug.print("{}\n", .{packfile.objectOffsets.values().len});
// Test body (its `test` header is not visible here): reads the object HEAD points at and
// prints its kind and raw data. Depends on a git checkout at "../imgui/.git".
425 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
428 const head = try repo.getHead();
430 if (try repo.getObject(head)) |o| {
// The object's data buffer is owned by the caller and must be freed with the same allocator.
431 defer std.testing.allocator.free(o.data);
433 std.debug.print("object({}): {s}\n", .{ o.kind, o.data });
// Reads the object HEAD points at, parses it, and prints the commit's fields.
// Depends on a git checkout at "../imgui/.git"; the visible lines make no assertions.
437 test "parse commit" {
438 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
441 const head = try repo.getHead();
443 if (try repo.getObject(head)) |o| {
// The parsed commit's string fields are slices into o.data, so it is only used inside this scope.
444 defer std.testing.allocator.free(o.data);
446 switch (try o.parse(std.testing.allocator)) {
448 std.debug.print("commit:\n tree: {x}\n parent: {x}\n author: {s}\n committer: {s}\n message: {s}\n", .{ c.tree, c.parent, c.author, c.committer, c.message });
// Test body (its `test` header is not visible here): fetches one object by a hard-coded id
// and frees it. The id is specific to the "../imgui/.git" checkout this test depends on.
456 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
459 if (try repo.getObject(0xceb2b2c62d6f8f3686dcacecd5be931839b02c77)) |o| {
460 defer std.testing.allocator.free(o.data);
462 // std.debug.print("tree({}): {any}\n", .{ o.kind, o.data });
// Test body (its `test` header is not visible here): fetches an object by a hard-coded id,
// parses it, and prints every tree entry. Depends on a git checkout at "../imgui/.git".
467 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
470 if (try repo.getObject(0xceb2b2c62d6f8f3686dcacecd5be931839b02c77)) |o| {
471 defer std.testing.allocator.free(o.data);
// NOTE(review): the parsed Tree is a list allocated with std.testing.allocator; its deinit is
// not visible here, and the testing allocator reports a leak if it is missing — confirm.
473 switch (try o.parse(std.testing.allocator)) {
476 for (t.items) |treeEntry| {
477 std.debug.print("{s} {s} {x}\n", .{ treeEntry.permissions, treeEntry.name, treeEntry.id });
// Prints commits starting from HEAD. `id` is declared in lines not shown here; presumably it
// starts at `head` and is advanced to each commit's parent — confirm against the elided loop.
// Depends on a git checkout at "../imgui/.git"; the visible lines make no assertions.
485 test "list commits" {
486 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
489 const head = try repo.getHead();
494 if (try repo.getObject(id)) |o| {
495 defer std.testing.allocator.free(o.data);
497 switch (try o.parse(std.testing.allocator)) {
499 std.debug.print("commit {x}:\n tree: {x}\n parent: {x}\n author: {s}\n committer: {s}\n message: {s}\n", .{ id, c.tree, c.parent, c.author, c.committer, c.message });
// Test body (its `test` header is not visible here): parses a tree by a hard-coded id,
// fetches the object behind every entry, and prints either the start of its data or just
// the entry name. Depends on a git checkout at "../imgui/.git".
509 var repo = try Repo.open(std.testing.allocator, "../imgui/.git");
512 if (try repo.getObject(0xceb2b2c62d6f8f3686dcacecd5be931839b02c77)) |o| {
513 defer std.testing.allocator.free(o.data);
515 switch (try o.parse(std.testing.allocator)) {
518 for (t.items) |treeEntry| {
519 if (try repo.getObject(treeEntry.id)) |bo| {
520 defer std.testing.allocator.free(bo.data);
// A 6-character permissions string presumably marks a regular file (directories use a
// shorter mode string) — confirm.
522 if (treeEntry.permissions.len == 6) {
// NOTE(review): slicing [0..50] is out of bounds for an object shorter than 50 bytes.
523 std.debug.print("{s}: {s}\n", .{ treeEntry.name, bo.data[0..50] });
525 std.debug.print("[{s}]\n", .{treeEntry.name});