#include <assert.h>
#include <errno.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/wait.h>
#include <unistd.h>

#include "cache.h"
#include "refs.h"
#include "tag.h"
#include "commit.h"
#include "tree.h"
#include "blob.h"
#include "diff.h"
10
/*
 * Debug verbosity. Any non-zero value enables the trace printf()s in this
 * file; a value greater than 1 additionally prints every step of the line
 * walk in fill_line_map().
 */
#define DEBUG 0

/*
 * blame_lines[i] is the commit currently blamed for line i of the file being
 * annotated, and num_blame_lines is the number of entries. Both are set up
 * in main() and updated by process_commits().
 */
struct commit** blame_lines;
int num_blame_lines;
15
/*
 * Per-commit bookkeeping, hung off commit->object.util by fill_util_info().
 */
struct util_info
{
	/*
	 * One entry per line of this commit's blob. main() seeds the starting
	 * commit with the identity mapping, fill_line_map() uses -1 for "no
	 * mapping", and process_commits() uses the value as an index into
	 * blame_lines. NULL until allocated or copied.
	 */
	int *line_map;

	/* Number of entries in line_map; -1 until the lines have been counted. */
	int num_lines;

	/* SHA-1 of the blob for the blamed path (not of the commit). */
	unsigned char sha1[20];

	/* Blob contents, loaded lazily by get_blob(); NULL until then. */
	char *buf;

	/* Length of buf in bytes. */
	unsigned long size;
};
25
/*
 * One hunk of a "diff -u0" run. Offsets are stored zero-based by
 * get_patch(); a length omitted from the hunk header is recorded as 1.
 */
struct chunk
{
	/* "---" side: first line and number of lines. */
	int off1;
	int len1;

	/* "+++" side: first line and number of lines. */
	int off2;
	int len2;
};
31
/*
 * The list of hunks between two blobs, as produced by get_patch() and
 * released by free_patch().
 */
struct patch
{
	struct chunk *chunks;	/* array of `num` hunks; NULL when num is 0 */
	int num;		/* number of entries in `chunks` */
};
37
/* Defined further down; declared here because get_patch() calls it first. */
static void get_blob(struct commit* commit);

/* Statistics, printed by main() when DEBUG is non-zero. */
int num_get_patch = 0;	/* incremented by get_patch() each time it runs diff */
int num_commits = 0;	/* incremented by process_commits() for every commit popped */
42
43struct patch* get_patch(struct commit* commit, struct commit* other)
44{
45 struct patch* ret = xmalloc(sizeof(struct patch));
46 ret->chunks = NULL;
47 ret->num = 0;
48
49 struct util_info* info_c = (struct util_info*) commit->object.util;
50 struct util_info* info_o = (struct util_info*) other->object.util;
51
52 if(!memcmp(info_c->sha1, info_o->sha1, 20))
53 return ret;
54
55 get_blob(commit);
56 get_blob(other);
57
58 FILE* fout = fopen("/tmp/git-blame-tmp1", "w");
59 if(!fout)
60 die("fopen tmp1 failed: %s", strerror(errno));
61
62 if(fwrite(info_c->buf, info_c->size, 1, fout) != 1)
63 die("fwrite 1 failed: %s", strerror(errno));
64 fclose(fout);
65
66 fout = fopen("/tmp/git-blame-tmp2", "w");
67 if(!fout)
68 die("fopen tmp2 failed: %s", strerror(errno));
69
70 if(fwrite(info_o->buf, info_o->size, 1, fout) != 1)
71 die("fwrite 2 failed: %s", strerror(errno));
72 fclose(fout);
73
74 FILE* fin = popen("diff -u0 /tmp/git-blame-tmp1 /tmp/git-blame-tmp2", "r");
75 if(!fin)
76 die("popen failed: %s", strerror(errno));
77
78 char buf[1024];
79 while(fgets(buf, sizeof(buf), fin)) {
80 if(buf[0] != '@' || buf[1] != '@')
81 continue;
82
83 if(DEBUG)
84 printf("chunk line: %s", buf);
85 ret->num++;
86 ret->chunks = xrealloc(ret->chunks, sizeof(struct chunk)*ret->num);
87 struct chunk* chunk = &ret->chunks[ret->num-1];
88
89 assert(!strncmp(buf, "@@ -", 4));
90
91 char* start = buf+4;
92 char* sp = index(start, ' ');
93 *sp = '\0';
94 if(index(start, ',')) {
95 int ret = sscanf(start, "%d,%d", &chunk->off1, &chunk->len1);
96 assert(ret == 2);
97 } else {
98 int ret = sscanf(start, "%d", &chunk->off1);
99 assert(ret == 1);
100 chunk->len1 = 1;
101 }
102 *sp = ' ';
103
104 start = sp+1;
105 sp = index(start, ' ');
106 *sp = '\0';
107 if(index(start, ',')) {
108 int ret = sscanf(start, "%d,%d", &chunk->off2, &chunk->len2);
109 assert(ret == 2);
110 } else {
111 int ret = sscanf(start, "%d", &chunk->off2);
112 assert(ret == 1);
113 chunk->len2 = 1;
114 }
115 *sp = ' ';
116
117 if(chunk->off1 > 0)
118 chunk->off1 -= 1;
119 if(chunk->off2 > 0)
120 chunk->off2 -= 1;
121
122 assert(chunk->off1 >= 0);
123 assert(chunk->off2 >= 0);
124 }
125 fclose(fin);
126
127 num_get_patch++;
128 return ret;
129}
130
131void free_patch(struct patch* p)
132{
133 free(p->chunks);
134 free(p);
135}
136
static int get_blob_sha1_internal(unsigned char *sha1, const char *base, int baselen,
				  const char *pathname, unsigned mode, int stage);

/* Scratch result shared between get_blob_sha1() and its tree-walk callback. */
static unsigned char blob_sha1[20];

/*
 * Look up the SHA-1 of `pathname` inside tree `t`.
 *
 * The scratch buffer is cleared, read_tree_recursive() is run with
 * `pathname` as the only pathspec entry and get_blob_sha1_internal() as the
 * callback, and whatever the callback stored is copied to `sha1`.
 *
 * Returns 0 on success, or -1 (leaving `sha1` untouched) when the scratch
 * buffer is still all zero afterwards, i.e. the callback stored nothing.
 */
static int get_blob_sha1(struct tree* t, const char* pathname, unsigned char* sha1)
{
	static const unsigned char all_zero[20];
	const char *pathspec[2] = { pathname, NULL };

	memset(blob_sha1, 0, sizeof(blob_sha1));
	read_tree_recursive(t, "", 0, 0, pathspec, get_blob_sha1_internal);

	/* Still all zero: nothing was recorded for this path. */
	if (!memcmp(blob_sha1, all_zero, 20))
		return -1;

	memcpy(sha1, blob_sha1, 20);
	return 0;
}
162
163static int get_blob_sha1_internal(unsigned char *sha1, const char *base, int baselen,
164 const char *pathname, unsigned mode, int stage)
165{
166// printf("Got blob: %s base: '%s' baselen: %d pathname: '%s' mode: %o stage: %d\n",
167// sha1_to_hex(sha1), base, baselen, pathname, mode, stage);
168
169 if(S_ISDIR(mode))
170 return READ_TREE_RECURSIVE;
171
172 memcpy(blob_sha1, sha1, 20);
173 return -1;
174}
175
176static void get_blob(struct commit* commit)
177{
178 struct util_info* info = commit->object.util;
179 char type[20];
180
181 if(info->buf)
182 return;
183
184 info->buf = read_sha1_file(info->sha1, type, &info->size);
185 assert(!strcmp(type, "blob"));
186}
187
188void print_patch(struct patch* p)
189{
190 printf("Num chunks: %d\n", p->num);
191 int i;
192 for(i = 0; i < p->num; i++) {
193 printf("%d,%d %d,%d\n", p->chunks[i].off1, p->chunks[i].len1, p->chunks[i].off2, p->chunks[i].len2);
194 }
195}
196
197
198// p is a patch from commit to other.
199void fill_line_map(struct commit* commit, struct commit* other, struct patch* p)
200{
201 int num_lines = ((struct util_info*) commit->object.util)->num_lines;
202 int* line_map = ((struct util_info*) commit->object.util)->line_map;
203 int num_lines2 = ((struct util_info*) other->object.util)->num_lines;
204 int* line_map2 = ((struct util_info*) other->object.util)->line_map;
205 int cur_chunk = 0;
206 int i1, i2;
207
208 if(p->num && DEBUG)
209 print_patch(p);
210
211 for(i1 = 0; i1 < num_lines; i1++)
212 line_map[i1] = -1;
213
214 if(DEBUG)
215 printf("num lines 1: %d num lines 2: %d\n", num_lines, num_lines2);
216
217 for(i1 = 0, i2 = 0; i1 < num_lines; i1++, i2++) {
218 if(DEBUG > 1)
219 printf("%d %d\n", i1, i2);
220
221 if(i2 >= num_lines2)
222 break;
223
224 line_map[i1] = line_map2[i2];
225
226 struct chunk* chunk = NULL;
227 if(cur_chunk < p->num)
228 chunk = &p->chunks[cur_chunk];
229
230 if(chunk && chunk->off1 == i1) {
231 i2 = chunk->off2;
232
233 if(chunk->len1 > 0)
234 i1 += chunk->len1-1;
235 if(chunk->len2 > 0)
236 i2 += chunk->len2-1;
237 cur_chunk++;
238 }
239 }
240}
241
242int map_line(struct commit* commit, int line)
243{
244 struct util_info* info = commit->object.util;
245 assert(line >= 0 && line < info->num_lines);
246 return info->line_map[line];
247}
248
249int fill_util_info(struct commit* commit, const char* path)
250{
251 if(commit->object.util)
252 return 0;
253
254 struct util_info* util = xmalloc(sizeof(struct util_info));
255 util->buf = NULL;
256 util->size = 0;
257 util->num_lines = -1;
258 util->line_map = NULL;
259
260 commit->object.util = util;
261
262 if(get_blob_sha1(commit->tree, path, util->sha1))
263 return -1;
264
265 return 0;
266}
267
268void alloc_line_map(struct commit* commit)
269{
270 struct util_info* util = commit->object.util;
271
272 if(util->line_map)
273 return;
274
275 get_blob(commit);
276
277 int i;
278 util->num_lines = 0;
279 for(i = 0; i < util->size; i++) {
280 if(util->buf[i] == '\n')
281 util->num_lines++;
282 }
283 util->line_map = xmalloc(sizeof(int)*util->num_lines);
284}
285
286void copy_line_map(struct commit* dst, struct commit* src)
287{
288 struct util_info* u_dst = dst->object.util;
289 struct util_info* u_src = src->object.util;
290
291 u_dst->line_map = u_src->line_map;
292 u_dst->num_lines = u_src->num_lines;
293 u_dst->buf = u_src->buf;
294 u_dst->size = u_src->size;
295}
296
297void process_commits(struct commit_list* list, const char* path)
298{
299 int i;
300
301 while(list) {
302 struct commit* commit = pop_commit(&list);
303 struct commit_list* parents;
304 struct util_info* info;
305
306 info = commit->object.util;
307 num_commits++;
308 if(DEBUG)
309 printf("\nProcessing commit: %d %s\n", num_commits, sha1_to_hex(commit->object.sha1));
310 for(parents = commit->parents;
311 parents != NULL; parents = parents->next) {
312 struct commit* parent = parents->item;
313
314 if(parse_commit(parent) < 0)
315 die("parse_commit error");
316
317 if(DEBUG)
318 printf("parent: %s\n", sha1_to_hex(parent->object.sha1));
319
320 if(fill_util_info(parent, path))
321 continue;
322
323 // Temporarily assign everything to the parent.
324 int num_blame = 0;
325 for(i = 0; i < num_blame_lines; i++) {
326 if(blame_lines[i] == commit) {
327 num_blame++;
328 blame_lines[i] = parent;
329 }
330 }
331
332 if(num_blame == 0)
333 continue;
334
335 struct patch* patch = get_patch(parent, commit);
336 if(patch->num == 0) {
337 copy_line_map(parent, commit);
338 } else {
339 alloc_line_map(parent);
340 fill_line_map(parent, commit, patch);
341 }
342
343 for(i = 0; i < patch->num; i++) {
344 int l;
345 for(l = 0; l < patch->chunks[i].len2; l++) {
346 int mapped_line = map_line(commit, patch->chunks[i].off2 + l);
347 if(mapped_line != -1 && blame_lines[mapped_line] == parent)
348 blame_lines[mapped_line] = commit;
349 }
350 }
351 free_patch(patch);
352 }
353 }
354}
355
356#define SEEN 1
357struct commit_list* get_commit_list(struct commit* commit, const char* pathname)
358{
359 struct commit_list* ret = NULL;
360 struct commit_list* process = NULL;
361 unsigned char sha1[20];
362
363 commit_list_insert(commit, &process);
364
365 while(process) {
366 struct commit* com = pop_commit(&process);
367 if(com->object.flags & SEEN)
368 continue;
369
370 com->object.flags |= SEEN;
371 commit_list_insert(com, &ret);
372 struct commit_list* parents;
373
374 parse_commit(com);
375
376 for(parents = com->parents;
377 parents != NULL; parents = parents->next) {
378 struct commit* parent = parents->item;
379
380 parse_commit(parent);
381
382 if(!get_blob_sha1(parent->tree, pathname, sha1))
383 commit_list_insert(parent, &process);
384 }
385 }
386
387 return ret;
388}
389
390int main(int argc, const char **argv)
391{
392 unsigned char sha1[20];
393 struct commit *commit;
394 const char* filename;
395 int i;
396
397 setup_git_directory();
398
399 if (argc != 3)
400 die("Usage: blame commit-ish file");
401
402 if (get_sha1(argv[1], sha1))
403 die("get_sha1 failed");
404
405 commit = lookup_commit_reference(sha1);
406
407 filename = argv[2];
408
409 struct commit_list* list = get_commit_list(commit, filename);
410 sort_in_topological_order(&list, 1);
411
412 if(fill_util_info(commit, filename)) {
413 printf("%s not found in %s\n", filename, argv[1]);
414 return 0;
415 }
416 alloc_line_map(commit);
417
418 struct util_info* util = commit->object.util;
419 num_blame_lines = util->num_lines;
420 blame_lines = xmalloc(sizeof(struct commit*)*num_blame_lines);
421
422
423 for(i = 0; i < num_blame_lines; i++) {
424 blame_lines[i] = commit;
425
426 ((struct util_info*) commit->object.util)->line_map[i] = i;
427 }
428
429 process_commits(list, filename);
430
431 for(i = 0; i < num_blame_lines; i++) {
432 printf("%d %s\n", i+1-1, sha1_to_hex(blame_lines[i]->object.sha1));
433// printf("%d %s\n", i+1-1, find_unique_abbrev(blame_lines[i]->object.sha1, 6));
434 }
435
436 if(DEBUG) {
437 printf("num get patch: %d\n", num_get_patch);
438 printf("num commits: %d\n", num_commits);
439 }
440
441 return 0;
442}