mirror of
https://github.com/git/git.git
synced 2024-11-18 15:04:49 +01:00
fc675b8cd5
Here is an updated version of git-blame. The main changes compared to the first version are: * Use the new revision.h interface to do the revision walking * Do the right thing in a lot more cases than before. In particular, parallel development tracks are hopefully handled sanely. * Lots of clean-up. It still won't follow file renames though. There are still some differences in the output between git-blame and git-annotate. For example, in 'Makefile' git-blame assigns lines 354-358 to 455a7f3275 and git-annotate assigns the same lines to 79a9d8ea0d. I think git-blame is correct in this case. This pattern occurs in several other places; git-annotate seems to sometimes assign lines to merge commits when the lines actually changed in some other commit which precedes the merge. [jc: I have conned Ryan into doing test cases, so that it would help development and fixes on both implementations. Let the battle begin! ;-) ] Signed-off-by: Fredrik Kuivinen <freku045@student.liu.se> Signed-off-by: Junio C Hamano <junkio@cox.net>
562 lines
12 KiB
C
562 lines
12 KiB
C
/*
|
|
* Copyright (C) 2006, Fredrik Kuivinen <freku045@student.liu.se>
|
|
*/
|
|
|
|
#include <assert.h>
|
|
#include <time.h>
|
|
#include <sys/time.h>
|
|
|
|
#include "cache.h"
|
|
#include "refs.h"
|
|
#include "tag.h"
|
|
#include "commit.h"
|
|
#include "tree.h"
|
|
#include "blob.h"
|
|
#include "diff.h"
|
|
#include "revision.h"
|
|
|
|
/*
 * Tracing switch: any non-zero value enables the diagnostic printf()s
 * in this file, values above 1 enable the most verbose ones.
 */
#define DEBUG 0

/*
 * blame_lines[i] is the commit blamed for line i of the file as it
 * appears in the first commit handed to process_commits(); an entry
 * stays NULL until some commit has been blamed for that line.
 * num_blame_lines is the number of entries in blame_lines.
 */
struct commit **blame_lines;
int num_blame_lines;
|
|
|
|
/*
 * Per-commit bookkeeping, stored in commit->object.util.
 */
struct util_info {
	/*
	 * line_map[i] is the index into blame_lines that line i of this
	 * commit's blob corresponds to, or -1 when no correspondence is
	 * known.  NULL until alloc_line_map() has run.
	 */
	int *line_map;

	/* blob sha, not commit! */
	unsigned char sha1[20];

	/* Blob contents; NULL until get_blob() has loaded them. */
	char *buf;

	/* Number of bytes in buf. */
	unsigned long size;

	/* Number of lines in buf; -1 until alloc_line_map() has run. */
	int num_lines;
};
|
|
|
|
/*
 * One hunk of a "diff -u0" between two blobs.  get_patch() stores the
 * offsets zero-based.
 */
struct chunk {
	/* Start and length of the hunk on the "---" side. */
	int off1;
	int len1;

	/* Start and length of the hunk on the "+++" side. */
	int off2;
	int len2;
};
|
|
|
|
/*
 * The list of hunks produced by one diff run, in the order diff
 * printed them.
 */
struct patch {
	/* Array of num hunks; NULL while num is 0. */
	struct chunk *chunks;

	/* Number of elements in chunks. */
	int num;
};
|
|
|
|
/* Defined further down; needed by get_patch(). */
static void get_blob(struct commit *commit);

/*
 * Counters that are only reported in the DEBUG statistics at the end
 * of main(): number of get_patch() calls, number of commits processed
 * and the accumulated time (in microseconds) spent inside get_patch().
 */
static int num_get_patch;
static int num_commits;
static int patch_time;

/* Size of the buffers that receive temporary file names. */
#define TEMPFILE_PATH_LEN 60
|
|
static struct patch *get_patch(struct commit *commit, struct commit *other)
|
|
{
|
|
struct patch *ret;
|
|
struct util_info *info_c = (struct util_info *)commit->object.util;
|
|
struct util_info *info_o = (struct util_info *)other->object.util;
|
|
char tmp_path1[TEMPFILE_PATH_LEN], tmp_path2[TEMPFILE_PATH_LEN];
|
|
char diff_cmd[TEMPFILE_PATH_LEN*2 + 20];
|
|
struct timeval tv_start, tv_end;
|
|
int fd;
|
|
FILE *fin;
|
|
char buf[1024];
|
|
|
|
ret = xmalloc(sizeof(struct patch));
|
|
ret->chunks = NULL;
|
|
ret->num = 0;
|
|
|
|
get_blob(commit);
|
|
get_blob(other);
|
|
|
|
gettimeofday(&tv_start, NULL);
|
|
|
|
fd = git_mkstemp(tmp_path1, TEMPFILE_PATH_LEN, "git-blame-XXXXXX");
|
|
if (fd < 0)
|
|
die("unable to create temp-file: %s", strerror(errno));
|
|
|
|
if (xwrite(fd, info_c->buf, info_c->size) != info_c->size)
|
|
die("write failed: %s", strerror(errno));
|
|
close(fd);
|
|
|
|
fd = git_mkstemp(tmp_path2, TEMPFILE_PATH_LEN, "git-blame-XXXXXX");
|
|
if (fd < 0)
|
|
die("unable to create temp-file: %s", strerror(errno));
|
|
|
|
if (xwrite(fd, info_o->buf, info_o->size) != info_o->size)
|
|
die("write failed: %s", strerror(errno));
|
|
close(fd);
|
|
|
|
sprintf(diff_cmd, "diff -u0 %s %s", tmp_path1, tmp_path2);
|
|
fin = popen(diff_cmd, "r");
|
|
if (!fin)
|
|
die("popen failed: %s", strerror(errno));
|
|
|
|
while (fgets(buf, sizeof(buf), fin)) {
|
|
struct chunk *chunk;
|
|
char *start, *sp;
|
|
|
|
if (buf[0] != '@' || buf[1] != '@')
|
|
continue;
|
|
|
|
if (DEBUG)
|
|
printf("chunk line: %s", buf);
|
|
ret->num++;
|
|
ret->chunks = xrealloc(ret->chunks,
|
|
sizeof(struct chunk) * ret->num);
|
|
chunk = &ret->chunks[ret->num - 1];
|
|
|
|
assert(!strncmp(buf, "@@ -", 4));
|
|
|
|
start = buf + 4;
|
|
sp = index(start, ' ');
|
|
*sp = '\0';
|
|
if (index(start, ',')) {
|
|
int ret =
|
|
sscanf(start, "%d,%d", &chunk->off1, &chunk->len1);
|
|
assert(ret == 2);
|
|
} else {
|
|
int ret = sscanf(start, "%d", &chunk->off1);
|
|
assert(ret == 1);
|
|
chunk->len1 = 1;
|
|
}
|
|
*sp = ' ';
|
|
|
|
start = sp + 1;
|
|
sp = index(start, ' ');
|
|
*sp = '\0';
|
|
if (index(start, ',')) {
|
|
int ret =
|
|
sscanf(start, "%d,%d", &chunk->off2, &chunk->len2);
|
|
assert(ret == 2);
|
|
} else {
|
|
int ret = sscanf(start, "%d", &chunk->off2);
|
|
assert(ret == 1);
|
|
chunk->len2 = 1;
|
|
}
|
|
*sp = ' ';
|
|
|
|
if (chunk->len1 == 0)
|
|
chunk->off1++;
|
|
if (chunk->len2 == 0)
|
|
chunk->off2++;
|
|
|
|
if (chunk->off1 > 0)
|
|
chunk->off1--;
|
|
if (chunk->off2 > 0)
|
|
chunk->off2--;
|
|
|
|
assert(chunk->off1 >= 0);
|
|
assert(chunk->off2 >= 0);
|
|
}
|
|
pclose(fin);
|
|
unlink(tmp_path1);
|
|
unlink(tmp_path2);
|
|
|
|
gettimeofday(&tv_end, NULL);
|
|
patch_time += 1000000 * (tv_end.tv_sec - tv_start.tv_sec) +
|
|
tv_end.tv_usec - tv_start.tv_usec;
|
|
|
|
num_get_patch++;
|
|
return ret;
|
|
}
|
|
|
|
static void free_patch(struct patch *p)
|
|
{
|
|
free(p->chunks);
|
|
free(p);
|
|
}
|
|
|
|
static int get_blob_sha1_internal(unsigned char *sha1, const char *base,
				  int baselen, const char *pathname,
				  unsigned mode, int stage);

/*
 * Scratch buffer through which get_blob_sha1_internal() hands the blob
 * name it found back to get_blob_sha1().
 */
static unsigned char blob_sha1[20];

/*
 * Look up pathname in tree t by walking it with read_tree_recursive()
 * and get_blob_sha1_internal() as the callback.
 *
 * Returns 0 and copies the 20-byte blob name into sha1 when the walk
 * recorded one; returns -1 (leaving sha1 untouched) when the scratch
 * buffer is still all zero after the walk.
 */
static int get_blob_sha1(struct tree *t, const char *pathname,
			 unsigned char *sha1)
{
	static const unsigned char unset_sha1[20];
	const char *pathspec[2];

	pathspec[0] = pathname;
	pathspec[1] = NULL;

	/* Start from all-zero so that "nothing found" is detectable. */
	memset(blob_sha1, 0, sizeof(blob_sha1));
	read_tree_recursive(t, "", 0, 0, pathspec, get_blob_sha1_internal);

	if (!memcmp(blob_sha1, unset_sha1, sizeof(blob_sha1)))
		return -1;

	memcpy(sha1, blob_sha1, 20);
	return 0;
}
|
|
|
|
static int get_blob_sha1_internal(unsigned char *sha1, const char *base,
|
|
int baselen, const char *pathname,
|
|
unsigned mode, int stage)
|
|
{
|
|
if (S_ISDIR(mode))
|
|
return READ_TREE_RECURSIVE;
|
|
|
|
memcpy(blob_sha1, sha1, 20);
|
|
return -1;
|
|
}
|
|
|
|
static void get_blob(struct commit *commit)
|
|
{
|
|
struct util_info *info = commit->object.util;
|
|
char type[20];
|
|
|
|
if (info->buf)
|
|
return;
|
|
|
|
info->buf = read_sha1_file(info->sha1, type, &info->size);
|
|
|
|
assert(!strcmp(type, "blob"));
|
|
}
|
|
|
|
/* For debugging only */
|
|
static void print_patch(struct patch *p)
|
|
{
|
|
int i;
|
|
printf("Num chunks: %d\n", p->num);
|
|
for (i = 0; i < p->num; i++) {
|
|
printf("%d,%d %d,%d\n", p->chunks[i].off1, p->chunks[i].len1,
|
|
p->chunks[i].off2, p->chunks[i].len2);
|
|
}
|
|
}
|
|
|
|
/* For debugging only */
|
|
static void print_map(struct commit *cmit, struct commit *other)
|
|
{
|
|
struct util_info *util = cmit->object.util;
|
|
struct util_info *util2 = other->object.util;
|
|
|
|
int i;
|
|
int max =
|
|
util->num_lines >
|
|
util2->num_lines ? util->num_lines : util2->num_lines;
|
|
int num;
|
|
|
|
for (i = 0; i < max; i++) {
|
|
printf("i: %d ", i);
|
|
num = -1;
|
|
|
|
if (i < util->num_lines) {
|
|
num = util->line_map[i];
|
|
printf("%d\t", num);
|
|
} else
|
|
printf("\t");
|
|
|
|
if (i < util2->num_lines) {
|
|
int num2 = util2->line_map[i];
|
|
printf("%d\t", num2);
|
|
if (num != -1 && num2 != num)
|
|
printf("---");
|
|
} else
|
|
printf("\t");
|
|
|
|
printf("\n");
|
|
}
|
|
}
|
|
|
|
// p is a patch from commit to other.
|
|
static void fill_line_map(struct commit *commit, struct commit *other,
|
|
struct patch *p)
|
|
{
|
|
struct util_info *util = commit->object.util;
|
|
struct util_info *util2 = other->object.util;
|
|
int *map = util->line_map;
|
|
int *map2 = util2->line_map;
|
|
int cur_chunk = 0;
|
|
int i1, i2;
|
|
|
|
if (p->num && DEBUG)
|
|
print_patch(p);
|
|
|
|
if (DEBUG)
|
|
printf("num lines 1: %d num lines 2: %d\n", util->num_lines,
|
|
util2->num_lines);
|
|
|
|
for (i1 = 0, i2 = 0; i1 < util->num_lines; i1++, i2++) {
|
|
struct chunk *chunk = NULL;
|
|
if (cur_chunk < p->num)
|
|
chunk = &p->chunks[cur_chunk];
|
|
|
|
if (chunk && chunk->off1 == i1) {
|
|
if (DEBUG && i2 != chunk->off2)
|
|
printf("i2: %d off2: %d\n", i2, chunk->off2);
|
|
|
|
assert(i2 == chunk->off2);
|
|
|
|
i1--;
|
|
i2--;
|
|
if (chunk->len1 > 0)
|
|
i1 += chunk->len1;
|
|
|
|
if (chunk->len2 > 0)
|
|
i2 += chunk->len2;
|
|
|
|
cur_chunk++;
|
|
} else {
|
|
if (i2 >= util2->num_lines)
|
|
break;
|
|
|
|
if (map[i1] != map2[i2] && map[i1] != -1) {
|
|
if (DEBUG)
|
|
printf("map: i1: %d %d %p i2: %d %d %p\n",
|
|
i1, map[i1],
|
|
i1 != -1 ? blame_lines[map[i1]] : NULL,
|
|
i2, map2[i2],
|
|
i2 != -1 ? blame_lines[map2[i2]] : NULL);
|
|
if (map2[i2] != -1 &&
|
|
blame_lines[map[i1]] &&
|
|
!blame_lines[map2[i2]])
|
|
map[i1] = map2[i2];
|
|
}
|
|
|
|
if (map[i1] == -1 && map2[i2] != -1)
|
|
map[i1] = map2[i2];
|
|
}
|
|
|
|
if (DEBUG > 1)
|
|
printf("l1: %d l2: %d i1: %d i2: %d\n",
|
|
map[i1], map2[i2], i1, i2);
|
|
}
|
|
}
|
|
|
|
static int map_line(struct commit *commit, int line)
|
|
{
|
|
struct util_info *info = commit->object.util;
|
|
assert(line >= 0 && line < info->num_lines);
|
|
return info->line_map[line];
|
|
}
|
|
|
|
static int fill_util_info(struct commit *commit, const char *path)
|
|
{
|
|
struct util_info *util;
|
|
if (commit->object.util)
|
|
return 0;
|
|
|
|
util = xmalloc(sizeof(struct util_info));
|
|
|
|
if (get_blob_sha1(commit->tree, path, util->sha1)) {
|
|
free(util);
|
|
return 1;
|
|
} else {
|
|
util->buf = NULL;
|
|
util->size = 0;
|
|
util->line_map = NULL;
|
|
util->num_lines = -1;
|
|
commit->object.util = util;
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
static void alloc_line_map(struct commit *commit)
|
|
{
|
|
struct util_info *util = commit->object.util;
|
|
int i;
|
|
|
|
if (util->line_map)
|
|
return;
|
|
|
|
get_blob(commit);
|
|
|
|
util->num_lines = 0;
|
|
for (i = 0; i < util->size; i++) {
|
|
if (util->buf[i] == '\n')
|
|
util->num_lines++;
|
|
}
|
|
if(util->buf[util->size - 1] != '\n')
|
|
util->num_lines++;
|
|
|
|
util->line_map = xmalloc(sizeof(int) * util->num_lines);
|
|
|
|
for (i = 0; i < util->num_lines; i++)
|
|
util->line_map[i] = -1;
|
|
}
|
|
|
|
static void init_first_commit(struct commit* commit, const char* filename)
|
|
{
|
|
struct util_info* util;
|
|
int i;
|
|
|
|
if (fill_util_info(commit, filename))
|
|
die("fill_util_info failed");
|
|
|
|
alloc_line_map(commit);
|
|
|
|
util = commit->object.util;
|
|
num_blame_lines = util->num_lines;
|
|
|
|
for (i = 0; i < num_blame_lines; i++)
|
|
util->line_map[i] = i;
|
|
}
|
|
|
|
|
|
static void process_commits(struct rev_info *rev, const char *path,
|
|
struct commit** initial)
|
|
{
|
|
int i;
|
|
struct util_info* util;
|
|
int lines_left;
|
|
int *blame_p;
|
|
int *new_lines;
|
|
int new_lines_len;
|
|
|
|
struct commit* commit = get_revision(rev);
|
|
assert(commit);
|
|
init_first_commit(commit, path);
|
|
|
|
util = commit->object.util;
|
|
num_blame_lines = util->num_lines;
|
|
blame_lines = xmalloc(sizeof(struct commit *) * num_blame_lines);
|
|
for (i = 0; i < num_blame_lines; i++)
|
|
blame_lines[i] = NULL;
|
|
|
|
lines_left = num_blame_lines;
|
|
blame_p = xmalloc(sizeof(int) * num_blame_lines);
|
|
new_lines = xmalloc(sizeof(int) * num_blame_lines);
|
|
do {
|
|
struct commit_list *parents;
|
|
int num_parents;
|
|
struct util_info *util;
|
|
|
|
if (DEBUG)
|
|
printf("\nProcessing commit: %d %s\n", num_commits,
|
|
sha1_to_hex(commit->object.sha1));
|
|
|
|
if (lines_left == 0)
|
|
return;
|
|
|
|
num_commits++;
|
|
memset(blame_p, 0, sizeof(int) * num_blame_lines);
|
|
new_lines_len = 0;
|
|
num_parents = 0;
|
|
for (parents = commit->parents;
|
|
parents != NULL; parents = parents->next)
|
|
num_parents++;
|
|
|
|
if(num_parents == 0)
|
|
*initial = commit;
|
|
|
|
if(fill_util_info(commit, path))
|
|
continue;
|
|
|
|
alloc_line_map(commit);
|
|
util = commit->object.util;
|
|
|
|
for (parents = commit->parents;
|
|
parents != NULL; parents = parents->next) {
|
|
struct commit *parent = parents->item;
|
|
struct patch *patch;
|
|
|
|
if (parse_commit(parent) < 0)
|
|
die("parse_commit error");
|
|
|
|
if (DEBUG)
|
|
printf("parent: %s\n",
|
|
sha1_to_hex(parent->object.sha1));
|
|
|
|
if(fill_util_info(parent, path)) {
|
|
num_parents--;
|
|
continue;
|
|
}
|
|
|
|
patch = get_patch(parent, commit);
|
|
alloc_line_map(parent);
|
|
fill_line_map(parent, commit, patch);
|
|
|
|
for (i = 0; i < patch->num; i++) {
|
|
int l;
|
|
for (l = 0; l < patch->chunks[i].len2; l++) {
|
|
int mapped_line =
|
|
map_line(commit, patch->chunks[i].off2 + l);
|
|
if (mapped_line != -1) {
|
|
blame_p[mapped_line]++;
|
|
if (blame_p[mapped_line] == num_parents)
|
|
new_lines[new_lines_len++] = mapped_line;
|
|
}
|
|
}
|
|
}
|
|
free_patch(patch);
|
|
}
|
|
|
|
if (DEBUG)
|
|
printf("parents: %d\n", num_parents);
|
|
|
|
for (i = 0; i < new_lines_len; i++) {
|
|
int mapped_line = new_lines[i];
|
|
if (blame_lines[mapped_line] == NULL) {
|
|
blame_lines[mapped_line] = commit;
|
|
lines_left--;
|
|
if (DEBUG)
|
|
printf("blame: mapped: %d i: %d\n",
|
|
mapped_line, i);
|
|
}
|
|
}
|
|
} while ((commit = get_revision(rev)) != NULL);
|
|
}
|
|
|
|
int main(int argc, const char **argv)
|
|
{
|
|
int i;
|
|
struct commit *initial = NULL;
|
|
unsigned char sha1[20];
|
|
const char* filename;
|
|
int num_args;
|
|
const char* args[10];
|
|
struct rev_info rev;
|
|
|
|
setup_git_directory();
|
|
|
|
if (argc != 3)
|
|
die("Usage: blame commit-ish file");
|
|
|
|
|
|
filename = argv[2];
|
|
|
|
{
|
|
struct commit* commit;
|
|
if (get_sha1(argv[1], sha1))
|
|
die("get_sha1 failed");
|
|
commit = lookup_commit_reference(sha1);
|
|
|
|
if (fill_util_info(commit, filename)) {
|
|
printf("%s not found in %s\n", filename, argv[1]);
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
num_args = 0;
|
|
args[num_args++] = NULL;
|
|
args[num_args++] = "--topo-order";
|
|
args[num_args++] = "--remove-empty";
|
|
args[num_args++] = argv[1];
|
|
args[num_args++] = "--";
|
|
args[num_args++] = filename;
|
|
args[num_args] = NULL;
|
|
|
|
setup_revisions(num_args, args, &rev, "HEAD");
|
|
prepare_revision_walk(&rev);
|
|
process_commits(&rev, filename, &initial);
|
|
|
|
for (i = 0; i < num_blame_lines; i++) {
|
|
struct commit *c = blame_lines[i];
|
|
if (!c)
|
|
c = initial;
|
|
|
|
printf("%d %.8s\n", i, sha1_to_hex(c->object.sha1));
|
|
// printf("%d %s\n", i, find_unique_abbrev(blame_lines[i]->object.sha1, 6));
|
|
}
|
|
|
|
if (DEBUG) {
|
|
printf("num get patch: %d\n", num_get_patch);
|
|
printf("num commits: %d\n", num_commits);
|
|
printf("patch time: %f\n", patch_time / 1000000.0);
|
|
printf("initial: %s\n", sha1_to_hex(initial->object.sha1));
|
|
}
|
|
|
|
return 0;
|
|
}
|