]> git.armaanb.net Git - stagit.git/blob - stagit.c
don't use a heuristic for renames, the content must match exactly
[stagit.git] / stagit.c
1 #include <sys/stat.h>
2 #include <sys/types.h>
3
4 #include <err.h>
5 #include <errno.h>
6 #include <inttypes.h>
7 #include <libgen.h>
8 #include <limits.h>
9 #include <stdio.h>
10 #include <stdlib.h>
11 #include <string.h>
12 #include <unistd.h>
13
14 #include <git2.h>
15
16 #include "compat.h"
17
18 struct deltainfo {
19         git_patch *patch;
20
21         size_t addcount;
22         size_t delcount;
23 };
24
25 struct commitinfo {
26         const git_oid *id;
27
28         char oid[GIT_OID_HEXSZ + 1];
29         char parentoid[GIT_OID_HEXSZ + 1];
30
31         const git_signature *author;
32         const git_signature *committer;
33         const char          *summary;
34         const char          *msg;
35
36         git_diff   *diff;
37         git_commit *commit;
38         git_commit *parent;
39         git_tree   *commit_tree;
40         git_tree   *parent_tree;
41
42         size_t addcount;
43         size_t delcount;
44         size_t filecount;
45
46         struct deltainfo **deltas;
47         size_t ndeltas;
48 };
49
50 static git_repository *repo;
51
52 static const char *relpath = "";
53 static const char *repodir;
54
55 static char *name = "";
56 static char *strippedname = "";
57 static char description[255];
58 static char cloneurl[1024];
59 static char *submodules;
60 static char *licensefiles[] = { "HEAD:LICENSE", "HEAD:LICENSE.md", "HEAD:COPYING" };
61 static char *license;
62 static char *readmefiles[] = { "HEAD:README", "HEAD:README.md" };
63 static char *readme;
64 static long long nlogcommits = -1; /* < 0 indicates not used */
65
66 /* cache */
67 static git_oid lastoid;
68 static char lastoidstr[GIT_OID_HEXSZ + 2]; /* id + newline + NUL byte */
69 static FILE *rcachefp, *wcachefp;
70 static const char *cachefile;
71
/*
 * Join `path` and `path2` into `buf` (capacity `bufsiz`). A '/' is inserted
 * between them unless `path` is empty or already ends in '/'.
 * Exits through errx() when formatting fails or the result does not fit.
 */
void
joinpath(char *buf, size_t bufsiz, const char *path, const char *path2)
{
	const char *sep;
	size_t pathlen;
	int r;

	pathlen = strlen(path);
	sep = (pathlen > 0 && path[pathlen - 1] != '/') ? "/" : "";

	r = snprintf(buf, bufsiz, "%s%s%s", path, sep, path2);
	/* snprintf signals an error with any negative value, not only -1 */
	if (r < 0 || (size_t)r >= bufsiz)
		errx(1, "path truncated: '%s%s%s'", path, sep, path2);
}
83
84 void
85 deltainfo_free(struct deltainfo *di)
86 {
87         if (!di)
88                 return;
89         git_patch_free(di->patch);
90         memset(di, 0, sizeof(*di));
91         free(di);
92 }
93
94 int
95 commitinfo_getstats(struct commitinfo *ci)
96 {
97         struct deltainfo *di;
98         git_diff_options opts;
99         git_diff_find_options fopts;
100         const git_diff_delta *delta;
101         const git_diff_hunk *hunk;
102         const git_diff_line *line;
103         git_patch *patch = NULL;
104         size_t ndeltas, nhunks, nhunklines;
105         size_t i, j, k;
106
107         if (git_tree_lookup(&(ci->commit_tree), repo, git_commit_tree_id(ci->commit)))
108                 goto err;
109         if (!git_commit_parent(&(ci->parent), ci->commit, 0)) {
110                 if (git_tree_lookup(&(ci->parent_tree), repo, git_commit_tree_id(ci->parent))) {
111                         ci->parent = NULL;
112                         ci->parent_tree = NULL;
113                 }
114         }
115
116         git_diff_init_options(&opts, GIT_DIFF_OPTIONS_VERSION);
117         opts.flags |= GIT_DIFF_DISABLE_PATHSPEC_MATCH |
118                       GIT_DIFF_IGNORE_SUBMODULES |
119                       GIT_DIFF_INCLUDE_TYPECHANGE;
120         if (git_diff_tree_to_tree(&(ci->diff), repo, ci->parent_tree, ci->commit_tree, &opts))
121                 goto err;
122
123         if (git_diff_find_init_options(&fopts, GIT_DIFF_FIND_OPTIONS_VERSION))
124                 goto err;
125         /* find renames and copies, exact matches (no heuristic) for renames. */
126         fopts.flags |= GIT_DIFF_FIND_RENAMES | GIT_DIFF_FIND_COPIES |
127                        GIT_DIFF_FIND_EXACT_MATCH_ONLY;
128         if (git_diff_find_similar(ci->diff, &fopts))
129                 goto err;
130
131         ndeltas = git_diff_num_deltas(ci->diff);
132         if (ndeltas && !(ci->deltas = calloc(ndeltas, sizeof(struct deltainfo *))))
133                 err(1, "calloc");
134
135         for (i = 0; i < ndeltas; i++) {
136                 if (git_patch_from_diff(&patch, ci->diff, i))
137                         goto err;
138
139                 if (!(di = calloc(1, sizeof(struct deltainfo))))
140                         err(1, "calloc");
141                 di->patch = patch;
142                 ci->deltas[i] = di;
143
144                 delta = git_patch_get_delta(patch);
145
146                 /* skip stats for binary data */
147                 if (delta->flags & GIT_DIFF_FLAG_BINARY)
148                         continue;
149
150                 nhunks = git_patch_num_hunks(patch);
151                 for (j = 0; j < nhunks; j++) {
152                         if (git_patch_get_hunk(&hunk, &nhunklines, patch, j))
153                                 break;
154                         for (k = 0; ; k++) {
155                                 if (git_patch_get_line_in_hunk(&line, patch, j, k))
156                                         break;
157                                 if (line->old_lineno == -1) {
158                                         di->addcount++;
159                                         ci->addcount++;
160                                 } else if (line->new_lineno == -1) {
161                                         di->delcount++;
162                                         ci->delcount++;
163                                 }
164                         }
165                 }
166         }
167         ci->ndeltas = i;
168         ci->filecount = i;
169
170         return 0;
171
172 err:
173         git_diff_free(ci->diff);
174         ci->diff = NULL;
175         git_tree_free(ci->commit_tree);
176         ci->commit_tree = NULL;
177         git_tree_free(ci->parent_tree);
178         ci->parent_tree = NULL;
179         git_commit_free(ci->parent);
180         ci->parent = NULL;
181
182         if (ci->deltas)
183                 for (i = 0; i < ci->ndeltas; i++)
184                         deltainfo_free(ci->deltas[i]);
185         free(ci->deltas);
186         ci->deltas = NULL;
187         ci->ndeltas = 0;
188         ci->addcount = 0;
189         ci->delcount = 0;
190         ci->filecount = 0;
191
192         return -1;
193 }
194
195 void
196 commitinfo_free(struct commitinfo *ci)
197 {
198         size_t i;
199
200         if (!ci)
201                 return;
202         if (ci->deltas)
203                 for (i = 0; i < ci->ndeltas; i++)
204                         deltainfo_free(ci->deltas[i]);
205
206         free(ci->deltas);
207         git_diff_free(ci->diff);
208         git_tree_free(ci->commit_tree);
209         git_tree_free(ci->parent_tree);
210         git_commit_free(ci->commit);
211         git_commit_free(ci->parent);
212         memset(ci, 0, sizeof(*ci));
213         free(ci);
214 }
215
216 struct commitinfo *
217 commitinfo_getbyoid(const git_oid *id)
218 {
219         struct commitinfo *ci;
220
221         if (!(ci = calloc(1, sizeof(struct commitinfo))))
222                 err(1, "calloc");
223
224         if (git_commit_lookup(&(ci->commit), repo, id))
225                 goto err;
226         ci->id = id;
227
228         git_oid_tostr(ci->oid, sizeof(ci->oid), git_commit_id(ci->commit));
229         git_oid_tostr(ci->parentoid, sizeof(ci->parentoid), git_commit_parent_id(ci->commit, 0));
230
231         ci->author = git_commit_author(ci->commit);
232         ci->committer = git_commit_committer(ci->commit);
233         ci->summary = git_commit_summary(ci->commit);
234         ci->msg = git_commit_message(ci->commit);
235
236         return ci;
237
238 err:
239         commitinfo_free(ci);
240
241         return NULL;
242 }
243
/* fopen() wrapper that terminates the program through err() on failure. */
FILE *
efopen(const char *name, const char *flags)
{
	FILE *stream = fopen(name, flags);

	if (stream == NULL)
		err(1, "fopen: '%s'", name);

	return stream;
}
254
/*
 * Escape characters below as HTML 2.0 / XML 1.0.
 * Writes at most `len` bytes of `s` to `fp`, stopping early at a NUL byte.
 * The length is checked before each byte is read, so `s` does not have to be
 * NUL-terminated and nothing beyond s[len - 1] is accessed.
 */
void
xmlencode(FILE *fp, const char *s, size_t len)
{
	size_t i;

	for (i = 0; i < len && s[i]; i++) {
		switch (s[i]) {
		case '<':  fputs("&lt;",   fp); break;
		case '>':  fputs("&gt;",   fp); break;
		case '\'': fputs("&#39;",  fp); break;
		case '&':  fputs("&amp;",  fp); break;
		case '"':  fputs("&quot;", fp); break;
		default:   fputc(s[i], fp);
		}
	}
}
272
273 int
274 mkdirp(const char *path)
275 {
276         char tmp[PATH_MAX], *p;
277
278         if (strlcpy(tmp, path, sizeof(tmp)) >= sizeof(tmp))
279                 errx(1, "path truncated: '%s'", path);
280         for (p = tmp + (tmp[0] == '/'); *p; p++) {
281                 if (*p != '/')
282                         continue;
283                 *p = '\0';
284                 if (mkdir(tmp, S_IRWXU | S_IRWXG | S_IRWXO) < 0 && errno != EEXIST)
285                         return -1;
286                 *p = '/';
287         }
288         if (mkdir(tmp, S_IRWXU | S_IRWXG | S_IRWXO) < 0 && errno != EEXIST)
289                 return -1;
290         return 0;
291 }
292
293 void
294 printtimez(FILE *fp, const git_time *intime)
295 {
296         struct tm *intm;
297         time_t t;
298         char out[32];
299
300         t = (time_t)intime->time;
301         if (!(intm = gmtime(&t)))
302                 return;
303         strftime(out, sizeof(out), "%Y-%m-%dT%H:%M:%SZ", intm);
304         fputs(out, fp);
305 }
306
307 void
308 printtime(FILE *fp, const git_time *intime)
309 {
310         struct tm *intm;
311         time_t t;
312         char out[32];
313
314         t = (time_t)intime->time + (intime->offset * 60);
315         if (!(intm = gmtime(&t)))
316                 return;
317         strftime(out, sizeof(out), "%a, %e %b %Y %H:%M:%S", intm);
318         if (intime->offset < 0)
319                 fprintf(fp, "%s -%02d%02d", out,
320                             -(intime->offset) / 60, -(intime->offset) % 60);
321         else
322                 fprintf(fp, "%s +%02d%02d", out,
323                             intime->offset / 60, intime->offset % 60);
324 }
325
326 void
327 printtimeshort(FILE *fp, const git_time *intime)
328 {
329         struct tm *intm;
330         time_t t;
331         char out[32];
332
333         t = (time_t)intime->time;
334         if (!(intm = gmtime(&t)))
335                 return;
336         strftime(out, sizeof(out), "%Y-%m-%d %H:%M", intm);
337         fputs(out, fp);
338 }
339
340 void
341 writeheader(FILE *fp, const char *title)
342 {
343         fputs("<!DOCTYPE html>\n"
344                 "<html>\n<head>\n"
345                 "<meta http-equiv=\"Content-Type\" content=\"text/html; charset=UTF-8\" />\n"
346                 "<title>", fp);
347         xmlencode(fp, title, strlen(title));
348         if (title[0] && strippedname[0])
349                 fputs(" - ", fp);
350         xmlencode(fp, strippedname, strlen(strippedname));
351         if (description[0])
352                 fputs(" - ", fp);
353         xmlencode(fp, description, strlen(description));
354         fprintf(fp, "</title>\n<link rel=\"icon\" type=\"image/png\" href=\"%sfavicon.png\" />\n", relpath);
355         fprintf(fp, "<link rel=\"alternate\" type=\"application/atom+xml\" title=\"%s Atom Feed\" href=\"%satom.xml\" />\n",
356                 name, relpath);
357         fprintf(fp, "<link rel=\"stylesheet\" type=\"text/css\" href=\"%sstyle.css\" />\n", relpath);
358         fputs("</head>\n<body>\n<table><tr><td>", fp);
359         fprintf(fp, "<a href=\"../%s\"><img src=\"%slogo.png\" alt=\"\" width=\"32\" height=\"32\" /></a>",
360                 relpath, relpath);
361         fputs("</td><td><h1>", fp);
362         xmlencode(fp, strippedname, strlen(strippedname));
363         fputs("</h1><span class=\"desc\">", fp);
364         xmlencode(fp, description, strlen(description));
365         fputs("</span></td></tr>", fp);
366         if (cloneurl[0]) {
367                 fputs("<tr class=\"url\"><td></td><td>git clone <a href=\"", fp);
368                 xmlencode(fp, cloneurl, strlen(cloneurl));
369                 fputs("\">", fp);
370                 xmlencode(fp, cloneurl, strlen(cloneurl));
371                 fputs("</a></td></tr>", fp);
372         }
373         fputs("<tr><td></td><td>\n", fp);
374         fprintf(fp, "<a href=\"%slog.html\">Log</a> | ", relpath);
375         fprintf(fp, "<a href=\"%sfiles.html\">Files</a> | ", relpath);
376         fprintf(fp, "<a href=\"%srefs.html\">Refs</a>", relpath);
377         if (submodules)
378                 fprintf(fp, " | <a href=\"%sfile/%s.html\">Submodules</a>",
379                         relpath, submodules);
380         if (readme)
381                 fprintf(fp, " | <a href=\"%sfile/%s.html\">README</a>",
382                         relpath, readme);
383         if (license)
384                 fprintf(fp, " | <a href=\"%sfile/%s.html\">LICENSE</a>",
385                         relpath, license);
386         fputs("</td></tr></table>\n<hr/>\n<div id=\"content\">\n", fp);
387 }
388
/* Write the closing tags of the content div, the body and the document. */
void
writefooter(FILE *fp)
{
	static const char footer[] = "</div>\n</body>\n</html>\n";

	fputs(footer, fp);
}
394
395 int
396 writeblobhtml(FILE *fp, const git_blob *blob)
397 {
398         size_t n = 0, i, prev;
399         const char *nfmt = "<a href=\"#l%d\" class=\"line\" id=\"l%d\">%7d</a> ";
400         const char *s = git_blob_rawcontent(blob);
401         git_off_t len = git_blob_rawsize(blob);
402
403         fputs("<pre id=\"blob\">\n", fp);
404
405         if (len > 0) {
406                 for (i = 0, prev = 0; i < (size_t)len; i++) {
407                         if (s[i] != '\n')
408                                 continue;
409                         n++;
410                         fprintf(fp, nfmt, n, n, n);
411                         xmlencode(fp, &s[prev], i - prev + 1);
412                         prev = i + 1;
413                 }
414                 /* trailing data */
415                 if ((len - prev) > 0) {
416                         n++;
417                         fprintf(fp, nfmt, n, n, n);
418                         xmlencode(fp, &s[prev], len - prev);
419                 }
420         }
421
422         fputs("</pre>\n", fp);
423
424         return n;
425 }
426
427 void
428 printcommit(FILE *fp, struct commitinfo *ci)
429 {
430         fprintf(fp, "<b>commit</b> <a href=\"%scommit/%s.html\">%s</a>\n",
431                 relpath, ci->oid, ci->oid);
432
433         if (ci->parentoid[0])
434                 fprintf(fp, "<b>parent</b> <a href=\"%scommit/%s.html\">%s</a>\n",
435                         relpath, ci->parentoid, ci->parentoid);
436
437         if (ci->author) {
438                 fputs("<b>Author:</b> ", fp);
439                 xmlencode(fp, ci->author->name, strlen(ci->author->name));
440                 fputs(" &lt;<a href=\"mailto:", fp);
441                 xmlencode(fp, ci->author->email, strlen(ci->author->email));
442                 fputs("\">", fp);
443                 xmlencode(fp, ci->author->email, strlen(ci->author->email));
444                 fputs("</a>&gt;\n<b>Date:</b>   ", fp);
445                 printtime(fp, &(ci->author->when));
446                 fputc('\n', fp);
447         }
448         if (ci->msg) {
449                 fputc('\n', fp);
450                 xmlencode(fp, ci->msg, strlen(ci->msg));
451                 fputc('\n', fp);
452         }
453 }
454
455 void
456 printshowfile(FILE *fp, struct commitinfo *ci)
457 {
458         const git_diff_delta *delta;
459         const git_diff_hunk *hunk;
460         const git_diff_line *line;
461         git_patch *patch;
462         size_t nhunks, nhunklines, changed, add, del, total, i, j, k;
463         char linestr[80];
464
465         printcommit(fp, ci);
466
467         if (!ci->deltas)
468                 return;
469
470         if (ci->filecount > 1000   ||
471             ci->ndeltas   > 1000   ||
472             ci->addcount  > 100000 ||
473             ci->delcount  > 100000) {
474                 fputs("Diff is too large, output suppressed.\n", fp);
475                 return;
476         }
477
478         /* diff stat */
479         fputs("<b>Diffstat:</b>\n<table>", fp);
480         for (i = 0; i < ci->ndeltas; i++) {
481                 delta = git_patch_get_delta(ci->deltas[i]->patch);
482
483                 fprintf(fp, "<tr><td><a href=\"#h%zu\">", i);
484                 xmlencode(fp, delta->old_file.path, strlen(delta->old_file.path));
485                 if (strcmp(delta->old_file.path, delta->new_file.path)) {
486                         fputs(" -&gt; ", fp);
487                         xmlencode(fp, delta->new_file.path, strlen(delta->new_file.path));
488                 }
489
490                 add = ci->deltas[i]->addcount;
491                 del = ci->deltas[i]->delcount;
492                 changed = add + del;
493                 total = sizeof(linestr) - 2;
494                 if (changed > total) {
495                         if (add)
496                                 add = ((float)total / changed * add) + 1;
497                         if (del)
498                                 del = ((float)total / changed * del) + 1;
499                 }
500                 memset(&linestr, '+', add);
501                 memset(&linestr[add], '-', del);
502
503                 fprintf(fp, "</a></td><td> | </td><td class=\"num\">%zu</td><td><span class=\"i\">",
504                         ci->deltas[i]->addcount + ci->deltas[i]->delcount);
505                 fwrite(&linestr, 1, add, fp);
506                 fputs("</span><span class=\"d\">", fp);
507                 fwrite(&linestr[add], 1, del, fp);
508                 fputs("</span></td></tr>\n", fp);
509         }
510         fprintf(fp, "</table></pre><pre>%zu file%s changed, %zu insertion%s(+), %zu deletion%s(-)\n",
511                 ci->filecount, ci->filecount == 1 ? "" : "s",
512                 ci->addcount,  ci->addcount  == 1 ? "" : "s",
513                 ci->delcount,  ci->delcount  == 1 ? "" : "s");
514
515         fputs("<hr/>", fp);
516
517         for (i = 0; i < ci->ndeltas; i++) {
518                 patch = ci->deltas[i]->patch;
519                 delta = git_patch_get_delta(patch);
520                 fprintf(fp, "<b>diff --git a/<a id=\"h%zu\" href=\"%sfile/%s.html\">%s</a> b/<a href=\"%sfile/%s.html\">%s</a></b>\n",
521                         i, relpath, delta->old_file.path, delta->old_file.path,
522                         relpath, delta->new_file.path, delta->new_file.path);
523
524                 /* check binary data */
525                 if (delta->flags & GIT_DIFF_FLAG_BINARY) {
526                         fputs("Binary files differ.\n", fp);
527                         continue;
528                 }
529
530                 nhunks = git_patch_num_hunks(patch);
531                 for (j = 0; j < nhunks; j++) {
532                         if (git_patch_get_hunk(&hunk, &nhunklines, patch, j))
533                                 break;
534
535                         fprintf(fp, "<a href=\"#h%zu-%zu\" id=\"h%zu-%zu\" class=\"h\">", i, j, i, j);
536                         xmlencode(fp, hunk->header, hunk->header_len);
537                         fputs("</a>", fp);
538
539                         for (k = 0; ; k++) {
540                                 if (git_patch_get_line_in_hunk(&line, patch, j, k))
541                                         break;
542                                 if (line->old_lineno == -1)
543                                         fprintf(fp, "<a href=\"#h%zu-%zu-%zu\" id=\"h%zu-%zu-%zu\" class=\"i\">+",
544                                                 i, j, k, i, j, k);
545                                 else if (line->new_lineno == -1)
546                                         fprintf(fp, "<a href=\"#h%zu-%zu-%zu\" id=\"h%zu-%zu-%zu\" class=\"d\">-",
547                                                 i, j, k, i, j, k);
548                                 else
549                                         fputc(' ', fp);
550                                 xmlencode(fp, line->content, line->content_len);
551                                 if (line->old_lineno == -1 || line->new_lineno == -1)
552                                         fputs("</a>", fp);
553                         }
554                 }
555         }
556 }
557
558 void
559 writelogline(FILE *fp, struct commitinfo *ci)
560 {
561         fputs("<tr><td>", fp);
562         if (ci->author)
563                 printtimeshort(fp, &(ci->author->when));
564         fputs("</td><td>", fp);
565         if (ci->summary) {
566                 fprintf(fp, "<a href=\"%scommit/%s.html\">", relpath, ci->oid);
567                 xmlencode(fp, ci->summary, strlen(ci->summary));
568                 fputs("</a>", fp);
569         }
570         fputs("</td><td>", fp);
571         if (ci->author)
572                 xmlencode(fp, ci->author->name, strlen(ci->author->name));
573         fputs("</td><td class=\"num\" align=\"right\">", fp);
574         fprintf(fp, "%zu", ci->filecount);
575         fputs("</td><td class=\"num\" align=\"right\">", fp);
576         fprintf(fp, "+%zu", ci->addcount);
577         fputs("</td><td class=\"num\" align=\"right\">", fp);
578         fprintf(fp, "-%zu", ci->delcount);
579         fputs("</td></tr>\n", fp);
580 }
581
582 int
583 writelog(FILE *fp, const git_oid *oid)
584 {
585         struct commitinfo *ci;
586         git_revwalk *w = NULL;
587         git_oid id;
588         char path[PATH_MAX], oidstr[GIT_OID_HEXSZ + 1];
589         FILE *fpfile;
590         int r;
591
592         git_revwalk_new(&w, repo);
593         git_revwalk_push(w, oid);
594         git_revwalk_sorting(w, GIT_SORT_TIME);
595         git_revwalk_simplify_first_parent(w);
596
597         while (!git_revwalk_next(&id, w)) {
598                 relpath = "";
599
600                 if (cachefile && !memcmp(&id, &lastoid, sizeof(id)))
601                         break;
602
603                 git_oid_tostr(oidstr, sizeof(oidstr), &id);
604                 r = snprintf(path, sizeof(path), "commit/%s.html", oidstr);
605                 if (r == -1 || (size_t)r >= sizeof(path))
606                         errx(1, "path truncated: 'commit/%s.html'", oidstr);
607                 r = access(path, F_OK);
608
609                 /* optimization: if there are no log lines to write and
610                    the commit file already exists: skip the diffstat */
611                 if (!nlogcommits && !r)
612                         continue;
613
614                 if (!(ci = commitinfo_getbyoid(&id)))
615                         break;
616                 /* diffstat: for stagit HTML required for the log.html line */
617                 if (commitinfo_getstats(ci) == -1)
618                         goto err;
619
620                 if (nlogcommits < 0) {
621                         writelogline(fp, ci);
622                 } else if (nlogcommits > 0) {
623                         writelogline(fp, ci);
624                         nlogcommits--;
625                         if (!nlogcommits && ci->parentoid[0])
626                                 fputs("<tr><td></td><td colspan=\"5\">"
627                                       "More commits remaining [...]</td>"
628                                       "</tr>\n", fp);
629                 }
630
631                 if (cachefile)
632                         writelogline(wcachefp, ci);
633
634                 /* check if file exists if so skip it */
635                 if (r) {
636                         relpath = "../";
637                         fpfile = efopen(path, "w");
638                         writeheader(fpfile, ci->summary);
639                         fputs("<pre>", fpfile);
640                         printshowfile(fpfile, ci);
641                         fputs("</pre>\n", fpfile);
642                         writefooter(fpfile);
643                         fclose(fpfile);
644                 }
645 err:
646                 commitinfo_free(ci);
647         }
648         git_revwalk_free(w);
649
650         relpath = "";
651
652         return 0;
653 }
654
655 void
656 printcommitatom(FILE *fp, struct commitinfo *ci)
657 {
658         fputs("<entry>\n", fp);
659
660         fprintf(fp, "<id>%s</id>\n", ci->oid);
661         if (ci->author) {
662                 fputs("<published>", fp);
663                 printtimez(fp, &(ci->author->when));
664                 fputs("</published>\n", fp);
665         }
666         if (ci->committer) {
667                 fputs("<updated>", fp);
668                 printtimez(fp, &(ci->committer->when));
669                 fputs("</updated>\n", fp);
670         }
671         if (ci->summary) {
672                 fputs("<title type=\"text\">", fp);
673                 xmlencode(fp, ci->summary, strlen(ci->summary));
674                 fputs("</title>\n", fp);
675         }
676         fprintf(fp, "<link rel=\"alternate\" type=\"text/html\" href=\"commit/%s.html\" />",
677                 ci->oid);
678
679         if (ci->author) {
680                 fputs("<author><name>", fp);
681                 xmlencode(fp, ci->author->name, strlen(ci->author->name));
682                 fputs("</name>\n<email>", fp);
683                 xmlencode(fp, ci->author->email, strlen(ci->author->email));
684                 fputs("</email>\n</author>\n", fp);
685         }
686
687         fputs("<content type=\"text\">", fp);
688         fprintf(fp, "commit %s\n", ci->oid);
689         if (ci->parentoid[0])
690                 fprintf(fp, "parent %s\n", ci->parentoid);
691         if (ci->author) {
692                 fputs("Author: ", fp);
693                 xmlencode(fp, ci->author->name, strlen(ci->author->name));
694                 fputs(" &lt;", fp);
695                 xmlencode(fp, ci->author->email, strlen(ci->author->email));
696                 fputs("&gt;\nDate:   ", fp);
697                 printtime(fp, &(ci->author->when));
698                 fputc('\n', fp);
699         }
700         if (ci->msg) {
701                 fputc('\n', fp);
702                 xmlencode(fp, ci->msg, strlen(ci->msg));
703         }
704         fputs("\n</content>\n</entry>\n", fp);
705 }
706
707 int
708 writeatom(FILE *fp)
709 {
710         struct commitinfo *ci;
711         git_revwalk *w = NULL;
712         git_oid id;
713         size_t i, m = 100; /* last 'm' commits */
714
715         fputs("<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n"
716               "<feed xmlns=\"http://www.w3.org/2005/Atom\">\n<title>", fp);
717         xmlencode(fp, strippedname, strlen(strippedname));
718         fputs(", branch HEAD</title>\n<subtitle>", fp);
719         xmlencode(fp, description, strlen(description));
720         fputs("</subtitle>\n", fp);
721
722         git_revwalk_new(&w, repo);
723         git_revwalk_push_head(w);
724         git_revwalk_sorting(w, GIT_SORT_TIME);
725         git_revwalk_simplify_first_parent(w);
726
727         for (i = 0; i < m && !git_revwalk_next(&id, w); i++) {
728                 if (!(ci = commitinfo_getbyoid(&id)))
729                         break;
730                 printcommitatom(fp, ci);
731                 commitinfo_free(ci);
732         }
733         git_revwalk_free(w);
734
735         fputs("</feed>\n", fp);
736
737         return 0;
738 }
739
740 int
741 writeblob(git_object *obj, const char *fpath, const char *filename, git_off_t filesize)
742 {
743         char tmp[PATH_MAX] = "", *d;
744         const char *p;
745         int lc = 0;
746         FILE *fp;
747
748         if (strlcpy(tmp, fpath, sizeof(tmp)) >= sizeof(tmp))
749                 errx(1, "path truncated: '%s'", fpath);
750         if (!(d = dirname(tmp)))
751                 err(1, "dirname");
752         if (mkdirp(d))
753                 return -1;
754
755         for (p = fpath, tmp[0] = '\0'; *p; p++) {
756                 if (*p == '/' && strlcat(tmp, "../", sizeof(tmp)) >= sizeof(tmp))
757                         errx(1, "path truncated: '../%s'", tmp);
758         }
759         relpath = tmp;
760
761         fp = efopen(fpath, "w");
762         writeheader(fp, filename);
763         fputs("<p> ", fp);
764         xmlencode(fp, filename, strlen(filename));
765         fprintf(fp, " (%juB)", (uintmax_t)filesize);
766         fputs("</p><hr/>", fp);
767
768         if (git_blob_is_binary((git_blob *)obj)) {
769                 fputs("<p>Binary file.</p>\n", fp);
770         } else {
771                 lc = writeblobhtml(fp, (git_blob *)obj);
772                 if (ferror(fp))
773                         err(1, "fwrite");
774         }
775         writefooter(fp);
776         fclose(fp);
777
778         relpath = "";
779
780         return lc;
781 }
782
783 const char *
784 filemode(git_filemode_t m)
785 {
786         static char mode[11];
787
788         memset(mode, '-', sizeof(mode) - 1);
789         mode[10] = '\0';
790
791         if (S_ISREG(m))
792                 mode[0] = '-';
793         else if (S_ISBLK(m))
794                 mode[0] = 'b';
795         else if (S_ISCHR(m))
796                 mode[0] = 'c';
797         else if (S_ISDIR(m))
798                 mode[0] = 'd';
799         else if (S_ISFIFO(m))
800                 mode[0] = 'p';
801         else if (S_ISLNK(m))
802                 mode[0] = 'l';
803         else if (S_ISSOCK(m))
804                 mode[0] = 's';
805         else
806                 mode[0] = '?';
807
808         if (m & S_IRUSR) mode[1] = 'r';
809         if (m & S_IWUSR) mode[2] = 'w';
810         if (m & S_IXUSR) mode[3] = 'x';
811         if (m & S_IRGRP) mode[4] = 'r';
812         if (m & S_IWGRP) mode[5] = 'w';
813         if (m & S_IXGRP) mode[6] = 'x';
814         if (m & S_IROTH) mode[7] = 'r';
815         if (m & S_IWOTH) mode[8] = 'w';
816         if (m & S_IXOTH) mode[9] = 'x';
817
818         if (m & S_ISUID) mode[3] = (mode[3] == 'x') ? 's' : 'S';
819         if (m & S_ISGID) mode[6] = (mode[6] == 'x') ? 's' : 'S';
820         if (m & S_ISVTX) mode[9] = (mode[9] == 'x') ? 't' : 'T';
821
822         return mode;
823 }
824
825 int
826 writefilestree(FILE *fp, git_tree *tree, const char *path)
827 {
828         const git_tree_entry *entry = NULL;
829         git_submodule *module = NULL;
830         git_object *obj = NULL;
831         git_off_t filesize;
832         const char *entryname;
833         char filepath[PATH_MAX], entrypath[PATH_MAX];
834         size_t count, i;
835         int lc, r, ret;
836
837         count = git_tree_entrycount(tree);
838         for (i = 0; i < count; i++) {
839                 if (!(entry = git_tree_entry_byindex(tree, i)) ||
840                     !(entryname = git_tree_entry_name(entry)))
841                         return -1;
842                 joinpath(entrypath, sizeof(entrypath), path, entryname);
843
844                 r = snprintf(filepath, sizeof(filepath), "file/%s.html",
845                          entrypath);
846                 if (r == -1 || (size_t)r >= sizeof(filepath))
847                         errx(1, "path truncated: 'file/%s.html'", entrypath);
848
849                 if (!git_tree_entry_to_object(&obj, repo, entry)) {
850                         switch (git_object_type(obj)) {
851                         case GIT_OBJ_BLOB:
852                                 break;
853                         case GIT_OBJ_TREE:
854                                 /* NOTE: recurses */
855                                 ret = writefilestree(fp, (git_tree *)obj,
856                                                      entrypath);
857                                 git_object_free(obj);
858                                 if (ret)
859                                         return ret;
860                                 continue;
861                         default:
862                                 git_object_free(obj);
863                                 continue;
864                         }
865
866                         filesize = git_blob_rawsize((git_blob *)obj);
867                         lc = writeblob(obj, filepath, entryname, filesize);
868
869                         fputs("<tr><td>", fp);
870                         fputs(filemode(git_tree_entry_filemode(entry)), fp);
871                         fprintf(fp, "</td><td><a href=\"%s%s\">", relpath, filepath);
872                         xmlencode(fp, entrypath, strlen(entrypath));
873                         fputs("</a></td><td class=\"num\" align=\"right\">", fp);
874                         if (lc > 0)
875                                 fprintf(fp, "%dL", lc);
876                         else
877                                 fprintf(fp, "%juB", (uintmax_t)filesize);
878                         fputs("</td></tr>\n", fp);
879                         git_object_free(obj);
880                 } else if (!git_submodule_lookup(&module, repo, entryname)) {
881                         fprintf(fp, "<tr><td>m---------</td><td><a href=\"%sfile/.gitmodules.html\">",
882                                 relpath);
883                         xmlencode(fp, entrypath, strlen(entrypath));
884                         git_submodule_free(module);
885                         fputs("</a></td><td class=\"num\" align=\"right\"></td></tr>\n", fp);
886                 }
887         }
888
889         return 0;
890 }
891
892 int
893 writefiles(FILE *fp, const git_oid *id)
894 {
895         git_tree *tree = NULL;
896         git_commit *commit = NULL;
897         int ret = -1;
898
899         fputs("<table id=\"files\"><thead>\n<tr>"
900               "<td><b>Mode</b></td><td><b>Name</b></td>"
901               "<td class=\"num\" align=\"right\"><b>Size</b></td>"
902               "</tr>\n</thead><tbody>\n", fp);
903
904         if (!git_commit_lookup(&commit, repo, id) &&
905             !git_commit_tree(&tree, commit))
906                 ret = writefilestree(fp, tree, "");
907
908         fputs("</tbody></table>", fp);
909
910         git_commit_free(commit);
911         git_tree_free(tree);
912
913         return ret;
914 }
915
916 int
917 refs_cmp(const void *v1, const void *v2)
918 {
919         git_reference *r1 = (*(git_reference **)v1);
920         git_reference *r2 = (*(git_reference **)v2);
921         int r;
922
923         if ((r = git_reference_is_branch(r1) - git_reference_is_branch(r2)))
924                 return r;
925
926         return strcmp(git_reference_shorthand(r1),
927                       git_reference_shorthand(r2));
928 }
929
930 int
931 writerefs(FILE *fp)
932 {
933         struct commitinfo *ci;
934         const git_oid *id = NULL;
935         git_object *obj = NULL;
936         git_reference *dref = NULL, *r, *ref = NULL;
937         git_reference_iterator *it = NULL;
938         git_reference **refs = NULL;
939         size_t count, i, j, refcount;
940         const char *titles[] = { "Branches", "Tags" };
941         const char *ids[] = { "branches", "tags" };
942         const char *name;
943
944         if (git_reference_iterator_new(&it, repo))
945                 return -1;
946
947         for (refcount = 0; !git_reference_next(&ref, it); refcount++) {
948                 if (!(refs = reallocarray(refs, refcount + 1, sizeof(git_reference *))))
949                         err(1, "realloc");
950                 refs[refcount] = ref;
951         }
952         git_reference_iterator_free(it);
953
954         /* sort by type then shorthand name */
955         qsort(refs, refcount, sizeof(git_reference *), refs_cmp);
956
957         for (j = 0; j < 2; j++) {
958                 for (i = 0, count = 0; i < refcount; i++) {
959                         if (!(git_reference_is_branch(refs[i]) && j == 0) &&
960                             !(git_reference_is_tag(refs[i]) && j == 1))
961                                 continue;
962
963                         switch (git_reference_type(refs[i])) {
964                         case GIT_REF_SYMBOLIC:
965                                 if (git_reference_resolve(&dref, refs[i]))
966                                         goto err;
967                                 r = dref;
968                                 break;
969                         case GIT_REF_OID:
970                                 r = refs[i];
971                                 break;
972                         default:
973                                 continue;
974                         }
975                         if (!git_reference_target(r) ||
976                             git_reference_peel(&obj, r, GIT_OBJ_ANY))
977                                 goto err;
978                         if (!(id = git_object_id(obj)))
979                                 goto err;
980                         if (!(ci = commitinfo_getbyoid(id)))
981                                 break;
982
983                         /* print header if it has an entry (first). */
984                         if (++count == 1) {
985                                 fprintf(fp, "<h2>%s</h2><table id=\"%s\">"
986                                         "<thead>\n<tr><td><b>Name</b></td>"
987                                         "<td><b>Last commit date</b></td>"
988                                         "<td><b>Author</b></td>\n</tr>\n"
989                                         "</thead><tbody>\n",
990                                          titles[j], ids[j]);
991                         }
992
993                         relpath = "";
994                         name = git_reference_shorthand(r);
995
996                         fputs("<tr><td>", fp);
997                         xmlencode(fp, name, strlen(name));
998                         fputs("</td><td>", fp);
999                         if (ci->author)
1000                                 printtimeshort(fp, &(ci->author->when));
1001                         fputs("</td><td>", fp);
1002                         if (ci->author)
1003                                 xmlencode(fp, ci->author->name, strlen(ci->author->name));
1004                         fputs("</td></tr>\n", fp);
1005
1006                         relpath = "../";
1007
1008                         commitinfo_free(ci);
1009                         git_object_free(obj);
1010                         obj = NULL;
1011                         git_reference_free(dref);
1012                         dref = NULL;
1013                 }
1014                 /* table footer */
1015                 if (count)
1016                         fputs("</tbody></table><br/>", fp);
1017         }
1018
1019 err:
1020         git_object_free(obj);
1021         git_reference_free(dref);
1022
1023         for (i = 0; i < refcount; i++)
1024                 git_reference_free(refs[i]);
1025         free(refs);
1026
1027         return 0;
1028 }
1029
/*
 * Print the command synopsis, prefixed with the program name `argv0`, to
 * stderr and terminate the process with exit status 1. Does not return.
 */
void
usage(char *argv0)
{
	FILE *out = stderr;

	fprintf(out, "%s [-c cachefile | -l commits] repodir\n", argv0);
	exit(1);
}
1036
1037 int
1038 main(int argc, char *argv[])
1039 {
1040         git_object *obj = NULL;
1041         const git_oid *head = NULL;
1042         const git_error *e = NULL;
1043         mode_t mask;
1044         FILE *fp, *fpread;
1045         char path[PATH_MAX], repodirabs[PATH_MAX + 1], *p;
1046         char tmppath[64] = "cache.XXXXXXXXXXXX", buf[BUFSIZ];
1047         size_t n;
1048         int i, fd;
1049
1050         for (i = 1; i < argc; i++) {
1051                 if (argv[i][0] != '-') {
1052                         if (repodir)
1053                                 usage(argv[0]);
1054                         repodir = argv[i];
1055                 } else if (argv[i][1] == 'c') {
1056                         if (nlogcommits > 0 || i + 1 >= argc)
1057                                 usage(argv[0]);
1058                         cachefile = argv[++i];
1059                 } else if (argv[i][1] == 'l') {
1060                         if (cachefile || i + 1 >= argc)
1061                                 usage(argv[0]);
1062                         errno = 0;
1063                         nlogcommits = strtoll(argv[++i], &p, 10);
1064                         if (argv[i][0] == '\0' || *p != '\0' ||
1065                             nlogcommits <= 0 || errno)
1066                                 usage(argv[0]);
1067                 }
1068         }
1069         if (!repodir)
1070                 usage(argv[0]);
1071
1072         if (!realpath(repodir, repodirabs))
1073                 err(1, "realpath");
1074
1075         git_libgit2_init();
1076
1077 #ifdef __OpenBSD__
1078         if (cachefile) {
1079                 if (pledge("stdio rpath wpath cpath fattr", NULL) == -1)
1080                         err(1, "pledge");
1081         } else {
1082                 if (pledge("stdio rpath wpath cpath", NULL) == -1)
1083                         err(1, "pledge");
1084         }
1085 #endif
1086
1087         if (git_repository_open_ext(&repo, repodir,
1088                 GIT_REPOSITORY_OPEN_NO_SEARCH, NULL) < 0) {
1089                 e = giterr_last();
1090                 fprintf(stderr, "%s: %s\n", argv[0], e->message);
1091                 return 1;
1092         }
1093
1094         /* find HEAD */
1095         if (!git_revparse_single(&obj, repo, "HEAD"))
1096                 head = git_object_id(obj);
1097         git_object_free(obj);
1098
1099         /* use directory name as name */
1100         if ((name = strrchr(repodirabs, '/')))
1101                 name++;
1102         else
1103                 name = "";
1104
1105         /* strip .git suffix */
1106         if (!(strippedname = strdup(name)))
1107                 err(1, "strdup");
1108         if ((p = strrchr(strippedname, '.')))
1109                 if (!strcmp(p, ".git"))
1110                         *p = '\0';
1111
1112         /* read description or .git/description */
1113         joinpath(path, sizeof(path), repodir, "description");
1114         if (!(fpread = fopen(path, "r"))) {
1115                 joinpath(path, sizeof(path), repodir, ".git/description");
1116                 fpread = fopen(path, "r");
1117         }
1118         if (fpread) {
1119                 if (!fgets(description, sizeof(description), fpread))
1120                         description[0] = '\0';
1121                 fclose(fpread);
1122         }
1123
1124         /* read url or .git/url */
1125         joinpath(path, sizeof(path), repodir, "url");
1126         if (!(fpread = fopen(path, "r"))) {
1127                 joinpath(path, sizeof(path), repodir, ".git/url");
1128                 fpread = fopen(path, "r");
1129         }
1130         if (fpread) {
1131                 if (!fgets(cloneurl, sizeof(cloneurl), fpread))
1132                         cloneurl[0] = '\0';
1133                 cloneurl[strcspn(cloneurl, "\n")] = '\0';
1134                 fclose(fpread);
1135         }
1136
1137         /* check LICENSE */
1138         for (i = 0; i < sizeof(licensefiles) / sizeof(*licensefiles) && !license; i++) {
1139                 if (!git_revparse_single(&obj, repo, licensefiles[i]) &&
1140                     git_object_type(obj) == GIT_OBJ_BLOB)
1141                         license = licensefiles[i] + strlen("HEAD:");
1142                 git_object_free(obj);
1143         }
1144
1145         /* check README */
1146         for (i = 0; i < sizeof(readmefiles) / sizeof(*readmefiles) && !readme; i++) {
1147                 if (!git_revparse_single(&obj, repo, readmefiles[i]) &&
1148                     git_object_type(obj) == GIT_OBJ_BLOB)
1149                         readme = readmefiles[i] + strlen("HEAD:");
1150                 git_object_free(obj);
1151         }
1152
1153         if (!git_revparse_single(&obj, repo, "HEAD:.gitmodules") &&
1154             git_object_type(obj) == GIT_OBJ_BLOB)
1155                 submodules = ".gitmodules";
1156         git_object_free(obj);
1157
1158         /* log for HEAD */
1159         fp = efopen("log.html", "w");
1160         relpath = "";
1161         mkdir("commit", S_IRWXU | S_IRWXG | S_IRWXO);
1162         writeheader(fp, "Log");
1163         fputs("<table id=\"log\"><thead>\n<tr><td><b>Date</b></td>"
1164               "<td><b>Commit message</b></td>"
1165               "<td><b>Author</b></td><td class=\"num\" align=\"right\"><b>Files</b></td>"
1166               "<td class=\"num\" align=\"right\"><b>+</b></td>"
1167               "<td class=\"num\" align=\"right\"><b>-</b></td></tr>\n</thead><tbody>\n", fp);
1168
1169         if (cachefile && head) {
1170                 /* read from cache file (does not need to exist) */
1171                 if ((rcachefp = fopen(cachefile, "r"))) {
1172                         if (!fgets(lastoidstr, sizeof(lastoidstr), rcachefp))
1173                                 errx(1, "%s: no object id", cachefile);
1174                         if (git_oid_fromstr(&lastoid, lastoidstr))
1175                                 errx(1, "%s: invalid object id", cachefile);
1176                 }
1177
1178                 /* write log to (temporary) cache */
1179                 if ((fd = mkstemp(tmppath)) == -1)
1180                         err(1, "mkstemp");
1181                 if (!(wcachefp = fdopen(fd, "w")))
1182                         err(1, "fdopen: '%s'", tmppath);
1183                 /* write last commit id (HEAD) */
1184                 git_oid_tostr(buf, sizeof(buf), head);
1185                 fprintf(wcachefp, "%s\n", buf);
1186
1187                 writelog(fp, head);
1188
1189                 if (rcachefp) {
1190                         /* append previous log to log.html and the new cache */
1191                         while (!feof(rcachefp)) {
1192                                 n = fread(buf, 1, sizeof(buf), rcachefp);
1193                                 if (ferror(rcachefp))
1194                                         err(1, "fread");
1195                                 if (fwrite(buf, 1, n, fp) != n ||
1196                                     fwrite(buf, 1, n, wcachefp) != n)
1197                                         err(1, "fwrite");
1198                         }
1199                         fclose(rcachefp);
1200                 }
1201                 fclose(wcachefp);
1202         } else {
1203                 if (head)
1204                         writelog(fp, head);
1205         }
1206
1207         fputs("</tbody></table>", fp);
1208         writefooter(fp);
1209         fclose(fp);
1210
1211         /* files for HEAD */
1212         fp = efopen("files.html", "w");
1213         writeheader(fp, "Files");
1214         if (head)
1215                 writefiles(fp, head);
1216         writefooter(fp);
1217         fclose(fp);
1218
1219         /* summary page with branches and tags */
1220         fp = efopen("refs.html", "w");
1221         writeheader(fp, "Refs");
1222         writerefs(fp);
1223         writefooter(fp);
1224         fclose(fp);
1225
1226         /* Atom feed */
1227         fp = efopen("atom.xml", "w");
1228         writeatom(fp);
1229         fclose(fp);
1230
1231         /* rename new cache file on success */
1232         if (cachefile && head) {
1233                 if (rename(tmppath, cachefile))
1234                         err(1, "rename: '%s' to '%s'", tmppath, cachefile);
1235                 umask((mask = umask(0)));
1236                 if (chmod(cachefile,
1237                     (S_IRUSR|S_IWUSR|S_IRGRP|S_IWGRP|S_IROTH|S_IWOTH) & ~mask))
1238                         err(1, "chmod: '%s'", cachefile);
1239         }
1240
1241         /* cleanup */
1242         git_repository_free(repo);
1243         git_libgit2_shutdown();
1244
1245         return 0;
1246 }