tar-tree.c on commit tar-tree: finish honoring extractor's umask in git-tar-tree. (3ac0ebb)
   1/*
   2 * Copyright (c) 2005 Rene Scharfe
   3 */
   4#include <time.h>
   5#include "cache.h"
   6
   7#define RECORDSIZE      (512)
   8#define BLOCKSIZE       (RECORDSIZE * 20)
   9
  10#define TYPEFLAG_AUTO           '\0'
  11#define TYPEFLAG_REG            '0'
  12#define TYPEFLAG_LNK            '2'
  13#define TYPEFLAG_DIR            '5'
  14#define TYPEFLAG_GLOBAL_HEADER  'g'
  15#define TYPEFLAG_EXT_HEADER     'x'
  16
  17#define EXT_HEADER_PATH         1
  18#define EXT_HEADER_LINKPATH     2
  19
  20static const char tar_tree_usage[] = "git-tar-tree <key> [basedir]";
  21
  22static char block[BLOCKSIZE];
  23static unsigned long offset;
  24
  25static const char *basedir;
  26static time_t archive_time;
  27
  28struct path_prefix {
  29        struct path_prefix *prev;
  30        const char *name;
  31};
  32
  33/* tries hard to write, either succeeds or dies in the attempt */
  34static void reliable_write(void *buf, unsigned long size)
  35{
  36        while (size > 0) {
  37                long ret = xwrite(1, buf, size);
  38                if (ret < 0) {
  39                        if (errno == EPIPE)
  40                                exit(0);
  41                        die("git-tar-tree: %s", strerror(errno));
  42                } else if (!ret) {
  43                        die("git-tar-tree: disk full?");
  44                }
  45                size -= ret;
  46                buf += ret;
  47        }
  48}
  49
  50/* writes out the whole block, but only if it is full */
  51static void write_if_needed(void)
  52{
  53        if (offset == BLOCKSIZE) {
  54                reliable_write(block, BLOCKSIZE);
  55                offset = 0;
  56        }
  57}
  58
  59/* acquire the next record from the buffer; user must call write_if_needed() */
  60static char *get_record(void)
  61{
  62        char *p = block + offset;
  63        memset(p, 0, RECORDSIZE);
  64        offset += RECORDSIZE;
  65        return p;
  66}
  67
  68/*
  69 * The end of tar archives is marked by 1024 nul bytes and after that
  70 * follows the rest of the block (if any).
  71 */
  72static void write_trailer(void)
  73{
  74        get_record();
  75        write_if_needed();
  76        get_record();
  77        write_if_needed();
  78        while (offset) {
  79                get_record();
  80                write_if_needed();
  81        }
  82}
  83
  84/*
  85 * queues up writes, so that all our write(2) calls write exactly one
  86 * full block; pads writes to RECORDSIZE
  87 */
  88static void write_blocked(void *buf, unsigned long size)
  89{
  90        unsigned long tail;
  91
  92        if (offset) {
  93                unsigned long chunk = BLOCKSIZE - offset;
  94                if (size < chunk)
  95                        chunk = size;
  96                memcpy(block + offset, buf, chunk);
  97                size -= chunk;
  98                offset += chunk;
  99                buf += chunk;
 100                write_if_needed();
 101        }
 102        while (size >= BLOCKSIZE) {
 103                reliable_write(buf, BLOCKSIZE);
 104                size -= BLOCKSIZE;
 105                buf += BLOCKSIZE;
 106        }
 107        if (size) {
 108                memcpy(block + offset, buf, size);
 109                buf += size;
 110                offset += size;
 111        }
 112        tail = offset % RECORDSIZE;
 113        if (tail)  {
 114                memset(block + offset, 0, RECORDSIZE - tail);
 115                offset += RECORDSIZE - tail;
 116        }
 117        write_if_needed();
 118}
 119
 120static void append_string(char **p, const char *s)
 121{
 122        unsigned int len = strlen(s);
 123        memcpy(*p, s, len);
 124        *p += len;
 125}
 126
 127static void append_char(char **p, char c)
 128{
 129        **p = c;
 130        *p += 1;
 131}
 132
 133static void append_path_prefix(char **buffer, struct path_prefix *prefix)
 134{
 135        if (!prefix)
 136                return;
 137        append_path_prefix(buffer, prefix->prev);
 138        append_string(buffer, prefix->name);
 139        append_char(buffer, '/');
 140}
 141
 142static unsigned int path_prefix_len(struct path_prefix *prefix)
 143{
 144        if (!prefix)
 145                return 0;
 146        return path_prefix_len(prefix->prev) + strlen(prefix->name) + 1;
 147}
 148
 149static void append_path(char **p, int is_dir, const char *basepath,
 150                        struct path_prefix *prefix, const char *path)
 151{
 152        if (basepath) {
 153                append_string(p, basepath);
 154                append_char(p, '/');
 155        }
 156        append_path_prefix(p, prefix);
 157        append_string(p, path);
 158        if (is_dir)
 159                append_char(p, '/');
 160}
 161
 162static unsigned int path_len(int is_dir, const char *basepath,
 163                             struct path_prefix *prefix, const char *path)
 164{
 165        unsigned int len = 0;
 166        if (basepath)
 167                len += strlen(basepath) + 1;
 168        len += path_prefix_len(prefix) + strlen(path);
 169        if (is_dir)
 170                len++;
 171        return len;
 172}
 173
 174static void append_extended_header_prefix(char **p, unsigned int size,
 175                                          const char *keyword)
 176{
 177        int len = sprintf(*p, "%u %s=", size, keyword);
 178        *p += len;
 179}
 180
 181static unsigned int extended_header_len(const char *keyword,
 182                                        unsigned int valuelen)
 183{
 184        /* "%u %s=%s\n" */
 185        unsigned int len = 1 + 1 + strlen(keyword) + 1 + valuelen + 1;
 186        if (len > 9)
 187                len++;
 188        if (len > 99)
 189                len++;
 190        return len;
 191}
 192
 193static void append_extended_header(char **p, const char *keyword,
 194                                   const char *value, unsigned int len)
 195{
 196        unsigned int size = extended_header_len(keyword, len);
 197        append_extended_header_prefix(p, size, keyword);
 198        memcpy(*p, value, len);
 199        *p += len;
 200        append_char(p, '\n');
 201}
 202
 203static void write_header(const unsigned char *, char, const char *, struct path_prefix *,
 204                         const char *, unsigned int, void *, unsigned long);
 205
 206/* stores a pax extended header directly in the block buffer */
 207static void write_extended_header(const char *headerfilename, int is_dir,
 208                                  unsigned int flags, const char *basepath,
 209                                  struct path_prefix *prefix,
 210                                  const char *path, unsigned int namelen,
 211                                  void *content, unsigned int contentsize)
 212{
 213        char *buffer, *p;
 214        unsigned int pathlen, size, linkpathlen = 0;
 215
 216        size = pathlen = extended_header_len("path", namelen);
 217        if (flags & EXT_HEADER_LINKPATH) {
 218                linkpathlen = extended_header_len("linkpath", contentsize);
 219                size += linkpathlen;
 220        }
 221        write_header(NULL, TYPEFLAG_EXT_HEADER, NULL, NULL, headerfilename,
 222                     0100600, NULL, size);
 223
 224        buffer = p = malloc(size);
 225        if (!buffer)
 226                die("git-tar-tree: %s", strerror(errno));
 227        append_extended_header_prefix(&p, pathlen, "path");
 228        append_path(&p, is_dir, basepath, prefix, path);
 229        append_char(&p, '\n');
 230        if (flags & EXT_HEADER_LINKPATH)
 231                append_extended_header(&p, "linkpath", content, contentsize);
 232        write_blocked(buffer, size);
 233        free(buffer);
 234}
 235
 236static void write_global_extended_header(const unsigned char *sha1)
 237{
 238        char *p;
 239        unsigned int size;
 240
 241        size = extended_header_len("comment", 40);
 242        write_header(NULL, TYPEFLAG_GLOBAL_HEADER, NULL, NULL,
 243                     "pax_global_header", 0100600, NULL, size);
 244
 245        p = get_record();
 246        append_extended_header(&p, "comment", sha1_to_hex(sha1), 40);
 247        write_if_needed();
 248}
 249
 250/* stores a ustar header directly in the block buffer */
 251static void write_header(const unsigned char *sha1, char typeflag, const char *basepath,
 252                         struct path_prefix *prefix, const char *path,
 253                         unsigned int mode, void *buffer, unsigned long size)
 254{
 255        unsigned int namelen; 
 256        char *header = NULL;
 257        unsigned int checksum = 0;
 258        int i;
 259        unsigned int ext_header = 0;
 260
 261        if (typeflag == TYPEFLAG_AUTO) {
 262                if (S_ISDIR(mode))
 263                        typeflag = TYPEFLAG_DIR;
 264                else if (S_ISLNK(mode))
 265                        typeflag = TYPEFLAG_LNK;
 266                else
 267                        typeflag = TYPEFLAG_REG;
 268        }
 269
 270        namelen = path_len(S_ISDIR(mode), basepath, prefix, path);
 271        if (namelen > 100)
 272                ext_header |= EXT_HEADER_PATH;
 273        if (typeflag == TYPEFLAG_LNK && size > 100)
 274                ext_header |= EXT_HEADER_LINKPATH;
 275
 276        /* the extended header must be written before the normal one */
 277        if (ext_header) {
 278                char headerfilename[51];
 279                sprintf(headerfilename, "%s.paxheader", sha1_to_hex(sha1));
 280                write_extended_header(headerfilename, S_ISDIR(mode),
 281                                      ext_header, basepath, prefix, path,
 282                                      namelen, buffer, size);
 283        }
 284
 285        header = get_record();
 286
 287        if (ext_header) {
 288                sprintf(header, "%s.data", sha1_to_hex(sha1));
 289        } else {
 290                char *p = header;
 291                append_path(&p, S_ISDIR(mode), basepath, prefix, path);
 292        }
 293
 294        if (typeflag == TYPEFLAG_LNK) {
 295                if (ext_header & EXT_HEADER_LINKPATH) {
 296                        sprintf(&header[157], "see %s.paxheader",
 297                                sha1_to_hex(sha1));
 298                } else {
 299                        if (buffer)
 300                                strncpy(&header[157], buffer, size);
 301                }
 302        }
 303
 304        if (S_ISDIR(mode))
 305                mode |= 0755;   /* GIT doesn't store permissions of dirs */
 306        if (S_ISLNK(mode))
 307                mode |= 0777;   /* ... nor of symlinks */
 308        sprintf(&header[100], "%07o", mode & 07777);
 309
 310        /* XXX: should we provide more meaningful info here? */
 311        sprintf(&header[108], "%07o", 0);       /* uid */
 312        sprintf(&header[116], "%07o", 0);       /* gid */
 313        strncpy(&header[265], "git", 31);       /* uname */
 314        strncpy(&header[297], "git", 31);       /* gname */
 315
 316        if (S_ISDIR(mode) || S_ISLNK(mode))
 317                size = 0;
 318        sprintf(&header[124], "%011lo", size);
 319        sprintf(&header[136], "%011lo", archive_time);
 320
 321        header[156] = typeflag;
 322
 323        memcpy(&header[257], "ustar", 6);
 324        memcpy(&header[263], "00", 2);
 325
 326        sprintf(&header[329], "%07o", 0);       /* devmajor */
 327        sprintf(&header[337], "%07o", 0);       /* devminor */
 328
 329        memset(&header[148], ' ', 8);
 330        for (i = 0; i < RECORDSIZE; i++)
 331                checksum += header[i];
 332        sprintf(&header[148], "%07o", checksum & 0x1fffff);
 333
 334        write_if_needed();
 335}
 336
 337static void traverse_tree(void *buffer, unsigned long size,
 338                          struct path_prefix *prefix)
 339{
 340        struct path_prefix this_prefix;
 341        this_prefix.prev = prefix;
 342
 343        while (size) {
 344                int namelen = strlen(buffer)+1;
 345                void *eltbuf;
 346                char elttype[20];
 347                unsigned long eltsize;
 348                unsigned char *sha1 = buffer + namelen;
 349                char *path = strchr(buffer, ' ') + 1;
 350                unsigned int mode;
 351
 352                if (size < namelen + 20 || sscanf(buffer, "%o", &mode) != 1)
 353                        die("corrupt 'tree' file");
 354                if (S_ISDIR(mode) || S_ISREG(mode))
 355                        mode |= (mode & 0100) ? 0777 : 0666;
 356                buffer = sha1 + 20;
 357                size -= namelen + 20;
 358
 359                eltbuf = read_sha1_file(sha1, elttype, &eltsize);
 360                if (!eltbuf)
 361                        die("cannot read %s", sha1_to_hex(sha1));
 362                write_header(sha1, TYPEFLAG_AUTO, basedir, prefix, path,
 363                             mode, eltbuf, eltsize);
 364                if (!strcmp(elttype, "tree")) {
 365                        this_prefix.name = path;
 366                        traverse_tree(eltbuf, eltsize, &this_prefix);
 367                } else if (!strcmp(elttype, "blob") && !S_ISLNK(mode)) {
 368                        write_blocked(eltbuf, eltsize);
 369                }
 370                free(eltbuf);
 371        }
 372}
 373
 374/* get commit time from committer line of commit object */
 375static time_t commit_time(void * buffer, unsigned long size)
 376{
 377        time_t result = 0;
 378        char *p = buffer;
 379
 380        while (size > 0) {
 381                char *endp = memchr(p, '\n', size);
 382                if (!endp || endp == p)
 383                        break;
 384                *endp = '\0';
 385                if (endp - p > 10 && !memcmp(p, "committer ", 10)) {
 386                        char *nump = strrchr(p, '>');
 387                        if (!nump)
 388                                break;
 389                        nump++;
 390                        result = strtoul(nump, &endp, 10);
 391                        if (*endp != ' ')
 392                                result = 0;
 393                        break;
 394                }
 395                size -= endp - p - 1;
 396                p = endp + 1;
 397        }
 398        return result;
 399}
 400
 401int main(int argc, char **argv)
 402{
 403        unsigned char sha1[20];
 404        unsigned char commit_sha1[20];
 405        void *buffer;
 406        unsigned long size;
 407
 408        setup_git_directory();
 409
 410        switch (argc) {
 411        case 3:
 412                basedir = argv[2];
 413                /* FALLTHROUGH */
 414        case 2:
 415                if (get_sha1(argv[1], sha1) < 0)
 416                        usage(tar_tree_usage);
 417                break;
 418        default:
 419                usage(tar_tree_usage);
 420        }
 421
 422        buffer = read_object_with_reference(sha1, "commit", &size, commit_sha1);
 423        if (buffer) {
 424                write_global_extended_header(commit_sha1);
 425                archive_time = commit_time(buffer, size);
 426                free(buffer);
 427        }
 428        buffer = read_object_with_reference(sha1, "tree", &size, NULL);
 429        if (!buffer)
 430                die("not a reference to a tag, commit or tree object: %s",
 431                    sha1_to_hex(sha1));
 432        if (!archive_time)
 433                archive_time = time(NULL);
 434        if (basedir)
 435                write_header((unsigned char *)"0", TYPEFLAG_DIR, NULL, NULL,
 436                        basedir, 040777, NULL, 0);
 437        traverse_tree(buffer, size, NULL);
 438        free(buffer);
 439        write_trailer();
 440        return 0;
 441}