cat-file: only split on whitespace when %(rest) is used

author Jeff King <peff@peff.net>
Fri, 2 Aug 2013 11:59:07 +0000 (04:59 -0700)

committer Junio C Hamano <gitster@pobox.com>
Mon, 5 Aug 2013 16:30:48 +0000 (09:30 -0700)
author: Jeff King <peff@peff.net>
Fri, 2 Aug 2013 11:59:07 +0000 (04:59 -0700)
committer: Junio C Hamano <gitster@pobox.com>
Mon, 5 Aug 2013 16:30:48 +0000 (09:30 -0700)
diff --git a/Documentation/git-cat-file.txt b/Documentation/git-cat-file.txt

index 10fbc6a373758437f23ef80245b3bd9e164add1f..21cffe2bcd0d5907efda9d525228e3f78a5cff65 100644 (file)
--- a/Documentation/git-cat-file.txt
+++ b/Documentation/git-cat-file.txt
@@ -86,10 +86,9 @@ BATCH OUTPUT
  ------------
  
  If `--batch` or `--batch-check` is given, `cat-file` will read objects
-from stdin, one per line, and print information about them.
-
-Each line is considered as a whole object name, and is parsed as if
-given to linkgit:git-rev-parse[1].
+from stdin, one per line, and print information about them. By default,
+the whole line is considered as an object, as if it were fed to
+linkgit:git-rev-parse[1].
  
  You can specify the information shown for each object by using a custom
  `<format>`. The `<format>` is copied literally to stdout for each
@@ -110,6 +109,13 @@ newline. The available atoms are:
         The size, in bytes, that the object takes up on disk. See the
         note about on-disk sizes in the `CAVEATS` section below.
  
+`rest`::
+       If this atom is used in the output string, input lines are split
+       at the first whitespace boundary. All characters before that
+       whitespace are considered to be the object name; characters
+       after that first run of whitespace (i.e., the "rest" of the
+       line) are output in place of the `%(rest)` atom.
+
  If no format is specified, the default format is `%(objectname)
  %(objecttype) %(objectsize)`.
  
diff --git a/builtin/cat-file.c b/builtin/cat-file.c

index 425346048bbba66874eb857985bed9937c44e1d6..41afaa534b02d8f8089973f3949ba507bd3cf94b 100644 (file)
--- a/builtin/cat-file.c
+++ b/builtin/cat-file.c
@@ -119,6 +119,7 @@ struct expand_data {
         enum object_type type;
         unsigned long size;
         unsigned long disk_size;
+       const char *rest;
  
         /*
          * If mark_query is true, we do not expand anything, but rather
@@ -126,6 +127,13 @@ struct expand_data {
          */
         int mark_query;
  
+       /*
+        * Whether to split the input on whitespace before feeding it to
+        * get_sha1; this is decided during the mark_query phase based on
+        * whether we have a %(rest) token in our format.
+        */
+       int split_on_whitespace;
+
         /*
          * After a mark_query run, this object_info is set up to be
          * passed to sha1_object_info_extended. It will point to the data
@@ -163,6 +171,11 @@ static void expand_atom(struct strbuf *sb, const char *atom, int len,
                         data->info.disk_sizep = &data->disk_size;
                 else
                         strbuf_addf(sb, "%lu", data->disk_size);
+       } else if (is_atom("rest", atom, len)) {
+               if (data->mark_query)
+                       data->split_on_whitespace = 1;
+               else if (data->rest)
+                       strbuf_addstr(sb, data->rest);
         } else
                 die("unknown format element: %.*s", len, atom);
  }
@@ -273,7 +286,23 @@ static int batch_objects(struct batch_options *opt)
         warn_on_object_refname_ambiguity = 0;
  
         while (strbuf_getline(&buf, stdin, '\n') != EOF) {
-               int error = batch_one_object(buf.buf, opt, &data);
+               int error;
+
+               if (data.split_on_whitespace) {
+                       /*
+                        * Split at first whitespace, tying off the beginning
+                        * of the string and saving the remainder (or NULL) in
+                        * data.rest.
+                        */
+                       char *p = strpbrk(buf.buf, " \t");
+                       if (p) {
+                               while (*p && strchr(" \t", *p))
+                                       *p++ = '\0';
+                       }
+                       data.rest = p;
+               }
+
+               error = batch_one_object(buf.buf, opt, &data);
                 if (error)
                         return error;
         }
diff --git a/t/t1006-cat-file.sh b/t/t1006-cat-file.sh

index 4e911fb43d8ea2c699b3a836547b618274db6e05..a420742494024e127d4e4233153c7054e077e471 100755 (executable)
--- a/t/t1006-cat-file.sh
+++ b/t/t1006-cat-file.sh
@@ -78,6 +78,13 @@ $content"
         echo $sha1 | git cat-file --batch-check="%(objecttype) %(objectname)" >actual &&
         test_cmp expect actual
      '
+
+    test_expect_success '--batch-check with %(rest)' '
+       echo "$type this is some extra content" >expect &&
+       echo "$sha1    this is some extra content" |
+               git cat-file --batch-check="%(objecttype) %(rest)" >actual &&
+       test_cmp expect actual
+    '
  }
  
  hello_content="Hello World"
@@ -91,6 +98,14 @@ test_expect_success "setup" '
  
  run_tests 'blob' $hello_sha1 $hello_size "$hello_content" "$hello_content"
  
+test_expect_success '--batch-check without %(rest) considers whole line' '
+       echo "$hello_sha1 blob $hello_size" >expect &&
+       git update-index --add --cacheinfo 100644 $hello_sha1 "white space" &&
+       test_when_finished "git update-index --remove \"white space\"" &&
+       echo ":white space" | git cat-file --batch-check >actual &&
+       test_cmp expect actual
+'
+
  tree_sha1=$(git write-tree)
  tree_size=33
  tree_pretty_content="100644 blob $hello_sha1   hello"
author	Jeff King <peff@peff.net>
author	Fri, 2 Aug 2013 11:59:07 +0000 (04:59 -0700)
committer	Junio C Hamano <gitster@pobox.com>
committer	Mon, 5 Aug 2013 16:30:48 +0000 (09:30 -0700)
Documentation/git-cat-file.txt		patch | blob | history
builtin/cat-file.c		patch | blob | history
t/t1006-cat-file.sh		patch | blob | history