The ownership of files created by git-archive is always
root:root. Add --owner and --group options which work
like the GNU tar equivalent to allow overriding these
defaults.

Signed-off-by: suzuki toshiya <mpsuz...@hiroshima-u.ac.jp>
---
 Documentation/git-archive.txt |  13 +++
 archive-tar.c                 |   8 +-
 archive.c                     | 224 ++++++++++++++++++++++++++++++++++++++++++
 archive.h                     |   4 +
 t/t5005-archive-uid-gid.sh    | 140 ++++++++++++++++++++++++++
 t/t5005/parse-tar-file.py     |  60 +++++++++++
 tar.h                         |   2 +
 7 files changed, 447 insertions(+), 4 deletions(-)
 create mode 100755 t/t5005-archive-uid-gid.sh
 create mode 100755 t/t5005/parse-tar-file.py

diff --git a/Documentation/git-archive.txt b/Documentation/git-archive.txt
index cfa1e4ebe..0d156f6c1 100644
--- a/Documentation/git-archive.txt
+++ b/Documentation/git-archive.txt
@@ -11,6 +11,7 @@ SYNOPSIS
 [verse]
 'git archive' [--format=<fmt>] [--list] [--prefix=<prefix>/] [<extra>]
              [-o <file> | --output=<file>] [--worktree-attributes]
+             [--owner [username[:uid]] [--group [groupname[:gid]]
              [--remote=<repo> [--exec=<git-upload-archive>]] <tree-ish>
              [<path>...]
 
@@ -63,6 +64,18 @@ OPTIONS
        This can be any options that the archiver backend understands.
        See next section.
 
+--owner=<name>[:<uid>]::
+       Force <name> as owner and <uid> as uid for the files in the tar
+       archive.  If <uid> is not supplied, <name> can be either a user
+       name or numeric UID.  In this case the missing part (UID or
+       name) will be inferred from the current host's user database.
+
+--group=<name>[:<gid>]::
+       Force <name> as group and <gid> as gid for the files in the tar
+       archive.  If <gid> is not supplied, <name> can be either a group
+       name or numeric GID.  In this case the missing part (GID or
+       name) will be inferred from the current host's group database.
+
 --remote=<repo>::
        Instead of making a tar archive from the local repository,
        retrieve a tar archive from a remote repository. Note that the
diff --git a/archive-tar.c b/archive-tar.c
index c6ed96ee7..ca6471870 100644
--- a/archive-tar.c
+++ b/archive-tar.c
@@ -204,10 +204,10 @@ static void prepare_header(struct archiver_args *args,
        xsnprintf(header->size, sizeof(header->size), "%011lo", S_ISREG(mode) ? 
size : 0);
        xsnprintf(header->mtime, sizeof(header->mtime), "%011lo", (unsigned 
long) args->time);
 
-       xsnprintf(header->uid, sizeof(header->uid), "%07o", 0);
-       xsnprintf(header->gid, sizeof(header->gid), "%07o", 0);
-       strlcpy(header->uname, "root", sizeof(header->uname));
-       strlcpy(header->gname, "root", sizeof(header->gname));
+       xsnprintf(header->uid, sizeof(header->uid), "%07lo", args->uid);
+       xsnprintf(header->gid, sizeof(header->gid), "%07lo", args->gid);
+       strlcpy(header->uname, args->uname, sizeof(header->uname));
+       strlcpy(header->gname, args->gname, sizeof(header->gname));
        xsnprintf(header->devmajor, sizeof(header->devmajor), "%07o", 0);
        xsnprintf(header->devminor, sizeof(header->devminor), "%07o", 0);
 
diff --git a/archive.c b/archive.c
index 0b7b62af0..aa4b16b75 100644
--- a/archive.c
+++ b/archive.c
@@ -8,6 +8,7 @@
 #include "parse-options.h"
 #include "unpack-trees.h"
 #include "dir.h"
+#include "tar.h"
 
 static char const * const archive_usage[] = {
        N_("git archive [<options>] <tree-ish> [<path>...]"),
@@ -417,6 +418,223 @@ static void parse_treeish_arg(const char **argv,
        { OPTION_SET_INT, (s), NULL, (v), NULL, "", \
          PARSE_OPT_NOARG | PARSE_OPT_NONEG | PARSE_OPT_HIDDEN, NULL, (p) }
 
+/*
+ * GNU tar --owner, --group options reject hexdigit, signed int values.
+ * strtol(), atoi() are too permissive to simulate the behaviour.
+ */
+#define STR_IS_DIGIT_OK 0
+#define STR_IS_NOT_DIGIT -1
+#define STR_IS_DIGIT_TOO_LARGE -2
+
+static int try_as_simple_digit(const char *s, unsigned long *dst)
+{
+       unsigned long ul;
+       char *endptr;
+
+       if (strlen(s) != strspn(s, "0123456789"))
+               return STR_IS_NOT_DIGIT;
+
+       errno = 0;
+       ul = strtoul(s, &endptr, 10);
+
+       /* catch ERANGE */
+       if (errno) {
+               errno = 0;
+               return STR_IS_DIGIT_TOO_LARGE;
+       }
+
+#if ULONG_MAX > 0xFFFFFFFFUL
+       /*
+        * --owner, --group rejects uid/gid greater than 32-bit
+        * limits, even on 64-bit platforms.
+        */
+       if (ul > 0xFFFFFFFFUL)
+               return STR_IS_DIGIT_TOO_LARGE;
+#endif
+
+       if (dst)
+               *dst = ul;
+       return STR_IS_DIGIT_OK;
+}
+
+static const char *skip_leading_colon(const char *s)
+{
+       const char *col_pos;
+
+       col_pos = strchr(s, ':');
+       if (!col_pos)
+               return s;
+
+       return (col_pos + 1);
+}
+
+#define STR_IS_NAME_COLON_DIGIT 0
+#define STR_HAS_NO_COLON -1
+#define STR_HAS_DIGIT_BROKEN -2
+#define STR_HAS_DIGIT_TOO_LARGE -3
+
+static int try_as_name_colon_digit(const char *s, const char **dst_s,
+               unsigned long *dst_ul)
+{
+       int r;
+       const char *s2;
+
+       s2 = skip_leading_colon(s);
+       if (s2 == s)
+               return STR_HAS_NO_COLON;
+
+       r = try_as_simple_digit(s2, dst_ul);
+       switch (r) {
+       case STR_IS_DIGIT_OK:
+               *dst_s = xstrndup(s, s2 - s - 1);
+               return STR_IS_NAME_COLON_DIGIT;
+       case STR_IS_DIGIT_TOO_LARGE:
+               return STR_HAS_DIGIT_TOO_LARGE;
+       default:
+               return STR_HAS_DIGIT_BROKEN;
+       }
+}
+
+#define NAME_ID_BOTH_GIVEN 0
+#define NAME_ID_ID_GUESSED 1
+#define NAME_ID_ID_UNTOUCHED 2
+#define NAME_ID_NAME_GUESSED 3
+#define NAME_ID_NAME_EMPTY 4
+#define NAME_ID_ERR_ID_TOO_LARGE -126
+#define NAME_ID_ERR_SYNTAX -127
+#define NAME_ID_ERR_PARAMS -128
+
+static int set_args_uname_uid(struct archiver_args *args,
+               const char *tar_owner)
+{
+       int r;
+       struct passwd *pw = NULL;
+
+       if (!args || !tar_owner)
+               return NAME_ID_ERR_PARAMS;
+
+       r = try_as_name_colon_digit(tar_owner, &(args->uname),
+                                   &(args->uid));
+       switch (r) {
+       case STR_IS_NAME_COLON_DIGIT:
+               return NAME_ID_BOTH_GIVEN;
+       case STR_HAS_DIGIT_TOO_LARGE:
+               return NAME_ID_ERR_ID_TOO_LARGE;
+       case STR_HAS_DIGIT_BROKEN:
+               return NAME_ID_ERR_SYNTAX;
+       }
+
+       /* the operand is known to be single token */
+
+       r = try_as_simple_digit(tar_owner, &(args->uid));
+       switch (r) {
+       case STR_IS_DIGIT_TOO_LARGE:
+               return NAME_ID_ERR_ID_TOO_LARGE;
+       case STR_IS_DIGIT_OK:
+               pw = getpwuid(args->uid);
+               if (!pw) {
+                       args->uname = xstrdup("");
+                       return NAME_ID_NAME_EMPTY;
+               }
+               args->uname = xstrdup(pw->pw_name);
+               return NAME_ID_NAME_GUESSED;
+       }
+
+       /* the operand is known to be non-digit */
+
+       args->uname = xstrdup(tar_owner);
+       pw = getpwnam(tar_owner);
+       if (!pw)
+               return NAME_ID_ID_UNTOUCHED;
+       args->uid = pw->pw_uid;
+       return NAME_ID_ID_GUESSED;
+}
+
+static int set_args_gname_gid(struct archiver_args *args,
+               const char *tar_group)
+{
+       int r;
+       struct group *gr = NULL;
+
+       if (!args || !tar_group)
+               return NAME_ID_ERR_PARAMS;
+
+       r = try_as_name_colon_digit(tar_group, &(args->gname),
+                                   &(args->gid));
+       switch (r) {
+       case STR_IS_NAME_COLON_DIGIT:
+               return NAME_ID_BOTH_GIVEN;
+       case STR_HAS_DIGIT_TOO_LARGE:
+               return NAME_ID_ERR_ID_TOO_LARGE;
+       case STR_HAS_DIGIT_BROKEN:
+               return NAME_ID_ERR_SYNTAX;
+       }
+
+       /* the operand is known to be single token */
+
+       r = try_as_simple_digit(tar_group, &(args->gid));
+       switch (r) {
+       case STR_IS_DIGIT_TOO_LARGE:
+               return NAME_ID_ERR_ID_TOO_LARGE;
+       case STR_IS_DIGIT_OK:
+               gr = getgrgid(args->gid);
+               if (!gr) {
+                       args->gname = xstrdup("");
+                       return NAME_ID_NAME_EMPTY;
+               }
+               args->gname = xstrdup(gr->gr_name);
+               return NAME_ID_NAME_GUESSED;
+       }
+
+       /* the operand is known to be non-digit */
+
+       args->gname = xstrdup(tar_group);
+       gr = getgrnam(tar_group);
+       if (!gr)
+               return NAME_ID_ID_UNTOUCHED;
+       args->gid = gr->gr_gid;
+       return NAME_ID_ID_GUESSED;
+}
+
+static void set_args_tar_owner_group(struct archiver_args *args,
+               const char *tar_owner, const char *tar_group)
+{
+       int r;
+
+       /* initialize by default values */
+       args->uname = xstrdup("root");
+       args->gname = xstrdup("root");
+       args->uid = 0;
+       args->gid = 0;
+
+       /*
+        * GNU tar --format=ustar checks if uid is in 0..209751.
+        * Too long digit string could not be dealt as numeric,
+        * it is rejected as a syntax error before range check.
+        */
+       r = set_args_uname_uid(args, tar_owner);
+       switch (r) {
+       case NAME_ID_ERR_ID_TOO_LARGE:
+       case NAME_ID_ERR_SYNTAX:
+               die("'%s': Invalid owner ID",
+                   skip_leading_colon(tar_owner));
+       }
+       if (args->uid > MAX_ID_IN_TAR_US)
+               die("value %ld out of uid_t range 0..%ld", args->uid,
+                    MAX_ID_IN_TAR_US);
+
+       r = set_args_gname_gid(args, tar_group);
+       switch (r) {
+       case NAME_ID_ERR_ID_TOO_LARGE:
+       case NAME_ID_ERR_SYNTAX:
+               die("'%s': Invalid group ID",
+                   skip_leading_colon(tar_group));
+       }
+       if (args->gid > MAX_ID_IN_TAR_US)
+               die("value %ld out of gid_t range 0..%ld", args->gid,
+                   MAX_ID_IN_TAR_US);
+}
+
 static int parse_archive_args(int argc, const char **argv,
                const struct archiver **ar, struct archiver_args *args,
                const char *name_hint, int is_remote)
@@ -431,6 +649,8 @@ static int parse_archive_args(int argc, const char **argv,
        int i;
        int list = 0;
        int worktree_attributes = 0;
+       const char *tar_owner = NULL;
+       const char *tar_group = NULL;
        struct option opts[] = {
                OPT_GROUP(""),
                OPT_STRING(0, "format", &format, N_("fmt"), N_("archive 
format")),
@@ -459,6 +679,8 @@ static int parse_archive_args(int argc, const char **argv,
                        N_("retrieve the archive from remote repository 
<repo>")),
                OPT_STRING(0, "exec", &exec, N_("command"),
                        N_("path to the remote git-upload-archive command")),
+               OPT_STRING(0, "owner", &tar_owner, N_("owner"), 
N_("<name[:uid]> in tar")),
+               OPT_STRING(0, "group", &tar_group, N_("group"), 
N_("<name[:gid]> in tar")),
                OPT_END()
        };
 
@@ -507,6 +729,8 @@ static int parse_archive_args(int argc, const char **argv,
        args->baselen = strlen(base);
        args->worktree_attributes = worktree_attributes;
 
+       set_args_tar_owner_group(args, tar_owner, tar_group);
+
        return argc;
 }
 
diff --git a/archive.h b/archive.h
index 62d1d82c1..b2cfb1e4e 100644
--- a/archive.h
+++ b/archive.h
@@ -15,6 +15,10 @@ struct archiver_args {
        unsigned int worktree_attributes : 1;
        unsigned int convert : 1;
        int compression_level;
+       unsigned long uid;
+       unsigned long gid;
+       const char *uname;
+       const char *gname;
 };
 
 #define ARCHIVER_WANT_COMPRESSION_LEVELS 1
diff --git a/t/t5005-archive-uid-gid.sh b/t/t5005-archive-uid-gid.sh
new file mode 100755
index 000000000..c5e08d890
--- /dev/null
+++ b/t/t5005-archive-uid-gid.sh
@@ -0,0 +1,140 @@
+#!/bin/sh
+
+test_description='test --owner --group options for git-archive'
+. ./test-lib.sh
+
+test_expect_success 'create commit with a few empty files' '
+       git init . 1>/dev/null 2>/dev/null &&
+       touch uid-gid-test.001 &&
+       mkdir uid-gid-test.002 &&
+       mkdir uid-gid-test.002/uid-gid-test.003 &&
+       git add uid-gid-test.001 &&
+       git add uid-gid-test.002 &&
+       git add uid-gid-test.002/uid-gid-test.003 &&
+       git commit -m "uid-gid-test" 2>/dev/null 1>/dev/null
+'
+
+check_uid_gid_uname_gname_in_tar() {
+       # $1 tar pathname
+       # $2 uid (digit in string)
+       # $3 gid (digit in string)
+       # $4 uname (string)
+       # $5 gname (string)
+       uid=`python "$TEST_DIRECTORY"/t5005/parse-tar-file.py --print=uid 
--fail-if-multi $1`
+       if test $? != 0 -o x"${uid}" != "x"$2
+       then
+               echo "(some) uid differs from the specified value"
+               return $?
+       fi
+
+       gid=`python "$TEST_DIRECTORY"/t5005/parse-tar-file.py --print=gid 
--fail-if-multi $1`
+       if test $? != 0 -o x"${gid}" != "x"$3
+       then
+               echo "(some) gid differs from the specified value"
+               return $?
+       fi
+
+       uname=`python "$TEST_DIRECTORY"/t5005/parse-tar-file.py --print=uname 
--fail-if-multi $1`
+       if test $? != 0 -o x"${uname}" != "x"$4
+       then
+               echo "(some) uname differs from the specified value"
+               return $?
+       fi
+
+       gname=`python "$TEST_DIRECTORY"/t5005/parse-tar-file.py --print=gname 
--fail-if-multi $1`
+       if test $? != 0 -o x"${gname}" != "x"$5
+       then
+               echo "(some) gname differs from the specified value"
+               return $?
+       fi
+
+       return 0
+}
+
+test_expect_success 'test a case with explicitly specified name/id, 
owner=nobody:1234 group=nogroup:5678' '
+       git archive --format=tar --owner nobody:1234 --group nogroup:5678 HEAD 
> uid-gid-test1.tar &&
+       check_uid_gid_uname_gname_in_tar uid-gid-test1.tar 1234 5678 nobody 
nogroup &&
+       return $?
+'
+
+test_expect_success 'test a case with only string is given, owner=(current my 
name) group=(current my group)' '
+       my_uid=`id -u` &&
+       my_gid=`id -g` &&
+       my_uname=`id -u -n` &&
+       my_gname=`id -g -n` &&
+       git archive --format=tar --owner ${my_uname} --group ${my_gname} HEAD > 
uid-gid-test2.tar &&
+       check_uid_gid_uname_gname_in_tar uid-gid-test2.tar ${my_uid} ${my_gid} 
${my_uname} ${my_gname} &&
+       return $?
+'
+
+test_expect_success 'test a case with only number is given, owner=(current my 
uid) group=(current my gid)' '
+       my_uid=`id -u` &&
+       my_gid=`id -g` &&
+       my_uname=`id -u -n` &&
+       my_gname=`id -g -n` &&
+       git archive --format=tar --owner ${my_uid} --group ${my_gid} HEAD > 
uid-gid-test3.tar &&
+       check_uid_gid_uname_gname_in_tar uid-gid-test3.tar ${my_uid} ${my_gid} 
${my_uname} ${my_gname} &&
+       return $?
+'
+
+test_expect_success 'test a case with only uid is given, owner=(current my 
uid)' '
+       my_uid=`id -u` &&
+       my_gid=`id -g` &&
+       my_uname=`id -u -n` &&
+       my_gname=`id -g -n` &&
+       git archive --format=tar --owner ${my_uid} HEAD > uid-gid-test4.tar &&
+       check_uid_gid_uname_gname_in_tar uid-gid-test4.tar ${my_uid} ${my_gid} 
${my_uname} ${my_gname} &&
+       return $?
+'
+
+test_expect_success 'test a case with no owner/group are given' '
+       git archive --format=tar HEAD > uid-gid-test5.tar &&
+       check_uid_gid_uname_gname_in_tar uid-gid-test5.tar 0 0 root root &&
+       return $?
+'
+
+test_expect_success 'test a case with max uid for ustar' '
+       git archive --format=tar --owner nobody:209751 --group nogroup:1234 
HEAD > uid-gid-test6.tar &&
+       check_uid_gid_uname_gname_in_tar uid-gid-test6.tar 209751 1234 nobody 
nogroup &&
+       return $?
+'
+
+test_expect_success 'test a case with max gid for ustar' '
+       git archive --format=tar --group nogroup:209751 --owner nobody:1234 
HEAD > uid-gid-test7.tar &&
+       check_uid_gid_uname_gname_in_tar uid-gid-test7.tar 1234 209751 nobody 
nogroup &&
+       return $?
+'
+
+test_expect_success 'test a case with uid greater than 32-bit (must fail)' '
+       test_must_fail git archive --format=tar --owner 4294967296 --group 1234 
HEAD >/dev/null
+'
+
+test_expect_success 'test a case with gid greater than 32-bit (must fail)' '
+       test_must_fail git archive --format=tar --group 4294967296 --owner 1234 
HEAD >/dev/null
+'
+
+test_expect_success 'test a case with uid greater than ustar limit (must 
fail)' '
+       test_must_fail git archive --format=tar --owner 2097152 --group 1234 
HEAD >/dev/null
+'
+
+test_expect_success 'test a case with gid greater than ustar limit (must 
fail)' '
+       test_must_fail git archive --format=tar --group 2097152 --owner 1234 
HEAD >/dev/null
+'
+
+test_expect_success 'test a case with valid username plus uid greater than 
32-bit (must fail)' '
+       test_must_fail git archive --format=tar --owner nobody:4294967296 HEAD 
>/dev/null
+'
+
+test_expect_success 'test a case with valid groupname plus gid greater than 
32-bit (must fail)' '
+       test_must_fail git archive --format=tar --group nogroup:4294967296 HEAD 
>/dev/null
+'
+
+test_expect_success 'test a case with valid username plus uid greater than 
ustar limit (must fail)' '
+       test_must_fail git archive --format=tar --owner nobody:2097152 HEAD 
>/dev/null
+'
+
+test_expect_success 'test a case with valid groupname plus gid greater than 
ustar limit (must fail)' '
+       test_must_fail git archive --format=tar --group nogroup:2097152 HEAD 
>/dev/null
+'
+
+test_done
diff --git a/t/t5005/parse-tar-file.py b/t/t5005/parse-tar-file.py
new file mode 100755
index 000000000..7d03b55d4
--- /dev/null
+++ b/t/t5005/parse-tar-file.py
@@ -0,0 +1,60 @@
+#!/usr/bin/env python
+
+import sys
+import getopt
+import tarfile
+
+optlist, args = getopt.getopt( sys.argv[1:], "", [
+                               "print=", "show=",
+                               "uniq",
+                               "fail-if-multi",
+                ] )
+
+infos_to_print = []
+uniq = False
+fail_if_multi = False
+
+for opt in optlist:
+    if opt[0] == "--print":
+        infos_to_print.append(opt[1])
+    elif opt[0] == "--show":
+        infos_to_print.append(opt[1])
+    elif opt[0] == "--uniq":
+        uniq = True
+    elif opt[0] == "--fail-if-multi":
+        uniq = True
+        fail_if_multi = True
+
+if len(infos_to_print) == 0:
+    infos_to_print = ["uid", "gid", "uname", "gname", "name"]
+
+if len(args) > 0:
+    tar = tarfile.open( path=args[0], mode="r|" )
+else:
+    tar = tarfile.open( mode="r|", fileobj=sys.stdin )
+
+out_lines = []
+for tarinfo in tar:
+    infos = []
+    for info_tag in infos_to_print:
+        if info_tag == "uid":
+            infos.append( str(tarinfo.uid) )
+        elif info_tag == "gid":
+            infos.append( str(tarinfo.gid) )
+        elif info_tag == "uname" or info_tag == "owner":
+            infos.append( tarinfo.uname )
+        elif info_tag == "gname" or info_tag == "group":
+            infos.append( tarinfo.gname )
+        elif info_tag == "name" or info_tag == "pathname":
+            infos.append( tarinfo.name )
+        out_lines.append( "\t".join(infos) )
+tar.close()
+
+if uniq:
+    out_lines = list(set(out_lines))
+    if fail_if_multi and (len(out_lines) > 1):
+        sys.stderr.write("*** not unique value, " + str(len(out_lines)) + " 
values found\n")
+        sys.exit(len(out_lines))
+
+for line in out_lines:
+    print line
diff --git a/tar.h b/tar.h
index 3467705e9..1e6b57470 100644
--- a/tar.h
+++ b/tar.h
@@ -5,6 +5,8 @@
 #define TYPEFLAG_GLOBAL_HEADER 'g'
 #define TYPEFLAG_EXT_HEADER    'x'
 
+#define MAX_ID_IN_TAR_US       0x1FFFFFUL
+
 struct ustar_header {
        char name[100];         /*   0 */
        char mode[8];           /* 100 */
-- 
2.11.0


Reply via email to