]> git.ipfire.org Git - thirdparty/git.git/commitdiff
diff --no-index: fix logic for paths ending in '/'
authorJacob Keller <jacob.e.keller@intel.com>
Wed, 24 Sep 2025 20:57:15 +0000 (13:57 -0700)
committerJunio C Hamano <gitster@pobox.com>
Thu, 25 Sep 2025 18:35:20 +0000 (11:35 -0700)
If one of the two provided paths for git diff --no-index ends in a '/',
a failure similar to the following occurs:

  $ git diff --no-index -- /tmp/ /tmp/ ':!'
  fatal: `pos + len' is too far after the end of the buffer

This occurs because of an incorrect calculation of the skip lengths in
diff_no_index(). The code wants to calculate the length of the string,
but add one in case the string doesn't end with a slash.

The method it uses is incorrect, as it always checks the trailing NUL
character of the string. This will never be a '/', so we always add one.
In the event that we *do* have a trailing slash, this will create an
off-by-one length error later when using the skip value.

The most straightforward fix would be to correct the skip1 and skip2
lengths by using ends_with().

However, Johannes made a good point that the existing logic is wasting a
lot of computation. We generate the match string by copying the path in
and then skipping almost all of it immediately with a potentially
expensive memmove() from the strbuf_remove() call. We also re-initialize
the match stringbuf each time we call read_directory_contents.

The read_directory_contents really wants a path that is rooted at the
start of the directory scan. We're currently building this by taking the
full path and stripping out the start portion. Instead, replace this
logic by building up the portion of the match as we go.

Start by initializing two strbuf in diff_no_index containing the empty
string. Pass these into queue_diff, which in turn passes the appropriate
left or right side into read_directory_contents.

As before, we build up the matches by appending elements to the match
path and then clearing them using strbuf_setlen.

In the recursive portion of the queue_diff algorithm, we build up new
match paths the same way that we build up new buffer paths, by appending
the elements and then clearing them with strbuf_setlen after each
iteration. This is cheaper as it avoids repeated allocations, and is a
bit simpler to track what is going on.

Add a couple of test cases that pass in paths already ending in '/', to
ensure the tests cover this regression.

Reported-by: Johannes Schindelin <Johannes.Schindelin@gmx.de>
Closes: https://lore.kernel.org/git/c75ec5f9-407a-6555-d4fb-bb629d54ec61@gmx.de/
Signed-off-by: Jacob Keller <jacob.e.keller@intel.com>
[jc: small leakfixes at the end of diff_no_index()]
Signed-off-by: Junio C Hamano <gitster@pobox.com>
diff-no-index.c
t/t4053-diff-no-index.sh

index 88ae4cee56ba41819cb7d6c332feb59b6e0fe5a8..f320424f05fe0f3c0a33f1fca937282f4621ee9c 100644 (file)
 
 static int read_directory_contents(const char *path, struct string_list *list,
                                   const struct pathspec *pathspec,
-                                  int skip)
+                                  struct strbuf *match)
 {
-       struct strbuf match = STRBUF_INIT;
-       int len;
+       int len = match->len;
        DIR *dir;
        struct dirent *e;
 
        if (!(dir = opendir(path)))
                return error("Could not open directory %s", path);
 
-       if (pathspec) {
-               strbuf_addstr(&match, path);
-               strbuf_complete(&match, '/');
-               strbuf_remove(&match, 0, skip);
-
-               len = match.len;
-       }
-
        while ((e = readdir_skip_dot_and_dotdot(dir))) {
                if (pathspec) {
                        int is_dir = 0;
 
-                       strbuf_setlen(&match, len);
-                       strbuf_addstr(&match, e->d_name);
+                       strbuf_setlen(match, len);
+                       strbuf_addstr(match, e->d_name);
                        if (NOT_CONSTANT(DTYPE(e)) != DT_UNKNOWN) {
                                is_dir = (DTYPE(e) == DT_DIR);
                        } else {
@@ -57,7 +48,7 @@ static int read_directory_contents(const char *path, struct string_list *list,
                        }
 
                        if (!match_leading_pathspec(NULL, pathspec,
-                                                   match.buf, match.len,
+                                                   match->buf, match->len,
                                                    0, NULL, is_dir))
                                continue;
                }
@@ -65,7 +56,7 @@ static int read_directory_contents(const char *path, struct string_list *list,
                string_list_insert(list, e->d_name);
        }
 
-       strbuf_release(&match);
+       strbuf_setlen(match, len);
        closedir(dir);
        return 0;
 }
@@ -169,7 +160,8 @@ static struct diff_filespec *noindex_filespec(const struct git_hash_algo *algop,
 
 static int queue_diff(struct diff_options *o, const struct git_hash_algo *algop,
                      const char *name1, const char *name2, int recursing,
-                     const struct pathspec *ps, int skip1, int skip2)
+                     const struct pathspec *ps,
+                     struct strbuf *ps_match1, struct strbuf *ps_match2)
 {
        int mode1 = 0, mode2 = 0;
        enum special special1 = SPECIAL_NONE, special2 = SPECIAL_NONE;
@@ -208,10 +200,12 @@ static int queue_diff(struct diff_options *o, const struct git_hash_algo *algop,
                struct string_list p2 = STRING_LIST_INIT_DUP;
                int i1, i2, ret = 0;
                size_t len1 = 0, len2 = 0;
+               size_t match1_len = ps_match1->len;
+               size_t match2_len = ps_match2->len;
 
-               if (name1 && read_directory_contents(name1, &p1, ps, skip1))
+               if (name1 && read_directory_contents(name1, &p1, ps, ps_match1))
                        return -1;
-               if (name2 && read_directory_contents(name2, &p2, ps, skip2)) {
+               if (name2 && read_directory_contents(name2, &p2, ps, ps_match2)) {
                        string_list_clear(&p1, 0);
                        return -1;
                }
@@ -235,6 +229,11 @@ static int queue_diff(struct diff_options *o, const struct git_hash_algo *algop,
                        strbuf_setlen(&buffer1, len1);
                        strbuf_setlen(&buffer2, len2);
 
+                       if (ps) {
+                               strbuf_setlen(ps_match1, match1_len);
+                               strbuf_setlen(ps_match2, match2_len);
+                       }
+
                        if (i1 == p1.nr)
                                comp = 1;
                        else if (i2 == p2.nr)
@@ -245,18 +244,28 @@ static int queue_diff(struct diff_options *o, const struct git_hash_algo *algop,
                        if (comp > 0)
                                n1 = NULL;
                        else {
-                               strbuf_addstr(&buffer1, p1.items[i1++].string);
+                               strbuf_addstr(&buffer1, p1.items[i1].string);
+                               if (ps) {
+                                       strbuf_addstr(ps_match1, p1.items[i1].string);
+                                       strbuf_complete(ps_match1, '/');
+                               }
                                n1 = buffer1.buf;
+                               i1++;
                        }
 
                        if (comp < 0)
                                n2 = NULL;
                        else {
-                               strbuf_addstr(&buffer2, p2.items[i2++].string);
+                               strbuf_addstr(&buffer2, p2.items[i2].string);
+                               if (ps) {
+                                       strbuf_addstr(ps_match2, p2.items[i2].string);
+                                       strbuf_complete(ps_match2, '/');
+                               }
                                n2 = buffer2.buf;
+                               i2++;
                        }
 
-                       ret = queue_diff(o, algop, n1, n2, 1, ps, skip1, skip2);
+                       ret = queue_diff(o, algop, n1, n2, 1, ps, ps_match1, ps_match2);
                }
                string_list_clear(&p1, 0);
                string_list_clear(&p2, 0);
@@ -346,7 +355,8 @@ int diff_no_index(struct rev_info *revs, const struct git_hash_algo *algop,
                  int implicit_no_index, int argc, const char **argv)
 {
        struct pathspec pathspec, *ps = NULL;
-       int i, no_index, skip1 = 0, skip2 = 0;
+       struct strbuf ps_match1 = STRBUF_INIT, ps_match2 = STRBUF_INIT;
+       int i, no_index;
        int ret = 1;
        const char *paths[2];
        char *to_free[ARRAY_SIZE(paths)] = { 0 };
@@ -387,11 +397,6 @@ int diff_no_index(struct rev_info *revs, const struct git_hash_algo *algop,
                               NULL, &argv[2]);
                if (pathspec.nr)
                        ps = &pathspec;
-
-               skip1 = strlen(paths[0]);
-               skip1 += paths[0][skip1] == '/' ? 0 : 1;
-               skip2 = strlen(paths[1]);
-               skip2 += paths[1][skip2] == '/' ? 0 : 1;
        } else if (argc > 2) {
                warning(_("Limiting comparison with pathspecs is only "
                          "supported if both paths are directories."));
@@ -415,7 +420,7 @@ int diff_no_index(struct rev_info *revs, const struct git_hash_algo *algop,
        revs->diffopt.flags.exit_with_status = 1;
 
        if (queue_diff(&revs->diffopt, algop, paths[0], paths[1], 0, ps,
-                      skip1, skip2))
+                      &ps_match1, &ps_match2))
                goto out;
        diff_set_mnemonic_prefix(&revs->diffopt, "1/", "2/");
        diffcore_std(&revs->diffopt);
@@ -431,6 +436,8 @@ out:
        for (i = 0; i < ARRAY_SIZE(to_free); i++)
                free(to_free[i]);
        strbuf_release(&replacement);
+       strbuf_release(&ps_match1);
+       strbuf_release(&ps_match2);
        if (ps)
                clear_pathspec(ps);
        return ret;
index 01db9243abfe4f38af2a988f9d753c14425fad3a..e0ea437685b0abd623e8050467a770c304ae962f 100755 (executable)
@@ -322,6 +322,22 @@ test_expect_success 'diff --no-index with pathspec' '
        test_cmp expect actual
 '
 
+test_expect_success 'diff --no-index first path ending in slash with pathspec' '
+       test_expect_code 1 git diff --name-status --no-index a/ b 1 >actual &&
+       cat >expect <<-EOF &&
+       D       a/1
+       EOF
+       test_cmp expect actual
+'
+
+test_expect_success 'diff --no-index second path ending in slash with pathspec' '
+       test_expect_code 1 git diff --name-status --no-index a b/ 1 >actual &&
+       cat >expect <<-EOF &&
+       D       a/1
+       EOF
+       test_cmp expect actual
+'
+
 test_expect_success 'diff --no-index with pathspec no matches' '
        test_expect_code 0 git diff --name-status --no-index a b missing
 '