]> git.ipfire.org Git - thirdparty/git.git/commitdiff
refs: allow reference location in refstorage config
authorKarthik Nayak <karthik.188@gmail.com>
Wed, 25 Feb 2026 09:40:45 +0000 (10:40 +0100)
committerJunio C Hamano <gitster@pobox.com>
Wed, 25 Feb 2026 17:38:41 +0000 (09:38 -0800)
The 'extensions.refStorage' config is used to specify the reference
backend for a given repository. Both the 'files' and 'reftable' backends
utilize the $GIT_DIR as the reference folder by default in
`get_main_ref_store()`.

Since the reference backends are pluggable, this means that they could
work with out-of-tree reference directories too. Extend the 'refStorage'
config to also support taking an URI input, where users can specify the
reference backend and the location.

Add the required changes to obtain and propagate this value to the
individual backends. Add the necessary documentation and tests.

Traditionally, for linked worktrees, references were stored in the
'$GIT_DIR/worktrees/<wt_id>' path. But when using an alternate reference
storage path, it doesn't make sense to store the main worktree
references in the new path, and the linked worktree references in the
$GIT_DIR. So, let's store linked worktree references in
'$ALTERNATE_REFERENCE_DIR/worktrees/<wt_id>'. To do this, create the
necessary files and folders while also adding stubs in the $GIT_DIR path
to ensure that it is still considered a Git directory.

Ideally, we would want to pass in a `struct worktree *` to individual
backends, instead of passing the `gitdir`. This allows them to handle
worktree specific logic. Currently, that is not possible since the
worktree code is:

  - Tied to using the global `the_repository` variable.

  - Is not setup before the reference database during initialization of
    the repository.

Add a TODO in 'refs.c' to ensure we can eventually make that change.

Helped-by: Patrick Steinhardt <ps@pks.im>
Signed-off-by: Karthik Nayak <karthik.188@gmail.com>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
Documentation/config/extensions.adoc
builtin/worktree.c
refs.c
repository.c
repository.h
setup.c
setup.h
t/meson.build
t/t1423-ref-backend.sh [new file with mode: 0755]

index 532456644b770e7f9a8d15b5eaac9eef143a5315..329d02b3c4dd04251e14b345aafd73ff160420f6 100644 (file)
@@ -57,10 +57,24 @@ For historical reasons, this extension is respected regardless of the
 `core.repositoryFormatVersion` setting.
 
 refStorage:::
-       Specify the ref storage format to use. The acceptable values are:
+       Specify the ref storage format and a corresponding payload. The value
+       can be either a format name or a URI:
 +
 --
+* A format name alone (e.g., `reftable` or `files`).
+
+* A URI format `<format>://<payload>` explicitly specifies both the
+  format and payload (e.g., `reftable:///foo/bar`).
+
+Supported format names are:
+
 include::../ref-storage-format.adoc[]
+
+The payload is passed directly to the reference backend. For the files and
+reftable backends, this must be a filesystem path where the references will
+be stored. Defaulting to the commondir when no payload is provided. Relative
+paths are resolved relative to the `$GIT_DIR`. Future backends may support
+other payload schemes, e.g., postgres://127.0.0.1:5432?database=myrepo.
 --
 +
 Note that this setting should only be set by linkgit:git-init[1] or
index fbdaf2eb2eb85ce33e2001dfa5030fca9ddaeaf4..293e80837987b4ea756e4744dfd0414efb4ea53b 100644 (file)
@@ -425,6 +425,39 @@ static int make_worktree_orphan(const char * ref, const struct add_opts *opts,
        return run_command(&cp);
 }
 
+/*
+ * References for worktrees are generally stored in '$GIT_DIR/worktrees/<wt_id>'.
+ * But when using alternate reference directories, we want to store the worktree
+ * references in '$ALTERNATE_REFERENCE_DIR/worktrees/<wt_id>'.
+ *
+ * Create the necessary folder structure to facilitate the same. But to ensure
+ * that the former path is still considered a Git directory, add stubs.
+ */
+static void setup_alternate_ref_dir(struct worktree *wt, const char *wt_git_path)
+{
+       struct strbuf sb = STRBUF_INIT;
+       char *path;
+
+       path = wt->repo->ref_storage_payload;
+       if (!path)
+               return;
+
+       if (!is_absolute_path(path))
+               strbuf_addf(&sb, "%s/", wt->repo->commondir);
+
+       strbuf_addf(&sb, "%s/worktrees", path);
+       safe_create_dir(wt->repo, sb.buf, 1);
+       strbuf_addf(&sb, "/%s", wt->id);
+       safe_create_dir(wt->repo, sb.buf, 1);
+       strbuf_reset(&sb);
+
+       strbuf_addf(&sb, "this worktree stores references in %s/worktrees/%s",
+                   path, wt->id);
+       refs_create_refdir_stubs(wt->repo, wt_git_path, sb.buf);
+
+       strbuf_release(&sb);
+}
+
 static int add_worktree(const char *path, const char *refname,
                        const struct add_opts *opts)
 {
@@ -518,6 +551,7 @@ static int add_worktree(const char *path, const char *refname,
                ret = error(_("could not find created worktree '%s'"), name);
                goto done;
        }
+       setup_alternate_ref_dir(wt, sb_repo.buf);
        wt_refs = get_worktree_ref_store(wt);
 
        ret = ref_store_create_on_disk(wt_refs, REF_STORE_CREATE_ON_DISK_IS_WORKTREE, &sb);
diff --git a/refs.c b/refs.c
index ba2573eb7a339a953d918eb8b0d44c19c8592ff3..ef1902e85c707ded32aa195f0c1ac429c047bc26 100644 (file)
--- a/refs.c
+++ b/refs.c
@@ -2291,7 +2291,11 @@ static struct ref_store *ref_store_init(struct repository *repo,
        if (!be)
                BUG("reference backend is unknown");
 
-       refs = be->init(repo, NULL, gitdir, flags);
+       /*
+        * TODO Send in a 'struct worktree' instead of a 'gitdir', and
+        * allow the backend to handle how it wants to deal with worktrees.
+        */
+       refs = be->init(repo, repo->ref_storage_payload, gitdir, flags);
        return refs;
 }
 
index c7e75215ac2ab215c7bac325d2623373e6e2da0d..9815f081efa0aa5ce71573cf8147db3d178b9643 100644 (file)
@@ -193,9 +193,12 @@ void repo_set_compat_hash_algo(struct repository *repo, int algo)
 }
 
 void repo_set_ref_storage_format(struct repository *repo,
-                                enum ref_storage_format format)
+                                enum ref_storage_format format,
+                                const char *payload)
 {
        repo->ref_storage_format = format;
+       free(repo->ref_storage_payload);
+       repo->ref_storage_payload = xstrdup_or_null(payload);
 }
 
 /*
@@ -277,7 +280,8 @@ int repo_init(struct repository *repo,
 
        repo_set_hash_algo(repo, format.hash_algo);
        repo_set_compat_hash_algo(repo, format.compat_hash_algo);
-       repo_set_ref_storage_format(repo, format.ref_storage_format);
+       repo_set_ref_storage_format(repo, format.ref_storage_format,
+                                   format.ref_storage_payload);
        repo->repository_format_worktree_config = format.worktree_config;
        repo->repository_format_relative_worktrees = format.relative_worktrees;
        repo->repository_format_precious_objects = format.precious_objects;
@@ -369,6 +373,7 @@ void repo_clear(struct repository *repo)
        FREE_AND_NULL(repo->index_file);
        FREE_AND_NULL(repo->worktree);
        FREE_AND_NULL(repo->submodule_prefix);
+       FREE_AND_NULL(repo->ref_storage_payload);
 
        odb_free(repo->objects);
        repo->objects = NULL;
index 6063c4b846d031d657827f8b16d65af8c09e5b29..95e2333bad9463002e2d33af5ebfbdd5bd98eb48 100644 (file)
@@ -150,6 +150,11 @@ struct repository {
 
        /* Repository's reference storage format, as serialized on disk. */
        enum ref_storage_format ref_storage_format;
+       /*
+        * Reference storage information as needed for the backend. This contains
+        * only the payload from the reference URI without the schema.
+        */
+       char *ref_storage_payload;
 
        /* A unique-id for tracing purposes. */
        int trace2_repo_id;
@@ -204,7 +209,8 @@ void repo_set_worktree(struct repository *repo, const char *path);
 void repo_set_hash_algo(struct repository *repo, int algo);
 void repo_set_compat_hash_algo(struct repository *repo, int compat_algo);
 void repo_set_ref_storage_format(struct repository *repo,
-                                enum ref_storage_format format);
+                                enum ref_storage_format format,
+                                const char *payload);
 void initialize_repository(struct repository *repo);
 RESULT_MUST_BE_USED
 int repo_init(struct repository *r, const char *gitdir, const char *worktree);
diff --git a/setup.c b/setup.c
index 1fc9ae3872809cfa973514fb9dc40c4c107a6ea0..d407f3347b974e9ba1063941739acf121ce42478 100644 (file)
--- a/setup.c
+++ b/setup.c
@@ -632,6 +632,21 @@ static enum extension_result handle_extension_v0(const char *var,
                return EXTENSION_UNKNOWN;
 }
 
+static void parse_reference_uri(const char *value, char **format,
+                               char **payload)
+{
+       const char *schema_end;
+
+       schema_end = strstr(value, "://");
+       if (!schema_end) {
+               *format = xstrdup(value);
+               *payload = NULL;
+       } else {
+               *format = xstrndup(value, schema_end - value);
+               *payload = xstrdup_or_null(schema_end + 3);
+       }
+}
+
 /*
  * Record any new extensions in this function.
  */
@@ -674,10 +689,17 @@ static enum extension_result handle_extension(const char *var,
                return EXTENSION_OK;
        } else if (!strcmp(ext, "refstorage")) {
                unsigned int format;
+               char *format_str;
 
                if (!value)
                        return config_error_nonbool(var);
-               format = ref_storage_format_by_name(value);
+
+               parse_reference_uri(value, &format_str,
+                                   &data->ref_storage_payload);
+
+               format = ref_storage_format_by_name(format_str);
+               free(format_str);
+
                if (format == REF_STORAGE_FORMAT_UNKNOWN)
                        return error(_("invalid value for '%s': '%s'"),
                                     "extensions.refstorage", value);
@@ -850,6 +872,7 @@ void clear_repository_format(struct repository_format *format)
        string_list_clear(&format->v1_only_extensions, 0);
        free(format->work_tree);
        free(format->partial_clone);
+       free(format->ref_storage_payload);
        init_repository_format(format);
 }
 
@@ -1942,7 +1965,8 @@ const char *setup_git_directory_gently(int *nongit_ok)
                        repo_set_compat_hash_algo(the_repository,
                                                  repo_fmt.compat_hash_algo);
                        repo_set_ref_storage_format(the_repository,
-                                                   repo_fmt.ref_storage_format);
+                                                   repo_fmt.ref_storage_format,
+                                                   repo_fmt.ref_storage_payload);
                        the_repository->repository_format_worktree_config =
                                repo_fmt.worktree_config;
                        the_repository->repository_format_relative_worktrees =
@@ -2042,7 +2066,8 @@ void check_repository_format(struct repository_format *fmt)
        repo_set_hash_algo(the_repository, fmt->hash_algo);
        repo_set_compat_hash_algo(the_repository, fmt->compat_hash_algo);
        repo_set_ref_storage_format(the_repository,
-                                   fmt->ref_storage_format);
+                                   fmt->ref_storage_format,
+                                   fmt->ref_storage_payload);
        the_repository->repository_format_worktree_config =
                fmt->worktree_config;
        the_repository->repository_format_relative_worktrees =
@@ -2643,7 +2668,8 @@ static void repository_format_configure(struct repository_format *repo_fmt,
        } else {
                repo_fmt->ref_storage_format = REF_STORAGE_FORMAT_DEFAULT;
        }
-       repo_set_ref_storage_format(the_repository, repo_fmt->ref_storage_format);
+       repo_set_ref_storage_format(the_repository, repo_fmt->ref_storage_format,
+                                   repo_fmt->ref_storage_payload);
 }
 
 int init_db(const char *git_dir, const char *real_git_dir,
diff --git a/setup.h b/setup.h
index ddb9f6701c2df76d00f7d76a6fdff4c9e48670ce..093af39e844def049e11263971218ad2cd59b2d8 100644 (file)
--- a/setup.h
+++ b/setup.h
@@ -171,6 +171,7 @@ struct repository_format {
        int hash_algo;
        int compat_hash_algo;
        enum ref_storage_format ref_storage_format;
+       char *ref_storage_payload;
        int sparse_index;
        char *work_tree;
        struct string_list unknown_extensions;
index 459c52a48972e441e9325616940f5bca13b9ec83..11fc5a49ee2228b8950079ae649414a108efeef5 100644 (file)
@@ -210,6 +210,7 @@ integration_tests = [
   't1420-lost-found.sh',
   't1421-reflog-write.sh',
   't1422-show-ref-exists.sh',
+  't1423-ref-backend.sh',
   't1430-bad-ref-name.sh',
   't1450-fsck.sh',
   't1451-fsck-buffer.sh',
diff --git a/t/t1423-ref-backend.sh b/t/t1423-ref-backend.sh
new file mode 100755 (executable)
index 0000000..82cccb7
--- /dev/null
@@ -0,0 +1,159 @@
+#!/bin/sh
+
+test_description='Test reference backend URIs'
+
+. ./test-lib.sh
+
+# Run a git command with the provided reference storage. Reset the backend
+# post running the command.
+# Usage: run_with_uri <repo> <backend> <uri> <cmd>
+#   <repo> is the relative path to the repo to run the command in.
+#   <backend> is the original ref storage of the repo.
+#   <uri> is the new URI to be set for the ref storage.
+#   <cmd> is the git subcommand to be run in the repository.
+run_with_uri () {
+       repo=$1 &&
+       backend=$2 &&
+       uri=$3 &&
+       cmd=$4 &&
+
+       git -C "$repo" config set core.repositoryformatversion 1
+       git -C "$repo" config set extensions.refStorage "$uri" &&
+       git -C "$repo" $cmd &&
+       git -C "$repo" config set extensions.refStorage "$backend"
+}
+
+# Test a repository with a given reference storage by running and comparing
+# 'git refs list' before and after setting the new reference backend. If
+# err_msg is set, expect the command to fail and grep for the provided err_msg.
+# Usage: run_with_uri <repo> <backend> <uri> <cmd>
+#   <repo> is the relative path to the repo to run the command in.
+#   <backend> is the original ref storage of the repo.
+#   <uri> is the new URI to be set for the ref storage.
+#   <err_msg> (optional) if set, check if 'git-refs(1)' failed with the provided msg.
+test_refs_backend () {
+       repo=$1 &&
+       backend=$2 &&
+       uri=$3 &&
+       err_msg=$4 &&
+
+       git -C "$repo" config set core.repositoryformatversion 1 &&
+       if test -n "$err_msg";
+       then
+               git -C "$repo" config set extensions.refStorage "$uri" &&
+               test_must_fail git -C "$repo" refs list 2>err &&
+               test_grep "$err_msg" err
+       else
+               git -C "$repo" refs list >expect &&
+               run_with_uri "$repo" "$backend" "$uri" "refs list" >actual &&
+               test_cmp expect actual
+       fi
+}
+
+test_expect_success 'URI is invalid' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       test_refs_backend repo files "reftable@/home/reftable" \
+               "invalid value for ${SQ}extensions.refstorage${SQ}"
+'
+
+test_expect_success 'URI ends with colon' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       test_refs_backend repo files "reftable:" \
+               "invalid value for ${SQ}extensions.refstorage${SQ}"
+'
+
+test_expect_success 'unknown reference backend' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       test_refs_backend repo files "db://.git" \
+               "invalid value for ${SQ}extensions.refstorage${SQ}"
+'
+
+ref_formats="files reftable"
+for from_format in $ref_formats
+do
+
+for to_format in $ref_formats
+do
+       if test "$from_format" = "$to_format"
+       then
+               continue
+       fi
+
+
+       for dir in "$(pwd)/repo/.git" "."
+       do
+
+               test_expect_success "read from $to_format backend, $dir dir" '
+                       test_when_finished "rm -rf repo" &&
+                       git init --ref-format=$from_format repo &&
+                       (
+                               cd repo &&
+                               test_commit 1 &&
+                               test_commit 2 &&
+                               test_commit 3 &&
+
+                               git refs migrate --dry-run --ref-format=$to_format >out &&
+                               BACKEND_PATH="$dir/$(sed "s/.* ${SQ}.git\/\(.*\)${SQ}/\1/" out)" &&
+                               test_refs_backend . $from_format "$to_format://$BACKEND_PATH" "$method"
+                       )
+               '
+
+               test_expect_success "write to $to_format backend, $dir dir" '
+                       test_when_finished "rm -rf repo" &&
+                       git init --ref-format=$from_format repo &&
+                       (
+                               cd repo &&
+                               test_commit 1 &&
+                               test_commit 2 &&
+                               test_commit 3 &&
+
+                               git refs migrate --dry-run --ref-format=$to_format >out &&
+                               BACKEND_PATH="$dir/$(sed "s/.* ${SQ}.git\/\(.*\)${SQ}/\1/" out)" &&
+
+                               test_refs_backend . $from_format "$to_format://$BACKEND_PATH" &&
+
+                               git refs list >expect &&
+                               run_with_uri . "$from_format" "$to_format://$BACKEND_PATH" "tag -d 1" &&
+                               git refs list >actual &&
+                               test_cmp expect actual &&
+
+                               git refs list | grep -v "refs/tags/1" >expect &&
+                               run_with_uri . "$from_format" "$to_format://$BACKEND_PATH" "refs list" >actual &&
+                               test_cmp expect actual
+                       )
+               '
+
+               test_expect_success "with worktree and $to_format backend, $dir dir" '
+                       test_when_finished "rm -rf repo wt" &&
+                       git init --ref-format=$from_format repo &&
+                       (
+                               cd repo &&
+                               test_commit 1 &&
+                               test_commit 2 &&
+                               test_commit 3 &&
+
+                               git refs migrate --dry-run --ref-format=$to_format >out &&
+                               BACKEND_PATH="$dir/$(sed "s/.* ${SQ}.git\/\(.*\)${SQ}/\1/" out)" &&
+
+                               git config set core.repositoryformatversion 1 &&
+                               git config set extensions.refStorage "$to_format://$BACKEND_PATH" &&
+
+                               git worktree add ../wt 2
+                       ) &&
+
+                       git -C repo for-each-ref --include-root-refs >expect &&
+                       git -C wt for-each-ref --include-root-refs >expect &&
+                       ! test_cmp expect actual &&
+
+                       git -C wt rev-parse 2 >expect &&
+                       git -C wt rev-parse HEAD >actual &&
+                       test_cmp expect actual
+               '
+       done # closes dir
+done # closes to_format
+done # closes from_format
+
+test_done