]> git.ipfire.org Git - thirdparty/git.git/commitdiff
builtin/history: implement "split" subcommand
authorPatrick Steinhardt <ps@pks.im>
Wed, 1 Oct 2025 15:57:38 +0000 (17:57 +0200)
committerJunio C Hamano <gitster@pobox.com>
Wed, 1 Oct 2025 19:33:30 +0000 (12:33 -0700)
It is quite a common use case that one wants to split up one commit into
multiple commits by moving parts of the changes of the original commit
out into a separate commit. This is quite an involved operation though:

  1. Identify the commit in question that is to be dropped.

  2. Perform an interactive rebase on top of that commit's parent.

  3. Modify the instruction sheet to "edit" the commit that is to be
     split up.

  4. Drop the commit via "git reset HEAD~".

  5. Stage changes that should go into the first commit and commit it.

  6. Stage changes that should go into the second commit and commit it.

  7. Finalize the rebase.

This is quite complex, and overall I would claim that most people who
are not experts in Git would struggle with this flow.

Introduce a new "split" subcommand for git-history(1) to make this way
easier. All the user needs to do is to say `git history split $COMMIT`.
From hereon, Git asks the user which parts of the commit shall be moved
out into a separate commit and, once done, asks the user for the commit
message. Git then creates that split-out commit and applies the original
commit on top of it.

Signed-off-by: Patrick Steinhardt <ps@pks.im>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
Documentation/git-history.adoc
builtin/history.c
t/meson.build
t/t3452-history-split.sh [new file with mode: 0755]

index b55babe206eb43d239f4925011e09af1967dd9c2..83d675afeaab18dbadc72d11c18ce5b2b6bc47e1 100644 (file)
@@ -10,6 +10,7 @@ SYNOPSIS
 [synopsis]
 git history [<options>]
 git history reword [<options>] <commit>
+git history split [<options>] <commit> [--] [<pathspec>...]
 
 DESCRIPTION
 -----------
@@ -40,6 +41,26 @@ rewrite history in different ways:
        provided, then this command will spawn an editor with the current
        message of that commit.
 
+`split [--message=<message>] <commit> [--] [<pathspec>...]`::
+       Interactively split up <commit> into two commits by choosing
+       hunks introduced by it that will be moved into the new split-out
+       commit. These hunks will then be written into a new commit that
+       becomes the parent of the previous commit. The original commit
+       stays intact, except that its parent will be the newly split-out
+       commit.
++
+The commit message of the new commit will be asked for by launching the
+configured editor, unless it has been specified with the `-m` option.
+Authorship of the commit will be the same as for the original commit.
++
+If passed, _<pathspec>_ can be used to limit which changes shall be split out
+of the original commit. Files not matching any of the pathspecs will remain
+part of the original commit. For more details, see the 'pathspec' entry in
+linkgit:gitglossary[7].
++
+It is invalid to select either all or no hunks, as that would lead to
+one of the commits becoming empty.
+
 CONFIGURATION
 -------------
 
@@ -47,6 +68,47 @@ include::includes/cmd-config-section-all.adoc[]
 
 include::config/sequencer.adoc[]
 
+EXAMPLES
+--------
+
+Split a commit
+~~~~~~~~~~~~~~
+
+----------
+$ git log --stat --oneline
+3f81232 (HEAD -> main) original
+ bar | 1 +
+ foo | 1 +
+ 2 files changed, 2 insertions(+)
+
+$ git history split HEAD --message="split-out commit"
+diff --git a/bar b/bar
+new file mode 100644
+index 0000000..5716ca5
+--- /dev/null
++++ b/bar
+@@ -0,0 +1 @@
++bar
+(1/1) Stage addition [y,n,q,a,d,e,p,?]? y
+
+diff --git a/foo b/foo
+new file mode 100644
+index 0000000..257cc56
+--- /dev/null
++++ b/foo
+@@ -0,0 +1 @@
++foo
+(1/1) Stage addition [y,n,q,a,d,e,p,?]? n
+
+$ git log --stat --oneline
+7cebe64 (HEAD -> main) original
+ foo | 1 +
+ 1 file changed, 1 insertion(+)
+d1582f3 split-out commit
+ bar | 1 +
+ 1 file changed, 1 insertion(+)
+----------
+
 GIT
 ---
 Part of the linkgit:git[1] suite
index 7b2a0023e86909b4ba364e6d540abae5d8607ca4..8851a2945ebbb2cb17a2d96b0761f7d5f8d7067c 100644 (file)
@@ -1,6 +1,7 @@
 #define USE_THE_REPOSITORY_VARIABLE
 
 #include "builtin.h"
+#include "cache-tree.h"
 #include "commit-reach.h"
 #include "commit.h"
 #include "config.h"
 #include "hex.h"
 #include "oidmap.h"
 #include "parse-options.h"
+#include "path.h"
+#include "read-cache.h"
 #include "refs.h"
 #include "replay.h"
 #include "reset.h"
 #include "revision.h"
+#include "run-command.h"
 #include "sequencer.h"
 #include "strvec.h"
 #include "tree.h"
@@ -368,6 +372,225 @@ out:
        return ret;
 }
 
+static int split_commit(struct repository *repo,
+                       struct commit *original_commit,
+                       struct pathspec *pathspec,
+                       const char *commit_message,
+                       struct object_id *out)
+{
+       struct interactive_options interactive_opts = INTERACTIVE_OPTIONS_INIT;
+       struct strbuf index_file = STRBUF_INIT, split_message = STRBUF_INIT;
+       struct child_process read_tree_cmd = CHILD_PROCESS_INIT;
+       struct index_state index = INDEX_STATE_INIT(repo);
+       struct object_id original_commit_tree_oid, parent_tree_oid;
+       const char *original_message, *original_body, *ptr;
+       char original_commit_oid[GIT_MAX_HEXSZ + 1];
+       char *original_author = NULL;
+       struct commit_list *parents = NULL;
+       struct commit *first_commit;
+       struct tree *split_tree;
+       size_t len;
+       int ret;
+
+       if (original_commit->parents)
+               parent_tree_oid = *get_commit_tree_oid(original_commit->parents->item);
+       else
+               oidcpy(&parent_tree_oid, repo->hash_algo->empty_tree);
+       original_commit_tree_oid = *get_commit_tree_oid(original_commit);
+
+       /*
+       * Construct the first commit. This is done by taking the original
+       * commit parent's tree and selectively patching changes from the diff
+       * between that parent and its child.
+       */
+       repo_git_path_replace(repo, &index_file, "%s", "history-split.index");
+
+       read_tree_cmd.git_cmd = 1;
+       strvec_pushf(&read_tree_cmd.env, "GIT_INDEX_FILE=%s", index_file.buf);
+       strvec_push(&read_tree_cmd.args, "read-tree");
+       strvec_push(&read_tree_cmd.args, oid_to_hex(&parent_tree_oid));
+       ret = run_command(&read_tree_cmd);
+       if (ret < 0)
+               goto out;
+
+       ret = read_index_from(&index, index_file.buf, repo->gitdir);
+       if (ret < 0) {
+               ret = error(_("failed reading temporary index"));
+               goto out;
+       }
+
+       oid_to_hex_r(original_commit_oid, &original_commit->object.oid);
+       ret = run_add_p_index(repo, &index, index_file.buf, &interactive_opts,
+                             original_commit_oid, pathspec);
+       if (ret < 0)
+               goto out;
+
+       split_tree = write_in_core_index_as_tree(repo, &index);
+       if (!split_tree) {
+               ret = error(_("failed split tree"));
+               goto out;
+       }
+
+       unlink(index_file.buf);
+
+       /*
+       * We disallow the cases where either the split-out commit or the
+       * original commit would become empty. Consequently, if we see that the
+       * new tree ID matches either of those trees we abort.
+       */
+       if (oideq(&split_tree->object.oid, &parent_tree_oid)) {
+               ret = error(_("split commit is empty"));
+               goto out;
+       } else if (oideq(&split_tree->object.oid, &original_commit_tree_oid)) {
+               ret = error(_("split commit tree matches original commit"));
+               goto out;
+       }
+
+       /* We retain authorship of the original commit. */
+       original_message = repo_logmsg_reencode(repo, original_commit, NULL, NULL);
+       ptr = find_commit_header(original_message, "author", &len);
+       if (ptr)
+               original_author = xmemdupz(ptr, len);
+
+       ret = fill_commit_message(repo, &parent_tree_oid, &split_tree->object.oid,
+                                 "", commit_message, "split-out", &split_message);
+       if (ret < 0)
+               goto out;
+
+       ret = commit_tree(split_message.buf, split_message.len, &split_tree->object.oid,
+                         original_commit->parents, &out[0], original_author, NULL);
+       if (ret < 0) {
+               ret = error(_("failed writing split-out commit"));
+               goto out;
+       }
+
+       /*
+       * The second commit is much simpler to construct, as we can simply use
+       * the original commit details, except that we adjust its parent to be
+       * the newly split-out commit.
+       */
+       find_commit_subject(original_message, &original_body);
+       first_commit = lookup_commit_reference(repo, &out[0]);
+       commit_list_append(first_commit, &parents);
+
+       ret = commit_tree(original_body, strlen(original_body), &original_commit_tree_oid,
+                         parents, &out[1], original_author, NULL);
+       if (ret < 0) {
+               ret = error(_("failed writing second commit"));
+               goto out;
+       }
+
+       ret = 0;
+
+out:
+       if (index_file.len)
+               unlink(index_file.buf);
+       strbuf_release(&split_message);
+       strbuf_release(&index_file);
+       free_commit_list(parents);
+       free(original_author);
+       release_index(&index);
+       return ret;
+}
+
+static int cmd_history_split(int argc,
+                            const char **argv,
+                            const char *prefix,
+                            struct repository *repo)
+{
+       const char * const usage[] = {
+               N_("git history split [<options>] <commit>"),
+               NULL,
+       };
+       const char *commit_message = NULL;
+       struct option options[] = {
+               OPT_STRING('m', "message", &commit_message, N_("message"), N_("commit message")),
+               OPT_END(),
+       };
+       struct oidmap rewritten_commits = OIDMAP_INIT;
+       struct commit *original_commit, *parent, *head;
+       struct strvec commits = STRVEC_INIT;
+       struct commit_list *list = NULL;
+       struct object_id split_commits[2];
+       struct pathspec pathspec = { 0 };
+       int ret;
+
+       argc = parse_options(argc, argv, prefix, options, usage, 0);
+       if (argc < 1) {
+               ret = error(_("command expects a revision"));
+               goto out;
+       }
+       repo_config(repo, git_default_config, NULL);
+
+       original_commit = lookup_commit_reference_by_name(argv[0]);
+       if (!original_commit) {
+               ret = error(_("commit to be split cannot be found: %s"), argv[0]);
+               goto out;
+       }
+
+       if (original_commit->parents && original_commit->parents->next) {
+               ret = error(_("commit to be split must not be a merge commit"));
+               goto out;
+       }
+
+       parent = original_commit->parents ? original_commit->parents->item : NULL;
+       if (parent && repo_parse_commit(repo, parent)) {
+               ret = error(_("unable to parse commit %s"),
+                           oid_to_hex(&parent->object.oid));
+               goto out;
+       }
+
+       head = lookup_commit_reference_by_name("HEAD");
+       if (!head) {
+               ret = error(_("could not resolve HEAD to a commit"));
+               goto out;
+       }
+
+       commit_list_append(original_commit, &list);
+       if (!repo_is_descendant_of(repo, original_commit, list)) {
+               ret = error (_("split commit must be reachable from current HEAD commit"));
+               goto out;
+       }
+
+       parse_pathspec(&pathspec, 0,
+               PATHSPEC_PREFER_FULL | PATHSPEC_SYMLINK_LEADING_PATH | PATHSPEC_PREFIX_ORIGIN,
+               prefix, argv + 1);
+
+       /*
+       * Collect the list of commits that we'll have to reapply now already.
+       * This ensures that we'll abort early on in case the range of commits
+       * contains merges, which we do not yet handle.
+       */
+       ret = collect_commits(repo, parent, head, &commits);
+       if (ret < 0)
+               goto out;
+
+       /*
+        * Then we split up the commit and replace the original commit with the
+        * new new ones.
+        */
+       ret = split_commit(repo, original_commit, &pathspec,
+                          commit_message, split_commits);
+       if (ret < 0)
+               goto out;
+
+       replace_commits(&commits, &original_commit->object.oid,
+                       split_commits, ARRAY_SIZE(split_commits));
+
+       ret = apply_commits(repo, &commits, parent, head, "split");
+       if (ret < 0)
+               goto out;
+
+       ret = 0;
+
+out:
+       oidmap_clear(&rewritten_commits, 0);
+       clear_pathspec(&pathspec);
+       strvec_clear(&commits);
+       free_commit_list(list);
+       return ret;
+}
+
 int cmd_history(int argc,
                const char **argv,
                const char *prefix,
@@ -376,11 +599,13 @@ int cmd_history(int argc,
        const char * const usage[] = {
                N_("git history [<options>]"),
                N_("git history reword [<options>] <commit>"),
+               N_("git history split [<options>] <commit> [--] [<pathspec>...]"),
                NULL,
        };
        parse_opt_subcommand_fn *fn = NULL;
        struct option options[] = {
                OPT_SUBCOMMAND("reword", &fn, cmd_history_reword),
+               OPT_SUBCOMMAND("split", &fn, cmd_history_split),
                OPT_END(),
        };
 
index 2a742432026cecc9a7e80c75a5e813115c47f1ee..fb05be16ae247c5cf7ad208152c695c95ef9812a 100644 (file)
@@ -384,6 +384,7 @@ integration_tests = [
   't3438-rebase-broken-files.sh',
   't3450-history.sh',
   't3451-history-reword.sh',
+  't3452-history-split.sh',
   't3500-cherry.sh',
   't3501-revert-cherry-pick.sh',
   't3502-cherry-pick-merge.sh',
diff --git a/t/t3452-history-split.sh b/t/t3452-history-split.sh
new file mode 100755 (executable)
index 0000000..45d3b32
--- /dev/null
@@ -0,0 +1,432 @@
+#!/bin/sh
+
+test_description='tests for git-history split subcommand'
+
+. ./test-lib.sh
+
+set_fake_editor () {
+       write_script fake-editor.sh <<-\EOF &&
+       echo "split-out commit" >"$1"
+       EOF
+       test_set_editor "$(pwd)"/fake-editor.sh
+}
+
+expect_log () {
+       git log --format="%s" >actual &&
+       cat >expect &&
+       test_cmp expect actual
+}
+
+expect_tree_entries () {
+       git ls-tree --name-only "$1" >actual &&
+       cat >expect &&
+       test_cmp expect actual
+}
+
+test_expect_success 'refuses to work with merge commits' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               test_commit base &&
+               git branch branch &&
+               test_commit ours &&
+               git switch branch &&
+               test_commit theirs &&
+               git switch - &&
+               git merge theirs &&
+               test_must_fail git history split HEAD 2>err &&
+               test_grep "commit to be split must not be a merge commit" err &&
+               test_must_fail git history split HEAD~ 2>err &&
+               test_grep "cannot rearrange commit history with merges" err
+       )
+'
+
+test_expect_success 'can split up tip commit' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               test_commit initial &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               git symbolic-ref HEAD >expect &&
+               set_fake_editor &&
+               git history split HEAD <<-EOF &&
+               y
+               n
+               EOF
+               git symbolic-ref HEAD >actual &&
+               test_cmp expect actual &&
+
+               expect_log <<-EOF &&
+               split-me
+               split-out commit
+               initial
+               EOF
+
+               expect_tree_entries HEAD~ <<-EOF &&
+               bar
+               initial.t
+               EOF
+
+               expect_tree_entries HEAD <<-EOF
+               bar
+               foo
+               initial.t
+               EOF
+       )
+'
+
+test_expect_success 'can split up root commit' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m root &&
+               test_commit tip &&
+
+               set_fake_editor &&
+               git history split HEAD~ <<-EOF &&
+               y
+               n
+               EOF
+
+               expect_log <<-EOF &&
+               tip
+               root
+               split-out commit
+               EOF
+
+               expect_tree_entries HEAD~2 <<-EOF &&
+               bar
+               EOF
+
+               expect_tree_entries HEAD~ <<-EOF &&
+               bar
+               foo
+               EOF
+
+               expect_tree_entries HEAD <<-EOF
+               bar
+               foo
+               tip.t
+               EOF
+       )
+'
+
+test_expect_success 'can split up in-between commit' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               test_commit initial &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+               test_commit tip &&
+
+               set_fake_editor &&
+               git history split HEAD~ <<-EOF &&
+               y
+               n
+               EOF
+
+               expect_log <<-EOF &&
+               tip
+               split-me
+               split-out commit
+               initial
+               EOF
+
+               expect_tree_entries HEAD~2 <<-EOF &&
+               bar
+               initial.t
+               EOF
+
+               expect_tree_entries HEAD~ <<-EOF &&
+               bar
+               foo
+               initial.t
+               EOF
+
+               expect_tree_entries HEAD <<-EOF
+               bar
+               foo
+               initial.t
+               tip.t
+               EOF
+       )
+'
+
+test_expect_success 'can pick multiple hunks' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar baz foo qux &&
+               git add . &&
+               git commit -m split-me &&
+
+               git history split HEAD -m "split-out commit" <<-EOF &&
+               y
+               n
+               y
+               n
+               EOF
+
+               expect_tree_entries HEAD~ <<-EOF &&
+               bar
+               foo
+               EOF
+
+               expect_tree_entries HEAD <<-EOF
+               bar
+               baz
+               foo
+               qux
+               EOF
+       )
+'
+
+
+test_expect_success 'can use only last hunk' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               git history split HEAD -m "split-out commit" <<-EOF &&
+               n
+               y
+               EOF
+
+               expect_log <<-EOF &&
+               split-me
+               split-out commit
+               EOF
+
+               expect_tree_entries HEAD~ <<-EOF &&
+               foo
+               EOF
+
+               expect_tree_entries HEAD <<-EOF
+               bar
+               foo
+               EOF
+       )
+'
+
+test_expect_success 'aborts with empty commit message' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               test_must_fail git history split HEAD -m "" <<-EOF 2>err &&
+               y
+               n
+               EOF
+               test_grep "Aborting commit due to empty commit message." err
+       )
+'
+
+test_expect_success 'can specify message via option' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               git history split HEAD -m "message option" <<-EOF &&
+               y
+               n
+               EOF
+
+               expect_log <<-EOF
+               split-me
+               message option
+               EOF
+       )
+'
+
+test_expect_success 'commit message editor sees split-out changes' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               write_script fake-editor.sh <<-\EOF &&
+               cp "$1" . &&
+               echo "some commit message" >>"$1"
+               EOF
+               test_set_editor "$(pwd)"/fake-editor.sh &&
+
+               git history split HEAD <<-EOF &&
+               y
+               n
+               EOF
+
+               cat >expect <<-EOF &&
+
+               # Please enter the commit message for the split-out changes. Lines starting
+               # with ${SQ}#${SQ} will be kept; you may remove them yourself if you want to.
+               # Changes to be committed:
+               #       new file:   bar
+               #
+               EOF
+               test_cmp expect COMMIT_EDITMSG &&
+
+               expect_log <<-EOF
+               split-me
+               some commit message
+               EOF
+       )
+'
+
+test_expect_success 'can use pathspec to limit what gets split' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               git history split HEAD -m "message option" -- foo <<-EOF &&
+               y
+               EOF
+
+               expect_tree_entries HEAD~ <<-EOF &&
+               foo
+               EOF
+
+               expect_tree_entries HEAD <<-EOF
+               bar
+               foo
+               EOF
+       )
+'
+
+test_expect_success 'refuses to create empty split-out commit' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               test_commit base &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               test_must_fail git history split HEAD 2>err <<-EOF &&
+               n
+               n
+               EOF
+               test_grep "split commit is empty" err
+       )
+'
+
+test_expect_success 'hooks are executed for rewritten commits' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+               old_head=$(git rev-parse HEAD) &&
+
+               write_script .git/hooks/prepare-commit-msg <<-EOF &&
+               touch "$(pwd)/hooks.log"
+               EOF
+               write_script .git/hooks/post-commit <<-EOF &&
+               touch "$(pwd)/hooks.log"
+               EOF
+               write_script .git/hooks/post-rewrite <<-EOF &&
+               touch "$(pwd)/hooks.log"
+               EOF
+
+               set_fake_editor &&
+               git history split HEAD <<-EOF &&
+               y
+               n
+               EOF
+
+               expect_log <<-EOF &&
+               split-me
+               split-out commit
+               EOF
+
+               test_path_is_missing hooks.log
+       )
+'
+
+test_expect_success 'refuses to create empty original commit' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               touch bar foo &&
+               git add . &&
+               git commit -m split-me &&
+
+               test_must_fail git history split HEAD 2>err <<-EOF &&
+               y
+               y
+               EOF
+               test_grep "split commit tree matches original commit" err
+       )
+'
+
+test_expect_success 'retains changes in the worktree and index' '
+       test_when_finished "rm -rf repo" &&
+       git init repo &&
+       (
+               cd repo &&
+               echo a >a &&
+               echo b >b &&
+               git add . &&
+               git commit -m "initial commit" &&
+               echo a-modified >a &&
+               echo b-modified >b &&
+               git add b &&
+               git history split HEAD -m a-only <<-EOF &&
+               y
+               n
+               EOF
+
+               expect_tree_entries HEAD~ <<-EOF &&
+               a
+               EOF
+               expect_tree_entries HEAD <<-EOF &&
+               a
+               b
+               EOF
+
+               cat >expect <<-\EOF &&
+                M a
+               M  b
+               ?? actual
+               ?? expect
+               EOF
+               git status --porcelain >actual &&
+               test_cmp expect actual
+       )
+'
+
+test_done