diff mbox series

[v2] remote: introduce config to set prefetch refs

Message ID pull.1782.v2.git.1726409329993.gitgitgadget@gmail.com (mailing list archive)
State Superseded
Headers show
Series [v2] remote: introduce config to set prefetch refs | expand

Commit Message

Shubham Kanodia Sept. 15, 2024, 2:08 p.m. UTC
From: Shubham Kanodia <shubham.kanodia10@gmail.com>

This commit introduces a new configuration option,
remote.<name>.prefetchref, which allows users to specify specific
ref patterns to be prefetched during a git fetch --prefetch
operation.

The new option accepts a space-separated list of ref patterns.
When the --prefetch option is used with git fetch, only the refs
matching these patterns will be prefetched, instead of the
default behavior of prefetching all fetchable refs.

Example usage in .git/config:
[remote "origin"]
    prefetchref = "refs/heads/main refs/heads/feature/*"

This change allows users to optimize their prefetch operations, potentially
reducing network traffic and improving performance for large repositories
with many refs.

Signed-off-by: Shubham Kanodia <shubham.kanodia10@gmail.com>
---
    remote: introduce config to set prefetch refs

Published-As: https://github.com/gitgitgadget/git/releases/tag/pr-1782%2Fpastelsky%2Fsk%2Fremote-prefetchref-v2
Fetch-It-Via: git fetch https://github.com/gitgitgadget/git pr-1782/pastelsky/sk/remote-prefetchref-v2
Pull-Request: https://github.com/gitgitgadget/git/pull/1782

Range-diff vs v1:

 1:  3113d8b8635 ! 1:  f9f9e637bfa remote: introduce config to set prefetch refs
     @@ Documentation/config/remote.txt: remote.<name>.fetch::
       	linkgit:git-push[1].
      
       ## builtin/fetch.c ##
     -@@ builtin/fetch.c: static void find_non_local_tags(const struct ref *refs,
     - 	oidset_clear(&fetch_oids);
     +@@
     + #include "trace.h"
     + #include "trace2.h"
     + #include "bundle-uri.h"
     ++#include "wildmatch.h"
     + 
     + #define FORCED_UPDATES_DELAY_WARNING_IN_MS (10 * 1000)
     + 
     +@@ builtin/fetch.c: static void filter_prefetch_refspec(struct refspec *rs)
     + 	}
       }
       
     -+static void apply_prefetch_refspec(struct remote *remote, struct refspec *rs)
     ++static int matches_prefetch_refs(const char *refname, const struct string_list *prefetch_refs)
      +{
     -+	if (remote->prefetch_refs.nr > 0) {
     -+		int i;
     -+		for (i = 0; i < remote->prefetch_refs.nr; i++) {
     -+			const char *src = remote->prefetch_refs.items[i].string;
     -+			struct strbuf dst = STRBUF_INIT;
     -+
     -+			strbuf_addf(&dst, "refs/prefetch/%s/", remote->name);
     -+			if (starts_with(src, "refs/heads/")) {
     -+				strbuf_addstr(&dst, src + 11);
     -+			} else if (starts_with(src, "refs/")) {
     -+				strbuf_addstr(&dst, src + 5);
     -+			} else {
     -+				strbuf_addstr(&dst, src);
     -+			}
     ++	int i;
     ++	int has_positive = 0;
     ++	int matched_positive = 0;
     ++	int matched_negative = 0;
     ++
     ++	for (i = 0; i < prefetch_refs->nr; i++) {
     ++		const char *pattern = prefetch_refs->items[i].string;
     ++		int is_negative = (*pattern == '!');
     ++
     ++		if (is_negative)
     ++			pattern++;
     ++		else
     ++			has_positive = 1;
      +
     -+			refspec_appendf(rs, "%s:%s", src, dst.buf);
     -+			strbuf_release(&dst);
     ++		if (wildmatch(pattern, refname, 0) == 0) {
     ++			if (is_negative)
     ++				matched_negative = 1;
     ++			else
     ++				matched_positive = 1;
      +		}
      +	}
     ++
     ++	if (!has_positive)
     ++		return !matched_negative;
     ++
     ++	return matched_positive && !matched_negative;
      +}
      +
      +
     - static void filter_prefetch_refspec(struct refspec *rs)
     - {
     - 	int i;
     ++static void ref_remove(struct ref **head, struct ref *to_remove)
     ++{
     ++	struct ref **pp, *p;
     ++
     ++	for (pp = head; (p = *pp) != NULL; pp = &p->next) {
     ++		if (p == to_remove) {
     ++			*pp = p->next;
     ++			return;
     ++		}
     ++	}
     ++}
     ++
     + static struct ref *get_ref_map(struct remote *remote,
     + 			       const struct ref *remote_refs,
     + 			       struct refspec *rs,
      @@ builtin/fetch.c: static struct ref *get_ref_map(struct remote *remote,
       	int existing_refs_populated = 0;
       
       	filter_prefetch_refspec(rs);
     --	if (remote)
     -+	if (remote) {
     ++
     + 	if (remote)
       		filter_prefetch_refspec(&remote->fetch);
     -+		if (prefetch)
     -+			apply_prefetch_refspec(remote, rs);
     + 
     +@@ builtin/fetch.c: static struct ref *get_ref_map(struct remote *remote,
     + 	else
     + 		ref_map = apply_negative_refspecs(ref_map, &remote->fetch);
     + 
     ++	/**
     ++	 * Filter out advertised refs that we don't want to fetch during
     ++	 * prefetch if a prefetchref config is set
     ++	 */
     ++	if (prefetch && remote->prefetch_refs.nr) {
     ++		struct ref *ref, *next;
     ++		for (ref = ref_map; ref; ref = next) {
     ++			next = ref->next;
     ++
     ++			if (!matches_prefetch_refs(ref->name, &remote->prefetch_refs)) {
     ++					ref_remove(&ref_map, ref);
     ++					free_one_ref(ref);
     ++			}
     ++		}
      +	}
     ++
     + 	ref_map = ref_remove_duplicates(ref_map);
       
     - 	if (rs->nr) {
     - 		struct refspec *fetch_refspec;
     + 	for (rm = ref_map; rm; rm = rm->next) {
      
       ## remote.c ##
      @@ remote.c: static struct remote *make_remote(struct remote_state *remote_state,
     @@ t/t7900-maintenance.sh: test_expect_success 'prefetch multiple remotes' '
       	test_subcommand git fetch remote2 $fetchargs <skip-remote1.txt
       '
       
     -+test_expect_success 'prefetch only acts on remote.<name>.prefetchref refs if present' '
     -+	test_create_repo prefetch-test-mixed-patterns &&
     ++test_expect_success 'prefetch with positive prefetch ref patterns' '
     ++	test_create_repo filter-prefetch-positive &&
      +	(
     -+		cd prefetch-test-mixed-patterns &&
     ++		cd filter-prefetch-positive &&
      +		test_commit initial &&
     -+		git clone . clone1 &&
      +		git clone . clone2 &&
     -+
     -+		git remote add remote1 "file://$(pwd)/clone1" &&
      +		git remote add remote2 "file://$(pwd)/clone2" &&
      +
     -+		# Set single prefetchref pattern for remote1 and multiple for remote2
     -+		git config remote.remote1.prefetchref "refs/heads/foo" &&
     -+		git config remote.remote2.prefetchref "refs/heads/feature/* refs/heads/topic" &&
     -+
     -+		# Create branches in clone1 and push
     -+		(
     -+			cd clone1 &&
     -+			git checkout -b foo &&
     -+			test_commit foo-commit &&
     -+			git checkout -b feature/a &&
     -+			test_commit feature-a-commit &&
     -+			git checkout -b other &&
     -+			test_commit other-commit &&
     -+			git push origin foo feature/a other
     -+		) &&
     -+
     -+		# Create branches in clone2 and push
     -+		(
     -+			cd clone2 &&
     -+			git checkout -b topic &&
     -+			test_commit master-commit &&
     -+			git checkout -b feature/x &&
     -+			test_commit feature-x-commit &&
     -+			git checkout -b feature/y &&
     -+			test_commit feature-y-commit &&
     -+			git checkout -b dev &&
     -+			test_commit dev-commit &&
     -+			git push origin topic feature/x feature/y dev
     -+		) &&
     -+
     -+		# Run maintenance prefetch task
     -+		GIT_TRACE2_EVENT="$(pwd)/prefetch.txt" git maintenance run --task=prefetch 2>/dev/null &&
     -+
     -+		# Check that only specified refs were prefetched
     ++		cd clone2 &&
     ++		git checkout -b feature && test_commit feature-commit-2 &&
     ++		git checkout -b wip/test && test_commit wip-test-commit-2 &&
     ++		git checkout -b topic/x && test_commit topic-x-commit-2 &&
     ++		git push -f origin feature wip/test topic/x&&
     ++		cd .. &&
     ++
     ++		git config remote.remote2.prefetchref "refs/heads/feature" &&
      +		fetchargs="--prefetch --prune --no-tags --no-write-fetch-head --recurse-submodules=no --quiet" &&
     -+		test_subcommand git fetch remote1 $fetchargs <prefetch.txt &&
     -+		test_subcommand git fetch remote2 $fetchargs <prefetch.txt &&
     -+		ls -R .git/refs/prefetch &&
     -+
     -+		# Verify that only specified refs are in the prefetch refs for remote1
     -+		 git rev-parse refs/prefetch/remotes/remote1/foo &&
     -+		test_must_fail git rev-parse refs/prefetch/remotes/remote1/feature/a &&
     -+		test_must_fail git rev-parse refs/prefetch/remotes/remote1/other &&
     -+
     -+				# Verify that only specified refs are in the prefetch refs for remote2
     -+		git rev-parse refs/prefetch/remotes/remote2/feature/x &&
     -+		git rev-parse refs/prefetch/remotes/remote2/feature/y &&
     -+		git rev-parse refs/prefetch/remotes/remote2/topic &&
     -+		test_must_fail git rev-parse refs/prefetch/remotes/remote2/dev &&
     -+
     -+		# Fetch all refs and compare
     -+		git fetch --all &&
     -+		test_cmp_rev refs/remotes/remote1/foo refs/prefetch/remotes/remote1/foo &&
     -+		test_cmp_rev refs/remotes/remote2/feature/x refs/prefetch/remotes/remote2/feature/x &&
     -+		test_cmp_rev refs/remotes/remote2/feature/y refs/prefetch/remotes/remote2/feature/y &&
     -+		test_cmp_rev refs/remotes/remote2/topic refs/prefetch/remotes/remote2/topic
     ++		GIT_TRACE2_EVENT="$(pwd)/prefetch-positive.txt" git maintenance run --task=prefetch 2>/dev/null &&
     ++		test_subcommand git fetch remote2 $fetchargs <prefetch-positive.txt &&
     ++
     ++		git rev-parse refs/prefetch/remotes/remote2/feature &&
     ++		test_must_fail git rev-parse refs/prefetch/remotes/remote2/wip/test &&
     ++		test_must_fail git rev-parse refs/prefetch/remotes/remote2/topic/x
     ++	)
     ++'
     ++
     ++test_expect_success 'prefetch with negative prefetch ref patterns' '
     ++	test_create_repo filter-prefetch-negative &&
     ++	(
     ++		cd filter-prefetch-negative &&
     ++		test_commit initial &&
     ++		git clone . clone3 &&
     ++		git remote add remote3 "file://$(pwd)/clone3" &&
     ++		cat .git/config &&
     ++
     ++		cd clone3 &&
     ++		git checkout -b feature && test_commit feature-commit-3 &&
     ++		git checkout -b wip/test && test_commit wip-test-commit-3 &&
     ++		git checkout -b topic/x && test_commit topic-x-commit-3 &&
     ++		git push -f origin feature wip/test topic/x &&
     ++		cd .. &&
     ++
     ++		git config remote.remote3.prefetchref "!refs/heads/wip/*" &&
     ++		fetchargs="--prefetch --prune --no-tags --no-write-fetch-head --recurse-submodules=no --quiet" &&
     ++		GIT_TRACE2_EVENT="$(pwd)/prefetch-negative.txt" git maintenance run --task=prefetch 2>/dev/null &&
     ++		test_subcommand git fetch remote3 $fetchargs <prefetch-negative.txt &&
     ++		git rev-parse refs/prefetch/remotes/remote3/feature &&
     ++		git rev-parse refs/prefetch/remotes/remote3/topic/x &&
     ++		test_must_fail git rev-parse refs/prefetch/remotes/remote3/wip/test
     ++	)
     ++'
     ++
     ++test_expect_success 'prefetch with positive & negative prefetch ref patterns' '
     ++	test_create_repo filter-prefetch-mixed &&
     ++	(
     ++		cd filter-prefetch-mixed &&
     ++		test_commit initial &&
     ++		git clone . clone4 &&
     ++		git remote add remote4 "file://$(pwd)/clone4" &&
     ++
     ++		cd clone4 &&
     ++		git checkout -b feature && test_commit feature-commit-4 &&
     ++		git checkout -b topic/x && test_commit topic-x-commit-4 &&
     ++		git checkout -b topic/y && test_commit topic-y-commit-4 &&
     ++		git push -f origin feature topic/x topic/y &&
     ++		cd .. &&
     ++
     ++		git config remote.remote4.prefetchref "refs/heads/topic/* !refs/heads/topic/y" &&
     ++		# git config --add remote.remote4.prefetchref "!refs/topic/y" &&
     ++		cat .git/config &&
     ++		fetchargs="--prefetch --prune --no-tags --no-write-fetch-head --recurse-submodules=no --quiet" &&
     ++		GIT_TRACE2_EVENT="$(pwd)/prefetch-mixed.txt" git maintenance run --task=prefetch 2>/dev/null &&
     ++		test_subcommand git fetch remote4 $fetchargs <prefetch-mixed.txt &&
     ++
     ++		test_must_fail git rev-parse refs/prefetch/remotes/remote4/feature &&
     ++		test_must_fail git rev-parse refs/prefetch/remotes/remote4/topic/y &&
     ++		git rev-parse refs/prefetch/remotes/remote4/topic/x
      +	)
      +'
      +


 Documentation/config/remote.txt |  6 +++
 builtin/fetch.c                 | 61 +++++++++++++++++++++++++
 remote.c                        |  8 ++++
 remote.h                        |  3 ++
 t/t7900-maintenance.sh          | 80 +++++++++++++++++++++++++++++++++
 5 files changed, 158 insertions(+)


base-commit: 2e7b89e038c0c888acf61f1b4ee5a43d4dd5e94c
diff mbox series

Patch

diff --git a/Documentation/config/remote.txt b/Documentation/config/remote.txt
index 8efc53e836d..b25d76dd3b1 100644
--- a/Documentation/config/remote.txt
+++ b/Documentation/config/remote.txt
@@ -33,6 +33,12 @@  remote.<name>.fetch::
 	The default set of "refspec" for linkgit:git-fetch[1]. See
 	linkgit:git-fetch[1].
 
+remote.<name>.prefetchref::
+    Specify the refs to be prefetched when fetching from this remote.
+    The value is a space-separated list of ref patterns (e.g., "refs/heads/master refs/heads/develop*").
+    These patterns are used as the source part of the refspecs for prefetching.
+    This can be used to optimize fetch operations by specifying exactly which refs should be prefetched.
+
 remote.<name>.push::
 	The default set of "refspec" for linkgit:git-push[1]. See
 	linkgit:git-push[1].
diff --git a/builtin/fetch.c b/builtin/fetch.c
index b2b5aee5bf2..16c8a31c2e1 100644
--- a/builtin/fetch.c
+++ b/builtin/fetch.c
@@ -38,6 +38,7 @@ 
 #include "trace.h"
 #include "trace2.h"
 #include "bundle-uri.h"
+#include "wildmatch.h"
 
 #define FORCED_UPDATES_DELAY_WARNING_IN_MS (10 * 1000)
 
@@ -485,6 +486,49 @@  static void filter_prefetch_refspec(struct refspec *rs)
 	}
 }
 
+static int matches_prefetch_refs(const char *refname, const struct string_list *prefetch_refs)
+{
+	int i;
+	int has_positive = 0;
+	int matched_positive = 0;
+	int matched_negative = 0;
+
+	for (i = 0; i < prefetch_refs->nr; i++) {
+		const char *pattern = prefetch_refs->items[i].string;
+		int is_negative = (*pattern == '!');
+
+		if (is_negative)
+			pattern++;
+		else
+			has_positive = 1;
+
+		if (wildmatch(pattern, refname, 0) == 0) {
+			if (is_negative)
+				matched_negative = 1;
+			else
+				matched_positive = 1;
+		}
+	}
+
+	if (!has_positive)
+		return !matched_negative;
+
+	return matched_positive && !matched_negative;
+}
+
+
+static void ref_remove(struct ref **head, struct ref *to_remove)
+{
+	struct ref **pp, *p;
+
+	for (pp = head; (p = *pp) != NULL; pp = &p->next) {
+		if (p == to_remove) {
+			*pp = p->next;
+			return;
+		}
+	}
+}
+
 static struct ref *get_ref_map(struct remote *remote,
 			       const struct ref *remote_refs,
 			       struct refspec *rs,
@@ -502,6 +546,7 @@  static struct ref *get_ref_map(struct remote *remote,
 	int existing_refs_populated = 0;
 
 	filter_prefetch_refspec(rs);
+
 	if (remote)
 		filter_prefetch_refspec(&remote->fetch);
 
@@ -610,6 +655,22 @@  static struct ref *get_ref_map(struct remote *remote,
 	else
 		ref_map = apply_negative_refspecs(ref_map, &remote->fetch);
 
+	/**
+	 * Filter out advertised refs that we don't want to fetch during
+	 * prefetch if a prefetchref config is set
+	 */
+	if (prefetch && remote->prefetch_refs.nr) {
+		struct ref *ref, *next;
+		for (ref = ref_map; ref; ref = next) {
+			next = ref->next;
+
+			if (!matches_prefetch_refs(ref->name, &remote->prefetch_refs)) {
+					ref_remove(&ref_map, ref);
+					free_one_ref(ref);
+			}
+		}
+	}
+
 	ref_map = ref_remove_duplicates(ref_map);
 
 	for (rm = ref_map; rm; rm = rm->next) {
diff --git a/remote.c b/remote.c
index 8f3dee13186..b46d62b2c47 100644
--- a/remote.c
+++ b/remote.c
@@ -141,6 +141,7 @@  static struct remote *make_remote(struct remote_state *remote_state,
 	ret->prune = -1;  /* unspecified */
 	ret->prune_tags = -1;  /* unspecified */
 	ret->name = xstrndup(name, len);
+	string_list_init_dup(&ret->prefetch_refs);
 	refspec_init(&ret->push, REFSPEC_PUSH);
 	refspec_init(&ret->fetch, REFSPEC_FETCH);
 
@@ -166,6 +167,7 @@  static void remote_clear(struct remote *remote)
 	free((char *)remote->uploadpack);
 	FREE_AND_NULL(remote->http_proxy);
 	FREE_AND_NULL(remote->http_proxy_authmethod);
+	string_list_clear(&remote->prefetch_refs, 0);
 }
 
 static void add_merge(struct branch *branch, const char *name)
@@ -456,6 +458,12 @@  static int handle_config(const char *key, const char *value,
 		remote->prune = git_config_bool(key, value);
 	else if (!strcmp(subkey, "prunetags"))
 		remote->prune_tags = git_config_bool(key, value);
+	else if (!strcmp(subkey, "prefetchref")) {
+		if (!value)
+			return config_error_nonbool(key);
+		string_list_split(&remote->prefetch_refs, value, ' ', -1);
+		return 0;
+	}
 	else if (!strcmp(subkey, "url")) {
 		if (!value)
 			return config_error_nonbool(key);
diff --git a/remote.h b/remote.h
index b901b56746d..c18e68e0d8d 100644
--- a/remote.h
+++ b/remote.h
@@ -5,6 +5,7 @@ 
 #include "hashmap.h"
 #include "refspec.h"
 #include "strvec.h"
+#include "string-list.h"
 
 struct option;
 struct transport_ls_refs_options;
@@ -77,6 +78,8 @@  struct remote {
 
 	struct refspec fetch;
 
+	struct string_list prefetch_refs;
+
 	/*
 	 * The setting for whether to fetch tags (as a separate rule from the
 	 * configured refspecs);
diff --git a/t/t7900-maintenance.sh b/t/t7900-maintenance.sh
index abae7a97546..5b64257eb7d 100755
--- a/t/t7900-maintenance.sh
+++ b/t/t7900-maintenance.sh
@@ -245,6 +245,86 @@  test_expect_success 'prefetch multiple remotes' '
 	test_subcommand git fetch remote2 $fetchargs <skip-remote1.txt
 '
 
+test_expect_success 'prefetch with positive prefetch ref patterns' '
+	test_create_repo filter-prefetch-positive &&
+	(
+		cd filter-prefetch-positive &&
+		test_commit initial &&
+		git clone . clone2 &&
+		git remote add remote2 "file://$(pwd)/clone2" &&
+
+		cd clone2 &&
+		git checkout -b feature && test_commit feature-commit-2 &&
+		git checkout -b wip/test && test_commit wip-test-commit-2 &&
+		git checkout -b topic/x && test_commit topic-x-commit-2 &&
+		git push -f origin feature wip/test topic/x&&
+		cd .. &&
+
+		git config remote.remote2.prefetchref "refs/heads/feature" &&
+		fetchargs="--prefetch --prune --no-tags --no-write-fetch-head --recurse-submodules=no --quiet" &&
+		GIT_TRACE2_EVENT="$(pwd)/prefetch-positive.txt" git maintenance run --task=prefetch 2>/dev/null &&
+		test_subcommand git fetch remote2 $fetchargs <prefetch-positive.txt &&
+
+		git rev-parse refs/prefetch/remotes/remote2/feature &&
+		test_must_fail git rev-parse refs/prefetch/remotes/remote2/wip/test &&
+		test_must_fail git rev-parse refs/prefetch/remotes/remote2/topic/x
+	)
+'
+
+test_expect_success 'prefetch with negative prefetch ref patterns' '
+	test_create_repo filter-prefetch-negative &&
+	(
+		cd filter-prefetch-negative &&
+		test_commit initial &&
+		git clone . clone3 &&
+		git remote add remote3 "file://$(pwd)/clone3" &&
+		cat .git/config &&
+
+		cd clone3 &&
+		git checkout -b feature && test_commit feature-commit-3 &&
+		git checkout -b wip/test && test_commit wip-test-commit-3 &&
+		git checkout -b topic/x && test_commit topic-x-commit-3 &&
+		git push -f origin feature wip/test topic/x &&
+		cd .. &&
+
+		git config remote.remote3.prefetchref "!refs/heads/wip/*" &&
+		fetchargs="--prefetch --prune --no-tags --no-write-fetch-head --recurse-submodules=no --quiet" &&
+		GIT_TRACE2_EVENT="$(pwd)/prefetch-negative.txt" git maintenance run --task=prefetch 2>/dev/null &&
+		test_subcommand git fetch remote3 $fetchargs <prefetch-negative.txt &&
+		git rev-parse refs/prefetch/remotes/remote3/feature &&
+		git rev-parse refs/prefetch/remotes/remote3/topic/x &&
+		test_must_fail git rev-parse refs/prefetch/remotes/remote3/wip/test
+	)
+'
+
+test_expect_success 'prefetch with positive & negative prefetch ref patterns' '
+	test_create_repo filter-prefetch-mixed &&
+	(
+		cd filter-prefetch-mixed &&
+		test_commit initial &&
+		git clone . clone4 &&
+		git remote add remote4 "file://$(pwd)/clone4" &&
+
+		cd clone4 &&
+		git checkout -b feature && test_commit feature-commit-4 &&
+		git checkout -b topic/x && test_commit topic-x-commit-4 &&
+		git checkout -b topic/y && test_commit topic-y-commit-4 &&
+		git push -f origin feature topic/x topic/y &&
+		cd .. &&
+
+		git config remote.remote4.prefetchref "refs/heads/topic/* !refs/heads/topic/y" &&
+		# git config --add remote.remote4.prefetchref "!refs/topic/y" &&
+		cat .git/config &&
+		fetchargs="--prefetch --prune --no-tags --no-write-fetch-head --recurse-submodules=no --quiet" &&
+		GIT_TRACE2_EVENT="$(pwd)/prefetch-mixed.txt" git maintenance run --task=prefetch 2>/dev/null &&
+		test_subcommand git fetch remote4 $fetchargs <prefetch-mixed.txt &&
+
+		test_must_fail git rev-parse refs/prefetch/remotes/remote4/feature &&
+		test_must_fail git rev-parse refs/prefetch/remotes/remote4/topic/y &&
+		git rev-parse refs/prefetch/remotes/remote4/topic/x
+	)
+'
+
 test_expect_success 'loose-objects task' '
 	# Repack everything so we know the state of the object dir
 	git repack -adk &&