Skip to content

Commit

Permalink
path-walk: allow consumer to specify object types
Browse files Browse the repository at this point in the history
We add the ability to filter the object types in the path-walk API so
the callback function is called fewer times.

This also adds the ability to receive the walked commits as a single
list. Future changes will add the ability to visit annotated tags.

Signed-off-by: Derrick Stolee <stolee@gmail.com>
  • Loading branch information
derrickstolee authored and dscho committed Sep 26, 2024
1 parent 017e36a commit 3289262
Show file tree
Hide file tree
Showing 5 changed files with 141 additions and 9 deletions.
9 changes: 9 additions & 0 deletions Documentation/technical/api-path-walk.txt
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,15 @@ If you want the path-walk API to emit `UNINTERESTING` objects based on the
commit walk's boundary, be sure to set `revs.boundary` so the boundary
commits are emitted.

`commits`, `blobs`, `trees`::
By default, these members are enabled and signal that the path-walk
API should call the `path_fn` on objects of these types. Specialized
applications could disable some options to make it simpler to walk
the objects or to have fewer calls to `path_fn`.
+
While it is possible to walk only commits in this way, consumers would be
better off using the revision walk API instead.

Examples
--------

Expand Down
39 changes: 33 additions & 6 deletions path-walk.c
Original file line number Diff line number Diff line change
Expand Up @@ -84,6 +84,10 @@ static int add_children(struct path_walk_context *ctx,
if (S_ISGITLINK(entry.mode))
continue;

/* If the caller doesn't want blobs, then don't bother. */
if (!ctx->info->blobs && type == OBJ_BLOB)
continue;

if (type == OBJ_TREE) {
struct tree *child = lookup_tree(ctx->repo, &entry.oid);
o = child ? &child->object : NULL;
Expand Down Expand Up @@ -140,9 +144,11 @@ static int walk_path(struct path_walk_context *ctx,

list = strmap_get(&ctx->paths_to_lists, path);

/* Evaluate function pointer on this data. */
ret = ctx->info->path_fn(path, &list->oids, list->type,
ctx->info->path_fn_data);
/* Evaluate function pointer on this data, if requested. */
if ((list->type == OBJ_TREE && ctx->info->trees) ||
(list->type == OBJ_BLOB && ctx->info->blobs))
ret = ctx->info->path_fn(path, &list->oids, list->type,
ctx->info->path_fn_data);

/* Expand data for children. */
if (list->type == OBJ_TREE) {
Expand Down Expand Up @@ -184,6 +190,7 @@ int walk_objects_by_path(struct path_walk_info *info)
size_t commits_nr = 0, paths_nr = 0;
struct commit *c;
struct type_and_oid_list *root_tree_list;
struct type_and_oid_list *commit_list;
struct path_walk_context ctx = {
.repo = info->revs->repo,
.revs = info->revs,
Expand All @@ -194,19 +201,32 @@ int walk_objects_by_path(struct path_walk_info *info)

trace2_region_enter("path-walk", "commit-walk", info->revs->repo);

CALLOC_ARRAY(commit_list, 1);
commit_list->type = OBJ_COMMIT;

/* Insert a single list for the root tree into the paths. */
CALLOC_ARRAY(root_tree_list, 1);
root_tree_list->type = OBJ_TREE;
strmap_put(&ctx.paths_to_lists, root_path, root_tree_list);

if (prepare_revision_walk(info->revs))
die(_("failed to setup revision walk"));

while ((c = get_revision(info->revs))) {
struct object_id *oid = get_commit_tree_oid(c);
struct tree *t = lookup_tree(info->revs->repo, oid);
struct object_id *oid;
struct tree *t;
commits_nr++;

if (info->commits)
oid_array_append(&commit_list->oids,
&c->object.oid);

/* If we only care about commits, then skip trees. */
if (!info->trees && !info->blobs)
continue;

oid = get_commit_tree_oid(c);
t = lookup_tree(info->revs->repo, oid);

if (t)
oid_array_append(&root_tree_list->oids, oid);
else
Expand All @@ -216,6 +236,13 @@ int walk_objects_by_path(struct path_walk_info *info)
trace2_data_intmax("path-walk", ctx.repo, "commits", commits_nr);
trace2_region_leave("path-walk", "commit-walk", info->revs->repo);

/* Track all commits. */
if (info->commits)
ret = info->path_fn("", &commit_list->oids, OBJ_COMMIT,
info->path_fn_data);
oid_array_clear(&commit_list->oids);
free(commit_list);

string_list_append(&ctx.path_stack, root_path);

trace2_region_enter("path-walk", "path-walk", info->revs->repo);
Expand Down
13 changes: 12 additions & 1 deletion path-walk.h
Original file line number Diff line number Diff line change
Expand Up @@ -30,9 +30,20 @@ struct path_walk_info {
*/
path_fn path_fn;
void *path_fn_data;
/**
* Select which object types the path_fn should be called on. Each
* member is used as a boolean flag. Clearing 'blobs' additionally
* lets the walk skip blob entries instead of collecting them.
*/
int commits;
int trees;
int blobs;
};

#define PATH_WALK_INFO_INIT { 0 }
/*
* Default initializer for struct path_walk_info: the 'blobs', 'trees',
* and 'commits' members are all set to 1, so every one of those object
* types is enabled unless the caller clears a member afterwards.
*/
#define PATH_WALK_INFO_INIT { \
.blobs = 1, \
.trees = 1, \
.commits = 1, \
}

/**
* Given the configuration of 'info', walk the commits based on 'info->revs' and
Expand Down
17 changes: 15 additions & 2 deletions t/helper/test-path-walk.c
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ static const char * const path_walk_usage[] = {
};

/*
* Per-type object totals for the test helper. cmd__path_walk() prints
* them as "commits:", "trees:" and "blobs:" after the walk finishes.
*/
struct path_walk_test_data {
/* Grows by oids->nr for each OBJ_COMMIT batch seen by emit_block(). */
uintmax_t commit_nr;
/* Grows by oids->nr for each OBJ_TREE batch seen by emit_block(). */
uintmax_t tree_nr;
/* Presumably grows the same way for OBJ_BLOB batches -- TODO confirm. */
uintmax_t blob_nr;
};
Expand All @@ -29,6 +30,11 @@ static int emit_block(const char *path, struct oid_array *oids,
const char *typestr;

switch (type) {
case OBJ_COMMIT:
typestr = "COMMIT";
tdata->commit_nr += oids->nr;
break;

case OBJ_TREE:
typestr = "TREE";
tdata->tree_nr += oids->nr;
Expand Down Expand Up @@ -56,6 +62,12 @@ int cmd__path_walk(int argc, const char **argv)
struct path_walk_info info = PATH_WALK_INFO_INIT;
struct path_walk_test_data data = { 0 };
struct option options[] = {
OPT_BOOL(0, "blobs", &info.blobs,
N_("toggle inclusion of blob objects")),
OPT_BOOL(0, "commits", &info.commits,
N_("toggle inclusion of commit objects")),
OPT_BOOL(0, "trees", &info.trees,
N_("toggle inclusion of tree objects")),
OPT_END(),
};

Expand All @@ -78,9 +90,10 @@ int cmd__path_walk(int argc, const char **argv)

res = walk_objects_by_path(&info);

printf("trees:%" PRIuMAX "\n"
printf("commits:%" PRIuMAX "\n"
"trees:%" PRIuMAX "\n"
"blobs:%" PRIuMAX "\n",
data.tree_nr, data.blob_nr);
data.commit_nr, data.tree_nr, data.blob_nr);

return res;
}
72 changes: 72 additions & 0 deletions t/t6601-path-walk.sh
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,11 @@ test_expect_success 'all' '
test-tool path-walk -- --all >out &&
cat >expect <<-EOF &&
COMMIT::$(git rev-parse topic)
COMMIT::$(git rev-parse base)
COMMIT::$(git rev-parse base~1)
COMMIT::$(git rev-parse base~2)
commits:4
TREE::$(git rev-parse topic^{tree})
TREE::$(git rev-parse base^{tree})
TREE::$(git rev-parse base~1^{tree})
Expand Down Expand Up @@ -60,6 +65,10 @@ test_expect_success 'topic only' '
test-tool path-walk -- topic >out &&
cat >expect <<-EOF &&
COMMIT::$(git rev-parse topic)
COMMIT::$(git rev-parse base~1)
COMMIT::$(git rev-parse base~2)
commits:3
TREE::$(git rev-parse topic^{tree})
TREE::$(git rev-parse base~1^{tree})
TREE::$(git rev-parse base~2^{tree})
Expand All @@ -86,6 +95,8 @@ test_expect_success 'topic, not base' '
test-tool path-walk -- topic --not base >out &&
cat >expect <<-EOF &&
COMMIT::$(git rev-parse topic)
commits:1
TREE::$(git rev-parse topic^{tree})
TREE:left/:$(git rev-parse topic:left)
TREE:right/:$(git rev-parse topic:right)
Expand All @@ -103,10 +114,71 @@ test_expect_success 'topic, not base' '
test_cmp expect.sorted out.sorted
'

# With --no-trees and --no-commits, only BLOB lines should be emitted
# and the commit and tree totals should both be zero.
test_expect_success 'topic, not base, only blobs' '
test-tool path-walk --no-trees --no-commits \
-- topic --not base >out &&
cat >expect <<-EOF &&
commits:0
trees:0
BLOB:a:$(git rev-parse topic:a)
BLOB:left/b:$(git rev-parse topic:left/b)
BLOB:right/c:$(git rev-parse topic:right/c)
BLOB:right/d:$(git rev-parse topic:right/d)
blobs:4
EOF
sort expect >expect.sorted &&
sort out >out.sorted &&
test_cmp expect.sorted out.sorted
'

# Walking only commits is better served by the revision walk API,
# but the path-walk API allows it, so verify that only the COMMIT
# line is emitted and that the tree and blob totals are zero.
test_expect_success 'topic, not base, only commits' '
test-tool path-walk --no-blobs --no-trees \
-- topic --not base >out &&
cat >expect <<-EOF &&
COMMIT::$(git rev-parse topic)
commits:1
trees:0
blobs:0
EOF
sort expect >expect.sorted &&
sort out >out.sorted &&
test_cmp expect.sorted out.sorted
'

# With --no-blobs and --no-commits, only TREE lines should be emitted
# and the commit and blob totals should both be zero.
test_expect_success 'topic, not base, only trees' '
test-tool path-walk --no-blobs --no-commits \
-- topic --not base >out &&
cat >expect <<-EOF &&
commits:0
TREE::$(git rev-parse topic^{tree})
TREE:left/:$(git rev-parse topic:left)
TREE:right/:$(git rev-parse topic:right)
trees:3
blobs:0
EOF
sort expect >expect.sorted &&
sort out >out.sorted &&
test_cmp expect.sorted out.sorted
'

test_expect_success 'topic, not base, boundary' '
test-tool path-walk -- --boundary topic --not base >out &&
cat >expect <<-EOF &&
COMMIT::$(git rev-parse topic)
COMMIT::$(git rev-parse base~1)
commits:2
TREE::$(git rev-parse topic^{tree})
TREE::$(git rev-parse base~1^{tree})
TREE:left/:$(git rev-parse base~1:left)
Expand Down

0 comments on commit 3289262

Please sign in to comment.