transport: add client support for object-info

Sometimes it is useful to get information about an object without having
to download it completely. The server logic has already been implemented
in “a2ba162cda (object-info: support for retrieving object info,
2021-04-20)”.

Add client functions to communicate with the server.

The client currently supports requesting a list of object ids with
feature 'size' from a v2 server. If a server does not
advertise the feature, then the client falls back
to making the request through 'fetch'.

Helped-by: Jonathan Tan <jonathantanmy@google.com>
Helped-by: Christian Couder <chriscool@tuxfamily.org>
Signed-off-by: Calvin Wan <calvinwan@google.com>
Signed-off-by: Eric Ju  <eric.peijian@gmail.com>
Signed-off-by: Taylor Blau <me@ttaylorr.com>
This commit is contained in:
Calvin Wan
2024-10-28 16:34:55 -04:00
committed by Taylor Blau
parent bc52916980
commit 8c4368da08
8 changed files with 216 additions and 5 deletions

View File

@@ -1024,6 +1024,7 @@ LIB_OBJS += ewah/ewah_rlw.o
LIB_OBJS += exec-cmd.o
LIB_OBJS += fetch-negotiator.o
LIB_OBJS += fetch-pack.o
LIB_OBJS += fetch-object-info.o
LIB_OBJS += fmt-merge-msg.o
LIB_OBJS += fsck.o
LIB_OBJS += fsmonitor.o

95
fetch-object-info.c Normal file
View File

@@ -0,0 +1,95 @@
#include "git-compat-util.h"
#include "gettext.h"
#include "hex.h"
#include "pkt-line.h"
#include "connect.h"
#include "oid-array.h"
#include "object-store-ll.h"
#include "fetch-object-info.h"
#include "string-list.h"
/**
* send_object_info_request sends git-cat-file object-info command and its
* arguments into the request buffer.
*/
static void send_object_info_request(const int fd_out, struct object_info_args *args)
{
struct strbuf req_buf = STRBUF_INIT;
write_command_and_capabilities(&req_buf, "object-info", args->server_options);
if (unsorted_string_list_has_string(args->object_info_options, "size"))
packet_buf_write(&req_buf, "size");
if (args->oids) {
for (size_t i = 0; i < args->oids->nr; i++)
packet_buf_write(&req_buf, "oid %s", oid_to_hex(&args->oids->oid[i]));
}
packet_buf_flush(&req_buf);
if (write_in_full(fd_out, req_buf.buf, req_buf.len) < 0)
die_errno(_("unable to write request to remote"));
strbuf_release(&req_buf);
}
/**
* fetch_object_info sends git-cat-file object-info command into the request buf
* and read the results from packets.
*/
int fetch_object_info(const enum protocol_version version, struct object_info_args *args,
struct packet_reader *reader, struct object_info *object_info_data,
const int stateless_rpc, const int fd_out)
{
int size_index = -1;
switch (version) {
case protocol_v2:
if (!server_supports_v2("object-info"))
return -1;
if (unsorted_string_list_has_string(args->object_info_options, "size")
&& !server_supports_feature("object-info", "size", 0))
return -1;
send_object_info_request(fd_out, args);
break;
case protocol_v1:
case protocol_v0:
die(_("wrong protocol version. expected v2"));
case protocol_unknown_version:
BUG("unknown protocol version");
}
for (size_t i = 0; i < args->object_info_options->nr; i++) {
if (packet_reader_read(reader) != PACKET_READ_NORMAL) {
check_stateless_delimiter(stateless_rpc, reader, "stateless delimiter expected");
return -1;
}
if (unsorted_string_list_has_string(args->object_info_options, reader->line)) {
if (!strcmp(reader->line, "size")) {
size_index = i;
for (size_t j = 0; j < args->oids->nr; j++)
object_info_data[j].sizep = xcalloc(1, sizeof(long));
}
continue;
}
return -1;
}
for (size_t i = 0; packet_reader_read(reader) == PACKET_READ_NORMAL && i < args->oids->nr; i++){
struct string_list object_info_values = STRING_LIST_INIT_DUP;
string_list_split(&object_info_values, reader->line, ' ', -1);
if (0 <= size_index) {
if (!strcmp(object_info_values.items[1 + size_index].string, ""))
die("object-info: not our ref %s",
object_info_values.items[0].string);
*object_info_data[i].sizep = strtoul(object_info_values.items[1 + size_index].string, NULL, 10);
}
string_list_clear(&object_info_values, 0);
}
check_stateless_delimiter(stateless_rpc, reader, "stateless delimiter expected");
return 0;
}

18
fetch-object-info.h Normal file
View File

@@ -0,0 +1,18 @@
#ifndef FETCH_OBJECT_INFO_H
#define FETCH_OBJECT_INFO_H
#include "pkt-line.h"
#include "protocol.h"
#include "object-store-ll.h"
struct object_info_args {
struct string_list *object_info_options;
const struct string_list *server_options;
struct oid_array *oids;
};
/*
 * Send an "object-info" request for args->oids over fd_out and parse the
 * response from reader into object_info_data (indexed like args->oids).
 *
 * Only protocol v2 is supported; v0 and v1 are fatal errors.
 *
 * Returns 0 on success, or -1 if the server does not advertise "object-info"
 * (or the requested "size" feature) or the attribute lines of the response
 * are not the ones requested.
 */
int fetch_object_info(enum protocol_version version, struct object_info_args *args,
struct packet_reader *reader, struct object_info *object_info_data,
int stateless_rpc, int fd_out);
#endif /* FETCH_OBJECT_INFO_H */

View File

@@ -1651,6 +1651,9 @@ static struct ref *do_fetch_pack_v2(struct fetch_pack_args *args,
if (args->depth > 0 || args->deepen_since || args->deepen_not)
args->deepen = 1;
if (args->object_info)
state = FETCH_SEND_REQUEST;
while (state != FETCH_DONE) {
switch (state) {
case FETCH_CHECK_LOCAL:

View File

@@ -16,6 +16,7 @@ struct fetch_pack_args {
const struct string_list *deepen_not;
struct list_objects_filter_options filter_options;
const struct string_list *server_options;
struct object_info *object_info_data;
/*
* If not NULL, during packfile negotiation, fetch-pack will send "have"
@@ -42,6 +43,7 @@ struct fetch_pack_args {
unsigned reject_shallow_remote:1;
unsigned deepen:1;
unsigned refetch:1;
unsigned object_info:1;
/*
* Indicate that the remote of this request is a promisor remote. The

View File

@@ -709,8 +709,8 @@ static int fetch_refs(struct transport *transport,
/*
* If we reach here, then the server, the client, and/or the transport
* helper does not support protocol v2. --negotiate-only requires
* protocol v2.
* helper does not support protocol v2. --negotiate-only and cat-file
* remote-object-info require protocol v2.
*/
if (data->transport_options.acked_commits) {
warning(_("--negotiate-only requires protocol v2"));
@@ -726,6 +726,13 @@ static int fetch_refs(struct transport *transport,
free_refs(dummy);
}
/* fail the command explicitly to avoid further commands input. */
if (transport->smart_options->object_info)
die(_("remote-object-info requires protocol v2"));
if (!data->get_refs_list_called)
get_refs_list_using_list(transport, 0);
count = 0;
for (i = 0; i < nr_heads; i++)
if (!(to_fetch[i]->status & REF_STATUS_UPTODATE))

View File

@@ -9,6 +9,7 @@
#include "hook.h"
#include "pkt-line.h"
#include "fetch-pack.h"
#include "fetch-object-info.h"
#include "remote.h"
#include "connect.h"
#include "send-pack.h"
@@ -418,6 +419,7 @@ static int fetch_refs_via_pack(struct transport *transport,
struct ref *refs = NULL;
struct fetch_pack_args args;
struct ref *refs_tmp = NULL, **to_fetch_dup = NULL;
struct ref *object_info_refs = NULL;
memset(&args, 0, sizeof(args));
args.uploadpack = data->options.uploadpack;
@@ -444,11 +446,71 @@ static int fetch_refs_via_pack(struct transport *transport,
args.server_options = transport->server_options;
args.negotiation_tips = data->options.negotiation_tips;
args.reject_shallow_remote = transport->smart_options->reject_shallow;
args.object_info = transport->smart_options->object_info;
if (!data->finished_handshake) {
int i;
if (transport->smart_options
&& transport->smart_options->object_info
&& transport->smart_options->object_info_oids->nr > 0) {
struct ref *ref_itr = object_info_refs = alloc_ref("");
struct packet_reader reader;
struct object_info_args obj_info_args = { 0 };
obj_info_args.server_options = transport->server_options;
obj_info_args.object_info_options = transport->smart_options->object_info_options;
obj_info_args.oids = transport->smart_options->object_info_oids;
connect_setup(transport, 0);
packet_reader_init(&reader, data->fd[0], NULL, 0,
PACKET_READ_CHOMP_NEWLINE |
PACKET_READ_GENTLE_ON_EOF |
PACKET_READ_DIE_ON_ERR_PACKET);
data->version = discover_version(&reader);
transport->hash_algo = reader.hash_algo;
if (!fetch_object_info(data->version, &obj_info_args, &reader,
data->options.object_info_data, transport->stateless_rpc,
data->fd[1])) {
/*
* If the code reaches here, fetch_object_info is successful and
* remote object info is retrieved from packets (i.e. without
* downloading the objects).
*/
goto cleanup;
}
/*
* If the code reaches here, it means we can't retrieve object info from
* packets, and we will fall back to downloading the pack files.
* We set quiet and no_progress to be true, so that the internal call to
* fetch-pack is less verbose.
*/
args.object_info_data = data->options.object_info_data;
args.quiet = 1;
args.no_progress = 1;
/*
* Allocate memory for object info data according to oids.
* The actual results will be retrieved later from the downloaded
* pack files.
*/
for (size_t i = 0; i < transport->smart_options->object_info_oids->nr; i++) {
ref_itr->old_oid = transport->smart_options->object_info_oids->oid[i];
ref_itr->exact_oid = 1;
if (i == transport->smart_options->object_info_oids->nr - 1)
/* last element, no need to allocate to next */
ref_itr->next = NULL;
else
ref_itr->next = alloc_ref("");
ref_itr = ref_itr->next;
}
transport->remote_refs = object_info_refs;
} else if (!data->finished_handshake) {
int must_list_refs = 0;
for (i = 0; i < nr_heads; i++) {
for (int i = 0; i < nr_heads; i++) {
if (!to_fetch[i]->exact_oid) {
must_list_refs = 1;
break;
@@ -494,6 +556,17 @@ static int fetch_refs_via_pack(struct transport *transport,
&transport->pack_lockfiles, data->version);
data->finished_handshake = 0;
/* Retrieve object info data from the downloaded pack files */
if (args.object_info) {
struct ref *ref_cpy_reader = object_info_refs;
for (int i = 0; ref_cpy_reader; i++) {
oid_object_info_extended(the_repository, &ref_cpy_reader->old_oid,
&args.object_info_data[i], OBJECT_INFO_LOOKUP_REPLACE);
ref_cpy_reader = ref_cpy_reader->next;
}
}
data->options.self_contained_and_connected =
args.self_contained_and_connected;
data->options.connectivity_checked = args.connectivity_checked;
@@ -504,6 +577,7 @@ static int fetch_refs_via_pack(struct transport *transport,
ret = -1;
cleanup:
free_refs(object_info_refs);
close(data->fd[0]);
if (data->fd[1] >= 0)
close(data->fd[1]);

View File

@@ -5,6 +5,7 @@
#include "remote.h"
#include "list-objects-filter-options.h"
#include "string-list.h"
#include "object-store.h"
struct git_transport_options {
unsigned thin : 1;
@@ -30,6 +31,12 @@ struct git_transport_options {
*/
unsigned connectivity_checked:1;
/*
* Transport will attempt to pull only object-info. Falls back
* to pulling the entire object if object-info is not supported.
*/
unsigned object_info : 1;
int depth;
const char *deepen_since;
const struct string_list *deepen_not;
@@ -53,6 +60,10 @@ struct git_transport_options {
* common commits to this oidset instead of fetching any packfiles.
*/
struct oidset *acked_commits;
struct oid_array *object_info_oids;
struct object_info *object_info_data;
struct string_list *object_info_options;
};
enum transport_family {