2018-03-15 18:31:19 +01:00
|
|
|
#include "cache.h"
|
|
|
|
#include "repository.h"
|
|
|
|
#include "config.h"
|
|
|
|
#include "pkt-line.h"
|
|
|
|
#include "version.h"
|
2020-07-28 22:23:39 +02:00
|
|
|
#include "strvec.h"
|
2018-03-15 18:31:20 +01:00
|
|
|
#include "ls-refs.h"
|
2021-04-21 01:38:31 +02:00
|
|
|
#include "protocol-caps.h"
|
2018-03-15 18:31:19 +01:00
|
|
|
#include "serve.h"
|
2018-03-15 18:31:27 +01:00
|
|
|
#include "upload-pack.h"
|
2018-03-15 18:31:19 +01:00
|
|
|
|
2020-11-12 00:29:29 +01:00
|
|
|
/*
 * Whether the "session-id" capability is advertised.  Loaded from the
 * "transfer.advertisesid" config in serve() and consulted by
 * session_id_advertise().
 */
static int advertise_sid;
|
|
|
|
|
2018-03-15 18:31:20 +01:00
|
|
|
/*
 * Advertise callback for capabilities that are unconditionally
 * available and carry no value: neither argument is touched.
 */
static int always_advertise(struct repository *r, struct strbuf *value)
{
	return 1;
}
|
|
|
|
|
2018-03-15 18:31:19 +01:00
|
|
|
/*
 * Advertise callback for "agent".  Always advertised; when the caller
 * supplies a 'value' buffer, the sanitized user agent string is
 * appended to it.
 */
static int agent_advertise(struct repository *r, struct strbuf *value)
{
	if (!value)
		return 1;

	strbuf_addstr(value, git_user_agent_sanitized());
	return 1;
}
|
|
|
|
|
2020-05-25 21:59:17 +02:00
|
|
|
static int object_format_advertise(struct repository *r,
|
|
|
|
struct strbuf *value)
|
|
|
|
{
|
|
|
|
if (value)
|
|
|
|
strbuf_addstr(value, r->hash_algo->name);
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2020-11-12 00:29:29 +01:00
|
|
|
static int session_id_advertise(struct repository *r, struct strbuf *value)
|
|
|
|
{
|
|
|
|
if (!advertise_sid)
|
|
|
|
return 0;
|
|
|
|
if (value)
|
|
|
|
strbuf_addstr(value, trace2_session_id());
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2018-03-15 18:31:19 +01:00
|
|
|
/* Describes one protocol v2 capability (which may also be a command). */
struct protocol_capability {
	/*
	 * Name of the capability.  This is the string the server puts in
	 * its advertisement and the string a client sends back to select
	 * the capability.
	 */
	const char *name;

	/*
	 * Callback deciding whether the capability is advertised; a
	 * non-zero return means "advertise".  The callback may append a
	 * value to 'value', in which case the server advertises
	 * "<name>=<value>" rather than just "<name>".  'value' may be NULL
	 * when the caller only wants the yes/no answer.
	 */
	int (*advertise)(struct repository *r, struct strbuf *value);

	/*
	 * Callback run when a client requests this capability as a
	 * command.  'keys' holds the capabilities the client requested and
	 * 'request' is the packet reader from which the command must read
	 * its command-specific arguments.  Every command MUST read until a
	 * flush packet is seen before sending a response.
	 *
	 * NULL for capabilities that are not commands.
	 */
	int (*command)(struct repository *r,
		       struct strvec *keys,
		       struct packet_reader *request);
};
|
|
|
|
|
|
|
|
static struct protocol_capability capabilities[] = {
|
|
|
|
{ "agent", agent_advertise, NULL },
|
ls-refs: report unborn targets of symrefs
When cloning, we choose the default branch based on the remote HEAD.
But if there is no remote HEAD reported (which could happen if the
target of the remote HEAD is unborn), we'll fall back to using our local
init.defaultBranch. Traditionally this hasn't been a big deal, because
most repos used "master" as the default. But these days it is likely to
cause confusion if the server and client implementations choose
different values (e.g., if the remote started with "main", we may choose
"master" locally, create commits there, and then the user is surprised
when they push to "master" and not "main").
To solve this, the remote needs to communicate the target of the HEAD
symref, even if it is unborn, and "git clone" needs to use this
information.
Currently, symrefs that have unborn targets (such as in this case) are
not communicated by the protocol. Teach Git to advertise and support the
"unborn" feature in "ls-refs" (by default, this is advertised, but
server administrators may turn this off through the lsrefs.unborn
config). This feature indicates that "ls-refs" supports the "unborn"
argument; when it is specified, "ls-refs" will send the HEAD symref with
the name of its unborn target.
This change is only for protocol v2. A similar change for protocol v0
would require independent protocol design (there being no analogous
position to signal support for "unborn") and client-side plumbing of the
data required, so the scope of this patch set is limited to protocol v2.
The client side will be updated to use this in a subsequent commit.
Signed-off-by: Jonathan Tan <jonathantanmy@google.com>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
2021-02-05 21:48:47 +01:00
|
|
|
{ "ls-refs", ls_refs_advertise, ls_refs },
|
2018-03-15 18:31:28 +01:00
|
|
|
{ "fetch", upload_pack_advertise, upload_pack_v2 },
|
2018-04-24 00:46:22 +02:00
|
|
|
{ "server-option", always_advertise, NULL },
|
2020-05-25 21:59:17 +02:00
|
|
|
{ "object-format", object_format_advertise, NULL },
|
2020-11-12 00:29:29 +01:00
|
|
|
{ "session-id", session_id_advertise, NULL },
|
2021-04-21 01:38:31 +02:00
|
|
|
{ "object-info", always_advertise, cap_object_info },
|
2018-03-15 18:31:19 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
static void advertise_capabilities(void)
|
|
|
|
{
|
|
|
|
struct strbuf capability = STRBUF_INIT;
|
|
|
|
struct strbuf value = STRBUF_INIT;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < ARRAY_SIZE(capabilities); i++) {
|
|
|
|
struct protocol_capability *c = &capabilities[i];
|
|
|
|
|
|
|
|
if (c->advertise(the_repository, &value)) {
|
|
|
|
strbuf_addstr(&capability, c->name);
|
|
|
|
|
|
|
|
if (value.len) {
|
|
|
|
strbuf_addch(&capability, '=');
|
|
|
|
strbuf_addbuf(&capability, &value);
|
|
|
|
}
|
|
|
|
|
|
|
|
strbuf_addch(&capability, '\n');
|
|
|
|
packet_write(1, capability.buf, capability.len);
|
|
|
|
}
|
|
|
|
|
|
|
|
strbuf_reset(&capability);
|
|
|
|
strbuf_reset(&value);
|
|
|
|
}
|
|
|
|
|
|
|
|
packet_flush(1);
|
|
|
|
strbuf_release(&capability);
|
|
|
|
strbuf_release(&value);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct protocol_capability *get_capability(const char *key)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
if (!key)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
for (i = 0; i < ARRAY_SIZE(capabilities); i++) {
|
|
|
|
struct protocol_capability *c = &capabilities[i];
|
|
|
|
const char *out;
|
|
|
|
if (skip_prefix(key, c->name, &out) && (!*out || *out == '='))
|
|
|
|
return c;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int is_valid_capability(const char *key)
|
|
|
|
{
|
|
|
|
const struct protocol_capability *c = get_capability(key);
|
|
|
|
|
|
|
|
return c && c->advertise(the_repository, NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int is_command(const char *key, struct protocol_capability **command)
|
|
|
|
{
|
|
|
|
const char *out;
|
|
|
|
|
|
|
|
if (skip_prefix(key, "command=", &out)) {
|
|
|
|
struct protocol_capability *cmd = get_capability(out);
|
|
|
|
|
|
|
|
if (*command)
|
|
|
|
die("command '%s' requested after already requesting command '%s'",
|
|
|
|
out, (*command)->name);
|
|
|
|
if (!cmd || !cmd->advertise(the_repository, NULL) || !cmd->command)
|
|
|
|
die("invalid command '%s'", out);
|
|
|
|
|
|
|
|
*command = cmd;
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-07-28 22:25:12 +02:00
|
|
|
int has_capability(const struct strvec *keys, const char *capability,
|
2018-03-15 18:31:19 +01:00
|
|
|
const char **value)
|
|
|
|
{
|
|
|
|
int i;
|
2020-07-29 02:37:20 +02:00
|
|
|
for (i = 0; i < keys->nr; i++) {
|
2018-03-15 18:31:19 +01:00
|
|
|
const char *out;
|
2020-07-29 02:37:20 +02:00
|
|
|
if (skip_prefix(keys->v[i], capability, &out) &&
|
2018-03-15 18:31:19 +01:00
|
|
|
(!*out || *out == '=')) {
|
|
|
|
if (value) {
|
|
|
|
if (*out == '=')
|
|
|
|
out++;
|
|
|
|
*value = out;
|
|
|
|
}
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-07-28 22:25:12 +02:00
|
|
|
static void check_algorithm(struct repository *r, struct strvec *keys)
|
2020-05-25 21:59:17 +02:00
|
|
|
{
|
|
|
|
int client = GIT_HASH_SHA1, server = hash_algo_by_ptr(r->hash_algo);
|
|
|
|
const char *algo_name;
|
|
|
|
|
|
|
|
if (has_capability(keys, "object-format", &algo_name)) {
|
|
|
|
client = hash_algo_by_name(algo_name);
|
|
|
|
if (client == GIT_HASH_UNKNOWN)
|
|
|
|
die("unknown object format '%s'", algo_name);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (client != server)
|
|
|
|
die("mismatched object format: server %s; client %s\n",
|
|
|
|
r->hash_algo->name, hash_algos[client].name);
|
|
|
|
}
|
|
|
|
|
2018-03-15 18:31:19 +01:00
|
|
|
/* Progress of process_request() through the key section of a request. */
enum request_state {
	/* Still collecting "command=" and capability lines. */
	PROCESS_REQUEST_KEYS,
	/* A delim or flush packet ended the key section. */
	PROCESS_REQUEST_DONE,
};
|
|
|
|
|
|
|
|
static int process_request(void)
|
|
|
|
{
|
|
|
|
enum request_state state = PROCESS_REQUEST_KEYS;
|
|
|
|
struct packet_reader reader;
|
2020-07-28 22:25:12 +02:00
|
|
|
struct strvec keys = STRVEC_INIT;
|
2018-03-15 18:31:19 +01:00
|
|
|
struct protocol_capability *command = NULL;
|
2020-11-12 00:29:32 +01:00
|
|
|
const char *client_sid;
|
2018-03-15 18:31:19 +01:00
|
|
|
|
|
|
|
packet_reader_init(&reader, 0, NULL, 0,
|
|
|
|
PACKET_READ_CHOMP_NEWLINE |
|
pack-protocol.txt: accept error packets in any context
In the Git pack protocol definition, an error packet may appear only in
a certain context. However, servers can face a runtime error (e.g. I/O
error) at an arbitrary timing. This patch changes the protocol to allow
an error packet to be sent instead of any packet.
Without this protocol spec change, when a server cannot process a
request, there's no way to tell that to a client. Since the server
cannot produce a valid response, it would be forced to cut a connection
without telling why. With this protocol spec change, the server can be
more gentle in this situation. An old client may see these error packets
as an unexpected packet, but this is not worse than having an unexpected
EOF.
Following this protocol spec change, the error packet handling code is
moved to pkt-line.c. Implementation wise, this implementation uses
pkt-line to communicate with a subprocess. Since this is not a part of
Git protocol, it's possible that a packet that is not supposed to be an
error packet is mistakenly parsed as an error packet. This error packet
handling is enabled only for the Git pack protocol parsing code
considering this.
Signed-off-by: Masaya Suzuki <masayasuzuki@google.com>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
2018-12-29 22:19:15 +01:00
|
|
|
PACKET_READ_GENTLE_ON_EOF |
|
|
|
|
PACKET_READ_DIE_ON_ERR_PACKET);
|
2018-03-15 18:31:19 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Check to see if the client closed their end before sending another
|
|
|
|
* request. If so we can terminate the connection.
|
|
|
|
*/
|
|
|
|
if (packet_reader_peek(&reader) == PACKET_READ_EOF)
|
|
|
|
return 1;
|
pack-protocol.txt: accept error packets in any context
In the Git pack protocol definition, an error packet may appear only in
a certain context. However, servers can face a runtime error (e.g. I/O
error) at an arbitrary timing. This patch changes the protocol to allow
an error packet to be sent instead of any packet.
Without this protocol spec change, when a server cannot process a
request, there's no way to tell that to a client. Since the server
cannot produce a valid response, it would be forced to cut a connection
without telling why. With this protocol spec change, the server can be
more gentle in this situation. An old client may see these error packets
as an unexpected packet, but this is not worse than having an unexpected
EOF.
Following this protocol spec change, the error packet handling code is
moved to pkt-line.c. Implementation wise, this implementation uses
pkt-line to communicate with a subprocess. Since this is not a part of
Git protocol, it's possible that a packet that is not supposed to be an
error packet is mistakenly parsed as an error packet. This error packet
handling is enabled only for the Git pack protocol parsing code
considering this.
Signed-off-by: Masaya Suzuki <masayasuzuki@google.com>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
2018-12-29 22:19:15 +01:00
|
|
|
reader.options &= ~PACKET_READ_GENTLE_ON_EOF;
|
2018-03-15 18:31:19 +01:00
|
|
|
|
|
|
|
while (state != PROCESS_REQUEST_DONE) {
|
|
|
|
switch (packet_reader_peek(&reader)) {
|
|
|
|
case PACKET_READ_EOF:
|
|
|
|
BUG("Should have already died when seeing EOF");
|
|
|
|
case PACKET_READ_NORMAL:
|
|
|
|
/* collect request; a sequence of keys and values */
|
|
|
|
if (is_command(reader.line, &command) ||
|
|
|
|
is_valid_capability(reader.line))
|
2020-07-28 22:25:12 +02:00
|
|
|
strvec_push(&keys, reader.line);
|
2018-03-15 18:31:19 +01:00
|
|
|
else
|
|
|
|
die("unknown capability '%s'", reader.line);
|
|
|
|
|
|
|
|
/* Consume the peeked line */
|
|
|
|
packet_reader_read(&reader);
|
|
|
|
break;
|
|
|
|
case PACKET_READ_FLUSH:
|
|
|
|
/*
|
|
|
|
* If no command and no keys were given then the client
|
|
|
|
* wanted to terminate the connection.
|
|
|
|
*/
|
2020-07-29 02:37:20 +02:00
|
|
|
if (!keys.nr)
|
2018-03-15 18:31:19 +01:00
|
|
|
return 1;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* The flush packet isn't consume here like it is in
|
|
|
|
* the other parts of this switch statement. This is
|
|
|
|
* so that the command can read the flush packet and
|
|
|
|
* see the end of the request in the same way it would
|
|
|
|
* if command specific arguments were provided after a
|
|
|
|
* delim packet.
|
|
|
|
*/
|
|
|
|
state = PROCESS_REQUEST_DONE;
|
|
|
|
break;
|
|
|
|
case PACKET_READ_DELIM:
|
|
|
|
/* Consume the peeked line */
|
|
|
|
packet_reader_read(&reader);
|
|
|
|
|
|
|
|
state = PROCESS_REQUEST_DONE;
|
|
|
|
break;
|
2020-05-19 12:53:59 +02:00
|
|
|
case PACKET_READ_RESPONSE_END:
|
2021-07-09 04:27:22 +02:00
|
|
|
BUG("unexpected response end packet");
|
2018-03-15 18:31:19 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!command)
|
|
|
|
die("no command requested");
|
|
|
|
|
2020-05-25 21:59:17 +02:00
|
|
|
check_algorithm(the_repository, &keys);
|
|
|
|
|
2020-11-12 00:29:32 +01:00
|
|
|
if (has_capability(&keys, "session-id", &client_sid))
|
|
|
|
trace2_data_string("transfer", NULL, "client-sid", client_sid);
|
|
|
|
|
2018-03-15 18:31:19 +01:00
|
|
|
command->command(the_repository, &keys, &reader);
|
|
|
|
|
2020-07-28 22:25:12 +02:00
|
|
|
strvec_clear(&keys);
|
2018-03-15 18:31:19 +01:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Main serve loop for protocol version 2 */
|
|
|
|
void serve(struct serve_options *options)
|
|
|
|
{
|
2020-11-12 00:29:29 +01:00
|
|
|
git_config_get_bool("transfer.advertisesid", &advertise_sid);
|
|
|
|
|
2018-03-15 18:31:19 +01:00
|
|
|
if (options->advertise_capabilities || !options->stateless_rpc) {
|
|
|
|
/* serve by default supports v2 */
|
|
|
|
packet_write_fmt(1, "version 2\n");
|
|
|
|
|
|
|
|
advertise_capabilities();
|
|
|
|
/*
|
|
|
|
* If only the list of capabilities was requested exit
|
|
|
|
* immediately after advertising capabilities
|
|
|
|
*/
|
|
|
|
if (options->advertise_capabilities)
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If stateless-rpc was requested then exit after
|
|
|
|
* a single request/response exchange
|
|
|
|
*/
|
|
|
|
if (options->stateless_rpc) {
|
|
|
|
process_request();
|
|
|
|
} else {
|
|
|
|
for (;;)
|
|
|
|
if (process_request())
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|