Support delimited data regions in fast-import.
During testing its nice to not have to feed the length of a data chunk to the 'data' command of fast-import. Instead we would prefer to be able to establish a data chunk much like shell's << operator and use a line delimiter to denote the end of the input. So now if a data command is started as 'data <<EOF' we will look for a terminator line containing only the string EOF on that line. Once found, we stop the data command. Everything between the two lines is used as the data value. The 'data <<' syntax is slower than 'data n', as we don't know how many bytes to expect and instead must grow our buffer on the fly. It also has the problem that the frontend must use a string which will not appear on a line by itself in the input, and the data region will always end in an LF. For these reasons real import frontends are encouraged to continue to use _only_ 'data n'. Signed-off-by: Shawn O. Pearce <spearce@spearce.org>
This commit is contained in:
parent
e5808826c4
commit
3b4dce0275
@ -50,14 +50,21 @@ Format of STDIN stream:
|
|||||||
# a new mark directive with the old idnum.
|
# a new mark directive with the old idnum.
|
||||||
#
|
#
|
||||||
mark ::= 'mark' sp idnum lf;
|
mark ::= 'mark' sp idnum lf;
|
||||||
|
data ::= (delimited_data | exact_data)
|
||||||
|
lf;
|
||||||
|
|
||||||
|
# note: delim may be any string but must not contain lf.
|
||||||
|
# data_line may contain any data but must not be exactly
|
||||||
|
# delim.
|
||||||
|
delimited_data ::= 'data' sp '<<' delim lf
|
||||||
|
(data_line lf)*
|
||||||
|
delim lf;
|
||||||
|
|
||||||
# note: declen indicates the length of binary_data in bytes.
|
# note: declen indicates the length of binary_data in bytes.
|
||||||
# declen does not include the lf preceeding or trailing the
|
# declen does not include the lf preceeding the binary data.
|
||||||
# binary data.
|
|
||||||
#
|
#
|
||||||
data ::= 'data' sp declen lf
|
exact_data ::= 'data' sp declen lf
|
||||||
binary_data
|
binary_data;
|
||||||
lf;
|
|
||||||
|
|
||||||
# note: quoted strings are C-style quoting supporting \c for
|
# note: quoted strings are C-style quoting supporting \c for
|
||||||
# common escapes of 'c' (e..g \n, \t, \\, \") or \nnn where nnn
|
# common escapes of 'c' (e..g \n, \t, \\, \") or \nnn where nnn
|
||||||
@ -1334,22 +1341,49 @@ static void cmd_mark(void)
|
|||||||
|
|
||||||
static void* cmd_data (size_t *size)
|
static void* cmd_data (size_t *size)
|
||||||
{
|
{
|
||||||
size_t n = 0;
|
|
||||||
void *buffer;
|
|
||||||
size_t length;
|
size_t length;
|
||||||
|
char *buffer;
|
||||||
|
|
||||||
if (strncmp("data ", command_buf.buf, 5))
|
if (strncmp("data ", command_buf.buf, 5))
|
||||||
die("Expected 'data n' command, found: %s", command_buf.buf);
|
die("Expected 'data n' command, found: %s", command_buf.buf);
|
||||||
|
|
||||||
|
if (!strncmp("<<", command_buf.buf + 5, 2)) {
|
||||||
|
char *term = xstrdup(command_buf.buf + 5 + 2);
|
||||||
|
size_t sz = 8192, term_len = command_buf.len - 5 - 2;
|
||||||
|
length = 0;
|
||||||
|
buffer = xmalloc(sz);
|
||||||
|
for (;;) {
|
||||||
|
read_next_command();
|
||||||
|
if (command_buf.eof)
|
||||||
|
die("EOF in data (terminator '%s' not found)", term);
|
||||||
|
if (term_len == command_buf.len
|
||||||
|
&& !strcmp(term, command_buf.buf))
|
||||||
|
break;
|
||||||
|
if (sz < (length + command_buf.len)) {
|
||||||
|
sz = sz * 3 / 2 + 16;
|
||||||
|
if (sz < (length + command_buf.len))
|
||||||
|
sz = length + command_buf.len;
|
||||||
|
buffer = xrealloc(buffer, sz);
|
||||||
|
}
|
||||||
|
memcpy(buffer + length,
|
||||||
|
command_buf.buf,
|
||||||
|
command_buf.len - 1);
|
||||||
|
length += command_buf.len - 1;
|
||||||
|
buffer[length++] = '\n';
|
||||||
|
}
|
||||||
|
free(term);
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
size_t n = 0;
|
||||||
length = strtoul(command_buf.buf + 5, NULL, 10);
|
length = strtoul(command_buf.buf + 5, NULL, 10);
|
||||||
buffer = xmalloc(length);
|
buffer = xmalloc(length);
|
||||||
|
|
||||||
while (n < length) {
|
while (n < length) {
|
||||||
size_t s = fread((char*)buffer + n, 1, length - n, stdin);
|
size_t s = fread(buffer + n, 1, length - n, stdin);
|
||||||
if (!s && feof(stdin))
|
if (!s && feof(stdin))
|
||||||
die("EOF in data (%lu bytes remaining)", length - n);
|
die("EOF in data (%lu bytes remaining)", length - n);
|
||||||
n += s;
|
n += s;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
if (fgetc(stdin) != '\n')
|
if (fgetc(stdin) != '\n')
|
||||||
die("An lf did not trail the binary data as expected.");
|
die("An lf did not trail the binary data as expected.");
|
||||||
|
Loading…
Reference in New Issue
Block a user