Support delimited data regions in fast-import.

During testing its nice to not have to feed the length of a data
chunk to the 'data' command of fast-import.  Instead we would
prefer to be able to establish a data chunk much like shell's <<
operator and use a line delimiter to denote the end of the input.

So now if a data command is started as 'data <<EOF' we will look
for a terminator line containing only the string EOF on that line.
Once found, we stop the data command.  Everything between the two
lines is used as the data value.

The 'data <<' syntax is slower than 'data n', as we don't know how
many bytes to expect and instead must grow our buffer on the fly.
It also has the problem that the frontend must use a string which
will not appear on a line by itself in the input, and the data
region will always end in an LF.  For these reasons real import
frontends are encouraged to continue to use _only_ 'data n'.

Signed-off-by: Shawn O. Pearce <spearce@spearce.org>
This commit is contained in:
Shawn O. Pearce 2007-01-18 13:14:27 -05:00
parent e5808826c4
commit 3b4dce0275

View File

@ -50,14 +50,21 @@ Format of STDIN stream:
# a new mark directive with the old idnum. # a new mark directive with the old idnum.
# #
mark ::= 'mark' sp idnum lf; mark ::= 'mark' sp idnum lf;
data ::= (delimited_data | exact_data)
lf;
# note: delim may be any string but must not contain lf.
# data_line may contain any data but must not be exactly
# delim.
delimited_data ::= 'data' sp '<<' delim lf
(data_line lf)*
delim lf;
# note: declen indicates the length of binary_data in bytes. # note: declen indicates the length of binary_data in bytes.
# declen does not include the lf preceeding or trailing the # declen does not include the lf preceeding the binary data.
# binary data.
# #
data ::= 'data' sp declen lf exact_data ::= 'data' sp declen lf
binary_data binary_data;
lf;
# note: quoted strings are C-style quoting supporting \c for # note: quoted strings are C-style quoting supporting \c for
# common escapes of 'c' (e..g \n, \t, \\, \") or \nnn where nnn # common escapes of 'c' (e..g \n, \t, \\, \") or \nnn where nnn
@ -1334,22 +1341,49 @@ static void cmd_mark(void)
static void* cmd_data (size_t *size) static void* cmd_data (size_t *size)
{ {
size_t n = 0;
void *buffer;
size_t length; size_t length;
char *buffer;
if (strncmp("data ", command_buf.buf, 5)) if (strncmp("data ", command_buf.buf, 5))
die("Expected 'data n' command, found: %s", command_buf.buf); die("Expected 'data n' command, found: %s", command_buf.buf);
if (!strncmp("<<", command_buf.buf + 5, 2)) {
char *term = xstrdup(command_buf.buf + 5 + 2);
size_t sz = 8192, term_len = command_buf.len - 5 - 2;
length = 0;
buffer = xmalloc(sz);
for (;;) {
read_next_command();
if (command_buf.eof)
die("EOF in data (terminator '%s' not found)", term);
if (term_len == command_buf.len
&& !strcmp(term, command_buf.buf))
break;
if (sz < (length + command_buf.len)) {
sz = sz * 3 / 2 + 16;
if (sz < (length + command_buf.len))
sz = length + command_buf.len;
buffer = xrealloc(buffer, sz);
}
memcpy(buffer + length,
command_buf.buf,
command_buf.len - 1);
length += command_buf.len - 1;
buffer[length++] = '\n';
}
free(term);
}
else {
size_t n = 0;
length = strtoul(command_buf.buf + 5, NULL, 10); length = strtoul(command_buf.buf + 5, NULL, 10);
buffer = xmalloc(length); buffer = xmalloc(length);
while (n < length) { while (n < length) {
size_t s = fread((char*)buffer + n, 1, length - n, stdin); size_t s = fread(buffer + n, 1, length - n, stdin);
if (!s && feof(stdin)) if (!s && feof(stdin))
die("EOF in data (%lu bytes remaining)", length - n); die("EOF in data (%lu bytes remaining)", length - n);
n += s; n += s;
} }
}
if (fgetc(stdin) != '\n') if (fgetc(stdin) != '\n')
die("An lf did not trail the binary data as expected."); die("An lf did not trail the binary data as expected.");