Merge branch 'sb/daemon'

* sb/daemon:
  daemon.c: minor style fixup
  git-daemon: rewrite kindergarden, new option --max-connections
  git-daemon: Simplify dead-children reaping logic
  git-daemon: use LOG_PID, simplify logging code
  git-daemon: call logerror() instead of error()
This commit is contained in:
Junio C Hamano 2008-08-30 08:17:15 -07:00
commit ff1e8bfcd6
2 changed files with 110 additions and 200 deletions

View File

@ -9,8 +9,9 @@ SYNOPSIS
-------- --------
[verse] [verse]
'git daemon' [--verbose] [--syslog] [--export-all] 'git daemon' [--verbose] [--syslog] [--export-all]
[--timeout=n] [--init-timeout=n] [--strict-paths] [--timeout=n] [--init-timeout=n] [--max-connections=n]
[--base-path=path] [--user-path | --user-path=path] [--strict-paths] [--base-path=path] [--base-path-relaxed]
[--user-path | --user-path=path]
[--interpolated-path=pathtemplate] [--interpolated-path=pathtemplate]
[--reuseaddr] [--detach] [--pid-file=file] [--reuseaddr] [--detach] [--pid-file=file]
[--enable=service] [--disable=service] [--enable=service] [--disable=service]
@ -99,6 +100,10 @@ OPTIONS
it takes for the server to process the sub-request and time spent it takes for the server to process the sub-request and time spent
waiting for next client's request. waiting for next client's request.
--max-connections::
Maximum number of concurrent clients; defaults to 32. Set it to
zero for no limit.
--syslog:: --syslog::
Log to syslog instead of stderr. Note that this option does not imply Log to syslog instead of stderr. Note that this option does not imply
--verbose, thus by default only error conditions will be logged. --verbose, thus by default only error conditions will be logged.

295
daemon.c
View File

@ -16,12 +16,11 @@
static int log_syslog; static int log_syslog;
static int verbose; static int verbose;
static int reuseaddr; static int reuseaddr;
static int child_handler_pipe[2];
static const char daemon_usage[] = static const char daemon_usage[] =
"git daemon [--verbose] [--syslog] [--export-all]\n" "git daemon [--verbose] [--syslog] [--export-all]\n"
" [--timeout=n] [--init-timeout=n] [--strict-paths]\n" " [--timeout=n] [--init-timeout=n] [--max-connections=n]\n"
" [--base-path=path] [--base-path-relaxed]\n" " [--strict-paths] [--base-path=path] [--base-path-relaxed]\n"
" [--user-path | --user-path=path]\n" " [--user-path | --user-path=path]\n"
" [--interpolated-path=path]\n" " [--interpolated-path=path]\n"
" [--reuseaddr] [--detach] [--pid-file=file]\n" " [--reuseaddr] [--detach] [--pid-file=file]\n"
@ -78,38 +77,19 @@ static struct interp interp_table[] = {
static void logreport(int priority, const char *err, va_list params) static void logreport(int priority, const char *err, va_list params)
{ {
/* We should do a single write so that it is atomic and output
* of several processes do not get intermingled. */
char buf[1024];
int buflen;
int maxlen, msglen;
/* sizeof(buf) should be big enough for "[pid] \n" */
buflen = snprintf(buf, sizeof(buf), "[%ld] ", (long) getpid());
maxlen = sizeof(buf) - buflen - 1; /* -1 for our own LF */
msglen = vsnprintf(buf + buflen, maxlen, err, params);
if (log_syslog) { if (log_syslog) {
char buf[1024];
vsnprintf(buf, sizeof(buf), err, params);
syslog(priority, "%s", buf); syslog(priority, "%s", buf);
return; } else {
} /*
* Since stderr is set to linebuffered mode, the
/* maxlen counted our own LF but also counts space given to * logging of different processes will not overlap
* vsnprintf for the terminating NUL. We want to make sure that
* we have space for our own LF and NUL after the "meat" of the
* message, so truncate it at maxlen - 1.
*/ */
if (msglen > maxlen - 1) fprintf(stderr, "[%d] ", (int)getpid());
msglen = maxlen - 1; vfprintf(stderr, err, params);
else if (msglen < 0) fputc('\n', stderr);
msglen = 0; /* Protect against weird return values. */ }
buflen += msglen;
buf[buflen++] = '\n';
buf[buflen] = '\0';
write_in_full(2, buf, buflen);
} }
static void logerror(const char *err, ...) static void logerror(const char *err, ...)
@ -604,69 +584,46 @@ static int execute(struct sockaddr *addr)
return -1; return -1;
} }
static int max_connections = 32;
/* static unsigned int live_children;
* We count spawned/reaped separately, just to avoid any
* races when updating them from signals. The SIGCHLD handler
* will only update children_reaped, and the fork logic will
* only update children_spawned.
*
* MAX_CHILDREN should be a power-of-two to make the modulus
* operation cheap. It should also be at least twice
* the maximum number of connections we will ever allow.
*/
#define MAX_CHILDREN 128
static int max_connections = 25;
/* These are updated by the signal handler */
static volatile unsigned int children_reaped;
static pid_t dead_child[MAX_CHILDREN];
/* These are updated by the main loop */
static unsigned int children_spawned;
static unsigned int children_deleted;
static struct child { static struct child {
struct child *next;
pid_t pid; pid_t pid;
int addrlen;
struct sockaddr_storage address; struct sockaddr_storage address;
} live_child[MAX_CHILDREN]; } *firstborn;
static void add_child(int idx, pid_t pid, struct sockaddr *addr, int addrlen) static void add_child(pid_t pid, struct sockaddr *addr, int addrlen)
{ {
live_child[idx].pid = pid; struct child *newborn, **cradle;
live_child[idx].addrlen = addrlen;
memcpy(&live_child[idx].address, addr, addrlen);
}
/* /*
* Walk from "deleted" to "spawned", and remove child "pid". * This must be xcalloc() -- we'll compare the whole sockaddr_storage
* * but individual address may be shorter.
* We move everything up by one, since the new "deleted" will
* be one higher.
*/ */
static void remove_child(pid_t pid, unsigned deleted, unsigned spawned) newborn = xcalloc(1, sizeof(*newborn));
{ live_children++;
struct child n; newborn->pid = pid;
memcpy(&newborn->address, addr, addrlen);
deleted %= MAX_CHILDREN; for (cradle = &firstborn; *cradle; cradle = &(*cradle)->next)
spawned %= MAX_CHILDREN; if (!memcmp(&(*cradle)->address, &newborn->address,
if (live_child[deleted].pid == pid) { sizeof(newborn->address)))
live_child[deleted].pid = -1; break;
return; newborn->next = *cradle;
*cradle = newborn;
} }
n = live_child[deleted];
for (;;) { static void remove_child(pid_t pid)
struct child m; {
deleted = (deleted + 1) % MAX_CHILDREN; struct child **cradle, *blanket;
if (deleted == spawned)
die("could not find dead child %d\n", pid); for (cradle = &firstborn; (blanket = *cradle); cradle = &blanket->next)
m = live_child[deleted]; if (blanket->pid == pid) {
live_child[deleted] = n; *cradle = blanket->next;
if (m.pid == pid) live_children--;
return; free(blanket);
n = m; break;
} }
} }
@ -674,99 +631,60 @@ static void remove_child(pid_t pid, unsigned deleted, unsigned spawned)
* This gets called if the number of connections grows * This gets called if the number of connections grows
* past "max_connections". * past "max_connections".
* *
* We _should_ start off by searching for connections * We kill the newest connection from a duplicate IP.
from the same IP, and if there is some address with
* multiple connections, we should kill that first.
*
* As it is, we just "randomly" kill 25% of the connections,
* and our pseudo-random generator sucks too. I have no
* shame.
*
* Really, this is just a place-holder for a _real_ algorithm.
*/ */
static void kill_some_children(int signo, unsigned start, unsigned stop) static void kill_some_child(void)
{ {
start %= MAX_CHILDREN; const struct child *blanket, *next;
stop %= MAX_CHILDREN;
while (start != stop) { if (!(blanket = firstborn))
if (!(start & 3)) return;
kill(live_child[start].pid, signo);
start = (start + 1) % MAX_CHILDREN; for (; (next = blanket->next); blanket = next)
if (!memcmp(&blanket->address, &next->address,
sizeof(next->address))) {
kill(blanket->pid, SIGTERM);
break;
} }
} }
static void check_dead_children(void) static void check_dead_children(void)
{ {
unsigned spawned, reaped, deleted; int status;
pid_t pid;
spawned = children_spawned; while ((pid = waitpid(-1, &status, WNOHANG)) > 0) {
reaped = children_reaped; const char *dead = "";
deleted = children_deleted; remove_child(pid);
if (!WIFEXITED(status) || (WEXITSTATUS(status) > 0))
while (deleted < reaped) { dead = " (with error)";
pid_t pid = dead_child[deleted % MAX_CHILDREN]; loginfo("[%d] Disconnected%s", (int)pid, dead);
const char *dead = pid < 0 ? " (with error)" : "";
if (pid < 0)
pid = -pid;
/* XXX: Custom logging, since we don't wanna getpid() */
if (verbose) {
if (log_syslog)
syslog(LOG_INFO, "[%d] Disconnected%s",
pid, dead);
else
fprintf(stderr, "[%d] Disconnected%s\n",
pid, dead);
}
remove_child(pid, deleted, spawned);
deleted++;
}
children_deleted = deleted;
}
static void check_max_connections(void)
{
for (;;) {
int active;
unsigned spawned, deleted;
check_dead_children();
spawned = children_spawned;
deleted = children_deleted;
active = spawned - deleted;
if (active <= max_connections)
break;
/* Kill some unstarted connections with SIGTERM */
kill_some_children(SIGTERM, deleted, spawned);
if (active <= max_connections << 1)
break;
/* If the SIGTERM thing isn't helping use SIGKILL */
kill_some_children(SIGKILL, deleted, spawned);
sleep(1);
} }
} }
static void handle(int incoming, struct sockaddr *addr, int addrlen) static void handle(int incoming, struct sockaddr *addr, int addrlen)
{ {
pid_t pid = fork(); pid_t pid;
if (pid) {
unsigned idx;
if (max_connections && live_children >= max_connections) {
kill_some_child();
sleep(1); /* give it some time to die */
check_dead_children();
if (live_children >= max_connections) {
close(incoming); close(incoming);
if (pid < 0) logerror("Too many children, dropping connection");
return; return;
}
}
idx = children_spawned % MAX_CHILDREN; if ((pid = fork())) {
children_spawned++; close(incoming);
add_child(idx, pid, addr, addrlen); if (pid < 0) {
logerror("Couldn't fork %s", strerror(errno));
return;
}
check_max_connections(); add_child(pid, addr, addrlen);
return; return;
} }
@ -779,21 +697,11 @@ static void handle(int incoming, struct sockaddr *addr, int addrlen)
static void child_handler(int signo) static void child_handler(int signo)
{ {
for (;;) { /*
int status; * Otherwise empty handler because systemcalls will get interrupted
pid_t pid = waitpid(-1, &status, WNOHANG); * upon signal receipt
* SysV needs the handler to be rearmed
if (pid > 0) { */
unsigned reaped = children_reaped;
if (!WIFEXITED(status) || WEXITSTATUS(status) > 0)
pid = -pid;
dead_child[reaped % MAX_CHILDREN] = pid;
children_reaped = reaped + 1;
write(child_handler_pipe[1], &status, 1);
continue;
}
break;
}
signal(SIGCHLD, child_handler); signal(SIGCHLD, child_handler);
} }
@ -836,7 +744,7 @@ static int socksetup(char *listen_addr, int listen_port, int **socklist_p)
if (sockfd < 0) if (sockfd < 0)
continue; continue;
if (sockfd >= FD_SETSIZE) { if (sockfd >= FD_SETSIZE) {
error("too large socket descriptor."); logerror("Socket descriptor too large");
close(sockfd); close(sockfd);
continue; continue;
} }
@ -936,35 +844,28 @@ static int service_loop(int socknum, int *socklist)
struct pollfd *pfd; struct pollfd *pfd;
int i; int i;
if (pipe(child_handler_pipe) < 0) pfd = xcalloc(socknum, sizeof(struct pollfd));
die ("Could not set up pipe for child handler");
pfd = xcalloc(socknum + 1, sizeof(struct pollfd));
for (i = 0; i < socknum; i++) { for (i = 0; i < socknum; i++) {
pfd[i].fd = socklist[i]; pfd[i].fd = socklist[i];
pfd[i].events = POLLIN; pfd[i].events = POLLIN;
} }
pfd[socknum].fd = child_handler_pipe[0];
pfd[socknum].events = POLLIN;
signal(SIGCHLD, child_handler); signal(SIGCHLD, child_handler);
for (;;) { for (;;) {
int i; int i;
if (poll(pfd, socknum + 1, -1) < 0) { check_dead_children();
if (poll(pfd, socknum, -1) < 0) {
if (errno != EINTR) { if (errno != EINTR) {
error("poll failed, resuming: %s", logerror("Poll failed, resuming: %s",
strerror(errno)); strerror(errno));
sleep(1); sleep(1);
} }
continue; continue;
} }
if (pfd[socknum].revents & POLLIN) {
read(child_handler_pipe[0], &i, 1);
check_dead_children();
}
for (i = 0; i < socknum; i++) { for (i = 0; i < socknum; i++) {
if (pfd[i].revents & POLLIN) { if (pfd[i].revents & POLLIN) {
@ -1055,11 +956,6 @@ int main(int argc, char **argv)
gid_t gid = 0; gid_t gid = 0;
int i; int i;
/* Without this we cannot rely on waitpid() to tell
* what happened to our children.
*/
signal(SIGCHLD, SIG_DFL);
for (i = 1; i < argc; i++) { for (i = 1; i < argc; i++) {
char *arg = argv[i]; char *arg = argv[i];
@ -1105,6 +1001,12 @@ int main(int argc, char **argv)
init_timeout = atoi(arg+15); init_timeout = atoi(arg+15);
continue; continue;
} }
if (!prefixcmp(arg, "--max-connections=")) {
max_connections = atoi(arg+18);
if (max_connections < 0)
max_connections = 0; /* unlimited */
continue;
}
if (!strcmp(arg, "--strict-paths")) { if (!strcmp(arg, "--strict-paths")) {
strict_paths = 1; strict_paths = 1;
continue; continue;
@ -1178,9 +1080,10 @@ int main(int argc, char **argv)
} }
if (log_syslog) { if (log_syslog) {
openlog("git-daemon", 0, LOG_DAEMON); openlog("git-daemon", LOG_PID, LOG_DAEMON);
set_die_routine(daemon_die); set_die_routine(daemon_die);
} } else
setlinebuf(stderr); /* avoid splitting a message in the middle */
if (inetd_mode && (group_name || user_name)) if (inetd_mode && (group_name || user_name))
die("--user and --group are incompatible with --inetd"); die("--user and --group are incompatible with --inetd");
@ -1233,8 +1136,10 @@ int main(int argc, char **argv)
return execute(peer); return execute(peer);
} }
if (detach) if (detach) {
daemonize(); daemonize();
loginfo("Ready to rumble");
}
else else
sanitize_stdfds(); sanitize_stdfds();