view usr/src/cmd/svc/configd/configd.c @ 13718:eff5ad995241

Backed out changeset 33bb96bf701a (missing bugid)
author Garrett D'Amore <garrett@damore.org>
date Sat, 09 Jun 2012 17:38:51 -0700
parents 33bb96bf701a
children da056fdd2d14
line wrap: on
line source

/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

#pragma ident	"%Z%%M%	%I%	%E% SMI"

#include <assert.h>
#include <door.h>
#include <errno.h>
#include <fcntl.h>
#include <limits.h>
#include <priv.h>
#include <procfs.h>
#include <pthread.h>
#include <signal.h>
#include <stdarg.h>
#include <stdio.h>
#include <stdio_ext.h>
#include <stdlib.h>
#include <string.h>
#include <syslog.h>
#include <sys/corectl.h>
#include <sys/resource.h>
#include <sys/stat.h>
#include <sys/wait.h>
#include <ucontext.h>
#include <unistd.h>

#include "configd.h"

/*
 * This file manages the overall startup and shutdown of configd, as well
 * as managing its door thread pool and per-thread datastructures.
 *
 * 1.  Per-thread Datastructures
 * -----------------------------
 * Each configd thread has an associated thread_info_t which contains its
 * current state.  A pointer is kept to this in TSD, keyed by thread_info_key.
 * The thread_info_ts for all threads in configd are kept on a single global
 * list, thread_list.  After creation, the state in the thread_info structure
 * is only modified by the associated thread, so no locking is needed.  A TSD
 * destructor removes the thread_info from the global list and frees it at
 * pthread_exit() time.
 *
 * Threads access their per-thread data using thread_self()
 *
 * The thread_list is protected by thread_lock, a leaf lock.
 *
 * 2. Door Thread Pool Management
 * ------------------------------
 * Whenever door_return(3door) returns from the kernel and there are no
 * other configd threads waiting for requests, libdoor automatically
 * invokes a function registered with door_server_create(), to request a new
 * door server thread.  The default function just creates a thread that calls
 * door_return(3door).  Unfortunately, since it can take a while for the new
 * thread to *get* to door_return(3door), a stream of requests can cause a
 * large number of threads to be created, even though they aren't all needed.
 *
 * In our callback, new_thread_needed(), we limit ourselves to two new threads
 * at a time -- this logic is handled in reserve_new_thread().  This keeps
 * us from creating an absurd number of threads in response to peaking load.
 */
/* TSD key under which each thread stores its thread_info_t; see thread_self() */
static pthread_key_t	thread_info_key;
/* attributes used for every door server thread created in this file */
static pthread_attr_t	thread_attr;

/* leaf lock protecting thread_list, num_started and num_servers */
static pthread_mutex_t	thread_lock = PTHREAD_MUTEX_INITIALIZER;
int			num_started;	/* number actually running */
int			num_servers;	/* number in-progress or running */
static uu_list_pool_t	*thread_pool;
uu_list_t		*thread_list;

/* statically allocated thread_info for the thread running main() */
static thread_info_t	main_thread_info;

/*
 * Shutdown request flag.  It is stored by the asynchronous signal handler
 * handler() and polled by main(), so it must be a volatile sig_atomic_t
 * rather than a plain int.
 */
static volatile sig_atomic_t	finished;

/*
 * Set by the -p option: the pid of our parent, which is then the only
 * process allowed to connect, and an open descriptor on its /proc psinfo
 * file.  privileged_pid is zero when -p was not given.
 */
static pid_t	privileged_pid = 0;
static int	privileged_psinfo_fd = -1;

/*
 * When running with a non-root euid (and without -p), the only euid that is
 * allowed to connect.  Zero otherwise.
 */
static int	privileged_user = 0;

/* the "zone" privilege set, or NULL; consulted by ucred_is_privileged() */
static priv_set_t *privileged_privs;

/* non-zero makes configd_vlog() use syslog instead of stderr */
static int	log_to_syslog = 0;

/* cleared by main() when -r or -t is given */
int		is_main_repository = 1;

int		max_repository_backups = 4;

/* soft and hard RLIMIT_NOFILE value requested by main() */
#define	CONFIGD_MAX_FDS		262144

/*
 * Thanks, Mike
 *
 * Handler for the signals we abort on (main() installs it for SIGABRT with
 * SA_SIGINFO).  It restores the default disposition of the signal, prints a
 * stack trace to file descriptor 2, and then resumes the interrupted context
 * with every signal except this one blocked.  If the signal was sent by a
 * user process, it is first re-sent to the current thread.
 *
 * NOTE(review): presumably the intent is that the signal is then taken again
 * from the original context with its default action -- confirm.
 *
 *	sig	the signal being handled
 *	sip	signal information; may be NULL
 *	ucp	the interrupted context; modified and resumed
 */
void
abort_handler(int sig, siginfo_t *sip, ucontext_t *ucp)
{
	struct sigaction act;

	/* put the signal back to its default disposition */
	(void) sigemptyset(&act.sa_mask);
	act.sa_handler = SIG_DFL;
	act.sa_flags = 0;
	(void) sigaction(sig, &act, NULL);

	/* stack trace goes to fd 2 */
	(void) printstack(2);

	/* a signal that came from a user process is re-sent to this thread */
	if (sip != NULL && SI_FROMUSER(sip))
		(void) pthread_kill(pthread_self(), sig);
	/* resume the interrupted context with only `sig' unblocked */
	(void) sigfillset(&ucp->uc_sigmask);
	(void) sigdelset(&ucp->uc_sigmask, sig);
	ucp->uc_flags |= UC_SIGMASK;
	(void) setcontext(ucp);
}

/*
 * Throttle thread creation.  num_servers counts threads that are running or
 * still being created, and num_started counts those that have actually
 * started, so their difference is the number of creates outstanding.  A new
 * reservation is granted only while at most one create is outstanding.
 *
 * Returns 1 (and bumps num_servers) if the caller may create a thread, 0 if
 * it may not.
 */
static int
reserve_new_thread(void)
{
	int granted = 0;

	(void) pthread_mutex_lock(&thread_lock);
	assert(num_started >= 0);
	if (num_servers <= num_started + 1) {
		++num_servers;
		granted = 1;
	}
	(void) pthread_mutex_unlock(&thread_lock);

	return (granted);
}

/*
 * Release a thread_info_t: its ucred buffer (if it has one), its list node,
 * and finally the structure itself.
 */
static void
thread_info_free(thread_info_t *ti)
{
	if (ti->ti_ucred != NULL) {
		uu_free(ti->ti_ucred);
	}

	uu_list_node_fini(ti, &ti->ti_node, thread_pool);
	uu_free(ti);
}

/*
 * Per-thread teardown.  Registered by main() as the destructor for
 * thread_info_key, and also called directly with a NULL argument by
 * new_thread_needed() to give back a reservation when thread creation fails.
 *
 * With a non-NULL argument the thread is taken off thread_list and no longer
 * counted as started.  In both cases num_servers is dropped by one; if that
 * leaves no door server threads at all, we log a critical error and abort.
 * The thread_info is freed unless it is the statically allocated one that
 * belongs to main().
 */
static void
thread_exiting(void *arg)
{
	thread_info_t *self = arg;
	const int have_info = (self != NULL);

	if (have_info)
		log_enter(&self->ti_log);

	(void) pthread_mutex_lock(&thread_lock);
	if (have_info) {
		num_started--;
		uu_list_remove(thread_list, self);
	}
	assert(num_servers > 0);
	if (--num_servers == 0) {
		configd_critical("no door server threads\n");
		abort();
	}
	(void) pthread_mutex_unlock(&thread_lock);

	if (have_info && self != &main_thread_info)
		thread_info_free(self);
}

/*
 * Move a thread to `newstate'.  The cached ucred is always invalidated; the
 * previous state and the change timestamp are only updated when the state
 * really changes.
 */
void
thread_newstate(thread_info_t *ti, thread_state_t newstate)
{
	/* invalidate cached ucred */
	ti->ti_ucred_read = 0;

	if (ti->ti_state == newstate)
		return;

	ti->ti_prev_state = ti->ti_state;
	ti->ti_state = newstate;
	ti->ti_lastchange = gethrtime();
}

/*
 * Return the calling thread's thread_info_t, as stored in TSD under
 * thread_info_key.
 */
thread_info_t *
thread_self(void)
{
	thread_info_t *self = pthread_getspecific(thread_info_key);

	return (self);
}

/*
 * Return the credentials for the current door call, fetching them with
 * door_ucred() into the calling thread's ti_ucred the first time and
 * returning the cached value after that (thread_newstate() resets the cache).
 *
 * get_ucred() returns NULL if it was unable to get the credential
 * information.
 */
ucred_t *
get_ucred(void)
{
	thread_info_t *ti = thread_self();

	if (!ti->ti_ucred_read) {
		if (door_ucred(&ti->ti_ucred) != 0)
			return (NULL);
		ti->ti_ucred_read = 1;
	}

	return (ti->ti_ucred);
}

/*
 * Decide whether the holder of `uc' counts as privileged: its effective
 * privilege set must either be the full set or contain everything in
 * privileged_privs (the "zone" set, when main() could build it).
 *
 * Returns 1 if privileged, 0 if not or if the effective set is unavailable.
 */
int
ucred_is_privileged(ucred_t *uc)
{
	const priv_set_t *effective = ucred_getprivset(uc, PRIV_EFFECTIVE);

	if (effective == NULL)
		return (0);

	/* process has all privs */
	if (priv_isfullset(effective))
		return (1);

	if (privileged_privs == NULL)
		return (0);

	/* process has zone privs */
	return (priv_issubset(privileged_privs, effective) ? 1 : 0);
}

/*
 * The purpose of this function is to get the audit session data for use in
 * generating SMF audit events.  We use a single audit session per client.
 *
 * get_audit_session() may return NULL.  It is legal to use a NULL pointer
 * in subsequent calls to adt_* functions.
 */
adt_session_data_t *
get_audit_session(void)
{
	thread_info_t	*ti = thread_self();

	return (ti->ti_active_client->rc_adt_session);
}

/*
 * Start routine for the door server threads created by new_thread_needed().
 * `arg' is the thread's freshly allocated thread_info_t.
 *
 * The thread disables cancellation, counts itself as started, appends its
 * thread_info to thread_list, records it in TSD, and then parks in
 * door_return() to service door calls.
 */
static void *
thread_start(void *arg)
{
	thread_info_t *self = arg;
	void *tail;

	(void) pthread_setcancelstate(PTHREAD_CANCEL_DISABLE, NULL);

	(void) pthread_mutex_lock(&thread_lock);
	num_started++;
	tail = uu_list_last(thread_list);
	(void) uu_list_insert_after(thread_list, tail, self);
	(void) pthread_mutex_unlock(&thread_lock);

	(void) pthread_setspecific(thread_info_key, self);
	thread_newstate(self, TI_DOOR_RETURN);

	/* start handling door calls */
	(void) door_return(NULL, 0, NULL, 0);
	return (arg);
}

/*
 * Callback registered with door_server_create(); invoked when another door
 * server thread is wanted.  `dip' is expected to be NULL.
 *
 * If reserve_new_thread() grants a slot, a thread_info_t and its ucred
 * buffer are allocated and a thread running thread_start() is created.  All
 * signals are blocked in the caller around pthread_create() and the previous
 * mask is restored afterwards.  On any failure the reservation is given back
 * and the partially built thread_info is freed.
 */
static void
new_thread_needed(door_info_t *dip)
{
	thread_info_t *ti;
	sigset_t everything, saved;
	int created;

	assert(dip == NULL);

	if (!reserve_new_thread())
		return;

	ti = uu_zalloc(sizeof (*ti));
	if (ti == NULL)
		goto fail;

	uu_list_node_init(ti, &ti->ti_node, thread_pool);
	ti->ti_state = TI_CREATED;
	ti->ti_prev_state = TI_CREATED;

	ti->ti_ucred = uu_zalloc(ucred_size());
	if (ti->ti_ucred == NULL)
		goto fail;

	(void) sigfillset(&everything);
	(void) pthread_sigmask(SIG_SETMASK, &everything, &saved);
	errno = pthread_create(&ti->ti_thread, &thread_attr, thread_start,
	    ti);
	created = (errno == 0);
	(void) pthread_sigmask(SIG_SETMASK, &saved, NULL);

	if (created)
		return;

fail:
	/*
	 * Since the thread_info structure was never linked onto the
	 * thread list, thread_exiting() can't handle the cleanup.
	 */
	thread_exiting(NULL);
	if (ti != NULL)
		thread_info_free(ti);
}

/*
 * Validate a connection request and, if it is acceptable, hand it to
 * create_client().
 *
 *	uc	credentials of the caller
 *	rp	the caller's request
 *	rp_size	number of valid bytes at rp
 *	out_fd	passed through to create_client()
 *
 * Returns REPOSITORY_DOOR_FAIL_PERMISSION_DENIED if the caller fails the
 * privileged-pid or privileged-user check, REPOSITORY_DOOR_FAIL_BAD_REQUEST
 * if the request is too short to contain a required field,
 * REPOSITORY_DOOR_FAIL_BAD_FLAG if unknown flag bits are set, and otherwise
 * whatever create_client() returns.
 */
int
create_connection(ucred_t *uc, repository_door_request_t *rp,
    size_t rp_size, int *out_fd)
{
	int flags;
	int privileged = 0;
	uint32_t debugflags = 0;
	psinfo_t info;

	if (privileged_pid != 0) {
		/*
		 * in privileged pid mode, we only allow connections from
		 * our original parent -- the psinfo read verifies that
		 * it is the same process which we started with.
		 *
		 * The descriptor is opened once and shared by every
		 * connection attempt, so read at an explicit offset of 0
		 * with pread().  A plain read() moves the descriptor's file
		 * offset, which would leave later (or concurrent) checks
		 * reading from somewhere other than the start of the file.
		 */
		if (ucred_getpid(uc) != privileged_pid ||
		    pread(privileged_psinfo_fd, &info, sizeof (info), 0) !=
		    sizeof (info))
			return (REPOSITORY_DOOR_FAIL_PERMISSION_DENIED);

		privileged = 1;			/* he gets full privileges */
	} else if (privileged_user != 0) {
		/*
		 * in privileged user mode, only one particular user is
		 * allowed to connect to us, and he can do anything.
		 */
		if (ucred_geteuid(uc) != privileged_user)
			return (REPOSITORY_DOOR_FAIL_PERMISSION_DENIED);

		privileged = 1;
	}

	/*
	 * Check that rp, of size rp_size, is large enough to
	 * contain field 'f'.  If so, write the value into *out, and return 1.
	 * Otherwise, return 0.
	 */
#define	GET_ARG(rp, rp_size, f, out)					\
	(((rp_size) >= offsetofend(repository_door_request_t, f)) ?	\
	    ((*(out) = (rp)->f), 1) : 0)

	if (!GET_ARG(rp, rp_size, rdr_flags, &flags))
		return (REPOSITORY_DOOR_FAIL_BAD_REQUEST);

	/* the check below assumes DEBUG is the only flag that exists */
#if (REPOSITORY_DOOR_FLAG_ALL != REPOSITORY_DOOR_FLAG_DEBUG)
#error Need to update flag checks
#endif

	if (flags & ~REPOSITORY_DOOR_FLAG_ALL)
		return (REPOSITORY_DOOR_FAIL_BAD_FLAG);

	/* rdr_debug is only required when the debug flag is set */
	if (flags & REPOSITORY_DOOR_FLAG_DEBUG)
		if (!GET_ARG(rp, rp_size, rdr_debug, &debugflags))
			return (REPOSITORY_DOOR_FAIL_BAD_REQUEST);
#undef GET_ARG

	return (create_client(ucred_getpid(uc), debugflags, privileged,
	    out_fd));
}

/*
 * Core logging routine.  When log_to_syslog is set, the formatted message is
 * handed to vsyslog() at `severity' and `prefix' is not used.  Otherwise the
 * optional prefix and the formatted message are written to stderr as one
 * unit (the stream is locked for the duration), and a newline is added if
 * the format string does not already end in one.
 */
void
configd_vlog(int severity, const char *prefix, const char *message,
    va_list args)
{
	size_t fmtlen;

	if (log_to_syslog) {
		vsyslog(severity, message, args);
		return;
	}

	fmtlen = strlen(message);

	flockfile(stderr);
	if (prefix != NULL)
		(void) fputs(prefix, stderr);
	(void) vfprintf(stderr, message, args);
	if (fmtlen == 0 || message[fmtlen - 1] != '\n')
		(void) fputc('\n', stderr);
	funlockfile(stderr);
}

/*
 * va_list form of configd_critical(): log `message' at LOG_CRIT with the
 * fatal-error prefix.
 */
void
configd_vcritical(const char *message, va_list args)
{
	static const char fatal_prefix[] = "svc.configd: Fatal error: ";

	configd_vlog(LOG_CRIT, fatal_prefix, message, args);
}

/*
 * Log a printf-style fatal error message via configd_vcritical().
 */
void
configd_critical(const char *message, ...)
{
	va_list ap;

	va_start(ap, message);
	configd_vcritical(message, ap);
	va_end(ap);
}

/*
 * Log a printf-style informational message at LOG_INFO with the
 * "svc.configd: " prefix.
 */
void
configd_info(const char *message, ...)
{
	static const char info_prefix[] = "svc.configd: ";
	va_list ap;

	va_start(ap, message);
	configd_vlog(LOG_INFO, info_prefix, message, ap);
	va_end(ap);
}

/*
 * Print the command-line synopsis for `prog' to stderr and exit with status
 * `ret'.  Does not return.
 */
static void
usage(const char *prog, int ret)
{
	FILE *out = stderr;

	(void) fprintf(out,
	    "usage: %s [-np] [-d door_path] [-r repository_path]\n"
	    "    [-t nonpersist_repository]\n",
	    prog);
	exit(ret);
}

/*
 * Signal handler installed by main() for SIGHUP, SIGINT and SIGTERM.  It
 * only records that shutdown was requested by setting `finished'; none of
 * its arguments are used.
 */
/*ARGSUSED*/
static void
handler(int sig, siginfo_t *info, void *data)
{
	finished = 1;
}

/*
 * Write end of the pipe the daemonized child uses to tell its waiting parent
 * that startup has completed; set by daemonize_start() and consumed by
 * daemonize_ready().
 */
static int pipe_fd = -1;

/*
 * First half of daemonizing.  Closes stdin, points stdout at stderr, creates
 * a pipe and forks.
 *
 * The parent never returns from this function: it waits for a single byte on
 * the pipe and exits with CONFIGD_EXIT_OKAY if it gets one.  Otherwise it
 * waits for the child and exits with the child's exit status, or with -1 if
 * the child did not exit normally.
 *
 * The child remembers the write end of the pipe in pipe_fd, starts a new
 * session, sets a umask of 077, and returns 0.
 *
 * Returns -1 with errno set if the pipe or the fork could not be created.
 */
static int
daemonize_start(void)
{
	char data;
	int status;
	int saved_errno;

	int filedes[2];
	pid_t pid;

	(void) close(0);
	(void) dup2(2, 1);		/* stderr only */

	if (pipe(filedes) < 0)
		return (-1);

	if ((pid = fork1()) < 0) {
		/*
		 * Don't leak the pipe on failure, and keep fork1()'s errno
		 * intact for the caller's perror().
		 */
		saved_errno = errno;
		(void) close(filedes[0]);
		(void) close(filedes[1]);
		errno = saved_errno;
		return (-1);
	}

	if (pid != 0) {
		/*
		 * parent
		 */
		struct sigaction act;

		/* sa_flags has no SA_SIGINFO, so sa_handler is the member */
		act.sa_handler = SIG_DFL;
		(void) sigemptyset(&act.sa_mask);
		act.sa_flags = 0;

		/* default SIGPIPE disposition */
		(void) sigaction(SIGPIPE, &act, NULL);

		(void) close(filedes[1]);
		if (read(filedes[0], &data, 1) == 1) {
			/* presume success */
			_exit(CONFIGD_EXIT_OKAY);
		}

		/* no byte arrived: report how the child ended instead */
		status = -1;
		(void) wait4(pid, &status, 0, NULL);
		if (WIFEXITED(status))
			_exit(WEXITSTATUS(status));
		else
			_exit(-1);
	}

	/*
	 * child
	 */
	pipe_fd = filedes[1];
	(void) close(filedes[0]);

	/*
	 * generic Unix setup
	 */
	(void) setsid();
	(void) umask(0077);

	return (0);
}

/*
 * Second half of daemonizing: write one byte to the pipe set up by
 * daemonize_start() so that the waiting parent can exit, then close our end
 * of the pipe.
 */
static void
daemonize_ready(void)
{
	const char wakeup = '\0';

	/* wake the parent */
	(void) write(pipe_fd, &wakeup, 1);
	(void) close(pipe_fd);
}

/*
 * Turn `base' into an absolute path.
 *
 *	dir	directory that relative paths are resolved against
 *	base	path to regularize; may be NULL
 *	tmpbuf	caller-supplied buffer of at least PATH_MAX bytes
 *
 * A NULL or already-absolute `base' is returned unchanged.  Otherwise
 * "dir/base" is built in tmpbuf and tmpbuf is returned.  If the result does
 * not fit in PATH_MAX bytes, an error is printed to stderr and the process
 * exits with CONFIGD_EXIT_BAD_ARGS.
 */
const char *
regularize_path(const char *dir, const char *base, char *tmpbuf)
{
	int needed;

	/* nothing to do for a missing or absolute path */
	if (base == NULL || base[0] == '/')
		return (base);

	needed = snprintf(tmpbuf, PATH_MAX, "%s/%s", dir, base);
	if (needed >= PATH_MAX) {
		(void) fprintf(stderr, "svc.configd: %s/%s: path too long\n",
		    dir, base);
		exit(CONFIGD_EXIT_BAD_ARGS);
	}

	return (tmpbuf);
}

/*
 * Entry point for svc.configd.
 *
 * Parses the command line, optionally daemonizes, installs the signal
 * dispositions, raises the file descriptor limit, initializes the backend,
 * client and rc_node subsystems, sets up the per-thread bookkeeping and the
 * main door, and then waits for SIGHUP, SIGINT or SIGTERM before shutting
 * the backend down.
 *
 * Options:
 *	-n	do not daemonize
 *	-d path	door path; also defaults to no non-persistent repository
 *	-p	only accept connections from our parent process
 *	-r path	repository path; clears is_main_repository
 *	-t path	non-persistent repository path; clears is_main_repository
 *		and always enables the non-persistent repository
 *
 * Returns CONFIGD_EXIT_OKAY after a signal-driven shutdown.  Initialization
 * failures exit() with one of the other CONFIGD_EXIT_* values.
 */
int
main(int argc, char *argv[])
{
	thread_info_t *ti = &main_thread_info;

	/* room for "/proc/<pid>/psinfo" with up to ten digits of pid */
	char pidpath[sizeof ("/proc/" "/psinfo") + 10];

	struct rlimit fd_new;

	const char *endptr;
	sigset_t myset;
	int c;
	int ret;
	int fd;

	/* backing storage for the paths returned by regularize_path() */
	char curdir[PATH_MAX];
	char dbtmp[PATH_MAX];
	char npdbtmp[PATH_MAX];
	char doortmp[PATH_MAX];

	const char *dbpath = NULL;
	const char *npdbpath = NULL;
	const char *doorpath = REPOSITORY_DOOR_NAME;
	struct sigaction act;

	int daemonize = 1;		/* default to daemonizing */
	int have_npdb = 1;

	closefrom(3);			/* get rid of extraneous fds */

	/* relative path arguments are resolved against the starting cwd */
	if (getcwd(curdir, sizeof (curdir)) == NULL) {
		(void) fprintf(stderr,
		    "%s: unable to get current directory: %s\n",
		    argv[0], strerror(errno));
		exit(CONFIGD_EXIT_INIT_FAILED);
	}

	/*
	 * Note that 'D' appears in the option string but has no case of its
	 * own, so it ends up in the default branch and prints the usage.
	 */
	while ((c = getopt(argc, argv, "Dnpd:r:t:")) != -1) {
		switch (c) {
		case 'n':
			daemonize = 0;
			break;
		case 'd':
			doorpath = regularize_path(curdir, optarg, doortmp);
			have_npdb = 0;		/* default to no non-persist */
			break;
		case 'p':
			log_to_syslog = 0;	/* don't use syslog */

			/*
			 * If our parent exits while we're opening its /proc
			 * psinfo, we're vulnerable to a pid wrapping.  To
			 * protect against that, re-check our ppid after
			 * opening it.
			 */
			privileged_pid = getppid();
			(void) snprintf(pidpath, sizeof (pidpath),
			    "/proc/%d/psinfo", privileged_pid);
			if ((fd = open(pidpath, O_RDONLY)) < 0 ||
			    getppid() != privileged_pid) {
				(void) fprintf(stderr,
				    "%s: unable to get parent info\n", argv[0]);
				exit(CONFIGD_EXIT_BAD_ARGS);
			}
			/* kept open; create_connection() reads from it */
			privileged_psinfo_fd = fd;
			break;
		case 'r':
			dbpath = regularize_path(curdir, optarg, dbtmp);
			is_main_repository = 0;
			break;
		case 't':
			npdbpath = regularize_path(curdir, optarg, npdbtmp);
			is_main_repository = 0;
			break;
		default:
			usage(argv[0], CONFIGD_EXIT_BAD_ARGS);
			break;
		}
	}

	/*
	 * If we're not running as root, allow our euid full access, and
	 * everyone else no access.
	 */
	if (privileged_pid == 0 && geteuid() != 0) {
		privileged_user = geteuid();
	}

	/*
	 * Build the "zone" privilege set used by ucred_is_privileged().  A
	 * non-NULL endptr is treated as a parse failure, in which case the
	 * set is discarded.
	 * NOTE(review): presumably endptr is left NULL on a clean parse --
	 * confirm against priv_str_to_set(3C).
	 */
	privileged_privs = priv_str_to_set("zone", "", &endptr);
	if (endptr != NULL && privileged_privs != NULL) {
		priv_freeset(privileged_privs);
		privileged_privs = NULL;
	}

	openlog("svc.configd", LOG_PID | LOG_CONS, LOG_DAEMON);
	(void) setlogmask(LOG_UPTO(LOG_NOTICE));

	/*
	 * if a non-persist db is specified, always enable it
	 */
	if (npdbpath)
		have_npdb = 1;

	/* no operands are accepted */
	if (optind != argc)
		usage(argv[0], CONFIGD_EXIT_BAD_ARGS);

	if (daemonize) {
		if (getuid() == 0)
			(void) chdir("/");
		/* only the child returns from a successful daemonize_start() */
		if (daemonize_start() < 0) {
			(void) perror("unable to daemonize");
			exit(CONFIGD_EXIT_INIT_FAILED);
		}
	}
	/* when running as root, set our core file path to CONFIGD_CORE */
	if (getuid() == 0)
		(void) core_set_process_path(CONFIGD_CORE,
		    strlen(CONFIGD_CORE) + 1, getpid());

	/*
	 * this should be enabled once we can drop privileges and still get
	 * a core dump.
	 */
#if 0
	/* turn off basic privileges we do not need */
	(void) priv_set(PRIV_OFF, PRIV_PERMITTED, PRIV_FILE_LINK_ANY,
	    PRIV_PROC_EXEC, PRIV_PROC_FORK, PRIV_PROC_SESSION, NULL);
#endif

	/* not that we can exec, but to be safe, shut them all off... */
	(void) priv_set(PRIV_SET, PRIV_INHERITABLE, NULL);

	/* every handler installed below runs with all signals blocked */
	(void) sigfillset(&act.sa_mask);

	/* signals to ignore */
	act.sa_sigaction = SIG_IGN;
	act.sa_flags = 0;
	(void) sigaction(SIGPIPE, &act, NULL);
	(void) sigaction(SIGALRM, &act, NULL);
	(void) sigaction(SIGUSR1, &act, NULL);
	(void) sigaction(SIGUSR2, &act, NULL);
	(void) sigaction(SIGPOLL, &act, NULL);

	/* signals to abort on */
	act.sa_sigaction = (void (*)(int, siginfo_t *, void *))&abort_handler;
	act.sa_flags = SA_SIGINFO;

	(void) sigaction(SIGABRT, &act, NULL);

	/* signals to handle */
	act.sa_sigaction = &handler;
	act.sa_flags = SA_SIGINFO;

	(void) sigaction(SIGHUP, &act, NULL);
	(void) sigaction(SIGINT, &act, NULL);
	(void) sigaction(SIGTERM, &act, NULL);

	/* the shutdown signals this thread will block and sigwait() for */
	(void) sigemptyset(&myset);
	(void) sigaddset(&myset, SIGHUP);
	(void) sigaddset(&myset, SIGINT);
	(void) sigaddset(&myset, SIGTERM);

	if ((errno = pthread_attr_init(&thread_attr)) != 0) {
		(void) perror("initializing");
		exit(CONFIGD_EXIT_INIT_FAILED);
	}

	/*
	 * Set the hard and soft limits to CONFIGD_MAX_FDS.
	 */
	fd_new.rlim_max = fd_new.rlim_cur = CONFIGD_MAX_FDS;
	(void) setrlimit(RLIMIT_NOFILE, &fd_new);

#ifndef NATIVE_BUILD /* Allow building on snv_38 and earlier; remove later. */
	(void) enable_extended_FILE_stdio(-1, -1);
#endif

	/* backend_init() reports failure as the exit status to use */
	if ((ret = backend_init(dbpath, npdbpath, have_npdb)) !=
	    CONFIGD_EXIT_OKAY)
		exit(ret);

	if (!client_init())
		exit(CONFIGD_EXIT_INIT_FAILED);

	if (!rc_node_init())
		exit(CONFIGD_EXIT_INIT_FAILED);

	/* door server threads are created detached and system-scoped */
	(void) pthread_attr_setdetachstate(&thread_attr,
	    PTHREAD_CREATE_DETACHED);
	(void) pthread_attr_setscope(&thread_attr, PTHREAD_SCOPE_SYSTEM);

	/* thread_exiting() is the destructor for the per-thread info */
	if ((errno = pthread_key_create(&thread_info_key,
	    thread_exiting)) != 0) {
		perror("pthread_key_create");
		exit(CONFIGD_EXIT_INIT_FAILED);
	}

	if ((thread_pool = uu_list_pool_create("thread_pool",
	    sizeof (thread_info_t), offsetof(thread_info_t, ti_node),
	    NULL, UU_LIST_POOL_DEBUG)) == NULL) {
		configd_critical("uu_list_pool_create: %s\n",
		    uu_strerror(uu_error()));
		exit(CONFIGD_EXIT_INIT_FAILED);
	}

	if ((thread_list = uu_list_create(thread_pool, NULL, 0)) == NULL) {
		configd_critical("uu_list_create: %s\n",
		    uu_strerror(uu_error()));
		exit(CONFIGD_EXIT_INIT_FAILED);
	}

	/*
	 * Set up the statically allocated thread_info for this (the main)
	 * thread and put it at the head of the thread list.
	 */
	(void) memset(ti, '\0', sizeof (*ti));
	uu_list_node_init(ti, &ti->ti_node, thread_pool);
	(void) uu_list_insert_before(thread_list, uu_list_first(thread_list),
	    ti);

	ti->ti_thread = pthread_self();
	ti->ti_state = TI_SIGNAL_WAIT;
	ti->ti_prev_state = TI_SIGNAL_WAIT;

	(void) pthread_setspecific(thread_info_key, ti);

	/* from here on, new door server threads come from our callback */
	(void) door_server_create(new_thread_needed);

	if (!setup_main_door(doorpath)) {
		configd_critical("Setting up main door failed.\n");
		exit(CONFIGD_EXIT_DOOR_INIT_FAILED);
	}

	/* startup is complete; let the waiting parent exit */
	if (daemonize)
		daemonize_ready();

	/*
	 * Block the shutdown signals in this thread and wait for one of them
	 * synchronously.  `finished' covers a signal that handler() already
	 * caught before the signals were blocked.
	 * NOTE(review): this relies on the single-argument sigwait() that
	 * returns the signal number -- confirm against the platform's
	 * sigwait(2).
	 */
	(void) pthread_sigmask(SIG_BLOCK, &myset, NULL);
	while (!finished) {
		int sig = sigwait(&myset);
		if (sig > 0) {
			break;
		}
	}

	backend_fini();

	return (CONFIGD_EXIT_OKAY);
}