Skip site navigation (1)Skip section navigation (2)
Date:      Wed, 30 Mar 2011 17:48:15 +0000 (UTC)
From:      Edward Tomasz Napierala <trasz@FreeBSD.org>
To:        src-committers@freebsd.org, svn-src-all@freebsd.org, svn-src-head@freebsd.org
Subject:   svn commit: r220163 - in head/sys: compat/freebsd32 conf kern sys
Message-ID:  <201103301748.p2UHmF0g070602@svn.freebsd.org>

next in thread | raw e-mail | index | archive | help
Author: trasz
Date: Wed Mar 30 17:48:15 2011
New Revision: 220163
URL: http://svn.freebsd.org/changeset/base/220163

Log:
  Add rctl.  It's used by racct to take user-configurable actions based
  on the set of rules it maintains and the current resource usage.  It also
  provides a userland API to manage that ruleset.
  
  Sponsored by:	The FreeBSD Foundation
  Reviewed by:	kib (earlier version)

Added:
  head/sys/kern/kern_rctl.c   (contents, props changed)
  head/sys/sys/rctl.h   (contents, props changed)
Modified:
  head/sys/compat/freebsd32/syscalls.master
  head/sys/conf/NOTES
  head/sys/conf/files
  head/sys/conf/options
  head/sys/kern/kern_jail.c
  head/sys/kern/syscalls.master
  head/sys/sys/priv.h

Modified: head/sys/compat/freebsd32/syscalls.master
==============================================================================
--- head/sys/compat/freebsd32/syscalls.master	Wed Mar 30 17:37:04 2011	(r220162)
+++ head/sys/compat/freebsd32/syscalls.master	Wed Mar 30 17:48:15 2011	(r220163)
@@ -965,3 +965,18 @@
 523	AUE_NULL	NOPROTO	{ int getloginclass(char *namebuf, \
 				    size_t namelen); }
 524	AUE_NULL	NOPROTO	{ int setloginclass(const char *namebuf); }
+525	AUE_NULL	NOPROTO	{ int rctl_get_racct(const void *inbufp, \
+				    size_t inbuflen, void *outbufp, \
+				    size_t outbuflen); }
+526	AUE_NULL	NOPROTO	{ int rctl_get_rules(const void *inbufp, \
+				    size_t inbuflen, void *outbufp, \
+				    size_t outbuflen); }
+527	AUE_NULL	NOPROTO	{ int rctl_get_limits(const void *inbufp, \
+				    size_t inbuflen, void *outbufp, \
+				    size_t outbuflen); }
+528	AUE_NULL	NOPROTO	{ int rctl_add_rule(const void *inbufp, \
+				    size_t inbuflen, void *outbufp, \
+				    size_t outbuflen); }
+529	AUE_NULL	NOPROTO	{ int rctl_remove_rule(const void *inbufp, \
+				    size_t inbuflen, void *outbufp, \
+				    size_t outbuflen); }

Modified: head/sys/conf/NOTES
==============================================================================
--- head/sys/conf/NOTES	Wed Mar 30 17:37:04 2011	(r220162)
+++ head/sys/conf/NOTES	Wed Mar 30 17:48:15 2011	(r220163)
@@ -2933,6 +2933,9 @@ options 	AAC_DEBUG	# Debugging levels:
 # Resource Accounting
 options 	RACCT
 
+# Resource Limits
+options 	RCTL
+
 # Yet more undocumented options for linting.
 # BKTR_ALLOC_PAGES has no effect except to cause warnings, and
 # BROOKTREE_ALLOC_PAGES hasn't actually been superseded by it, since the

Modified: head/sys/conf/files
==============================================================================
--- head/sys/conf/files	Wed Mar 30 17:37:04 2011	(r220162)
+++ head/sys/conf/files	Wed Mar 30 17:48:15 2011	(r220163)
@@ -2226,6 +2226,7 @@ kern/kern_priv.c		standard
 kern/kern_proc.c		standard
 kern/kern_prot.c		standard
 kern/kern_racct.c		standard
+kern/kern_rctl.c		standard
 kern/kern_resource.c		standard
 kern/kern_rmlock.c		standard
 kern/kern_rwlock.c		standard

Modified: head/sys/conf/options
==============================================================================
--- head/sys/conf/options	Wed Mar 30 17:37:04 2011	(r220162)
+++ head/sys/conf/options	Wed Mar 30 17:48:15 2011	(r220163)
@@ -876,6 +876,9 @@ IPOIB_CM	opt_ofed.h
 # Resource Accounting
 RACCT		opt_global.h
 
+# Resource Limits
+RCTL		opt_global.h
+
 # At least one of the AR71XX ubiquiti boards has a Redboot configuration
 # that "lies" about the amount of RAM it has. Until a cleaner method is
 # defined, this option will suffice in overriding what Redboot says.

Modified: head/sys/kern/kern_jail.c
==============================================================================
--- head/sys/kern/kern_jail.c	Wed Mar 30 17:37:04 2011	(r220162)
+++ head/sys/kern/kern_jail.c	Wed Mar 30 17:48:15 2011	(r220163)
@@ -50,6 +50,7 @@ __FBSDID("$FreeBSD$");
 #include <sys/lock.h>
 #include <sys/mutex.h>
 #include <sys/racct.h>
+#include <sys/rctl.h>
 #include <sys/sx.h>
 #include <sys/sysent.h>
 #include <sys/namei.h>
@@ -2532,6 +2533,9 @@ prison_deref(struct prison *pr, int flag
 		if (pr->pr_cpuset != NULL)
 			cpuset_rel(pr->pr_cpuset);
 		osd_jail_exit(pr);
+#ifdef RCTL
+		rctl_racct_release(pr->pr_racct);
+#endif
 		racct_destroy(&pr->pr_racct);
 		free(pr, M_PRISON);
 

Added: head/sys/kern/kern_rctl.c
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/sys/kern/kern_rctl.c	Wed Mar 30 17:48:15 2011	(r220163)
@@ -0,0 +1,1850 @@
+/*-
+ * Copyright (c) 2010 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+
+#include <sys/cdefs.h>
+__FBSDID("$FreeBSD$");
+
+#include <sys/param.h>
+#include <sys/bus.h>
+#include <sys/malloc.h>
+#include <sys/queue.h>
+#include <sys/refcount.h>
+#include <sys/jail.h>
+#include <sys/kernel.h>
+#include <sys/limits.h>
+#include <sys/loginclass.h>
+#include <sys/priv.h>
+#include <sys/proc.h>
+#include <sys/racct.h>
+#include <sys/rctl.h>
+#include <sys/resourcevar.h>
+#include <sys/sx.h>
+#include <sys/sysent.h>
+#include <sys/sysproto.h>
+#include <sys/systm.h>
+#include <sys/types.h>
+#include <sys/eventhandler.h>
+#include <sys/lock.h>
+#include <sys/mutex.h>
+#include <sys/rwlock.h>
+#include <sys/sbuf.h>
+#include <sys/taskqueue.h>
+#include <sys/tree.h>
+#include <vm/uma.h>
+
+#ifdef RCTL
+#ifndef RACCT
+#error "The RCTL option requires the RACCT option"
+#endif
+
+FEATURE(rctl, "Resource Limits");
+
+#define	HRF_DEFAULT		0
+#define	HRF_DONT_INHERIT	1
+#define	HRF_DONT_ACCUMULATE	2
+
+/* Default buffer size for rctl_get_rules(2). */
+#define	RCTL_DEFAULT_BUFSIZE	4096
+#define	RCTL_LOG_BUFSIZE	128
+
+/*
+ * 'rctl_rule_link' connects a rule with every racct it's related to.
+ * For example, rule 'user:X:openfiles:deny=N/process' is linked
+ * with uidinfo for user X, and to each process of that user.
+ *
+ * 'rrl_exceeded' is set by rctl_enforce() once the log, devctl or signal
+ * action of the rule has been carried out for this link, and is cleared
+ * again when the rule is found not to be exceeded, so that the action
+ * is not repeated on every check.
+ */
+struct rctl_rule_link {
+	LIST_ENTRY(rctl_rule_link)	rrl_next;
+	struct rctl_rule		*rrl_rule;
+	int				rrl_exceeded;
+};
+
+struct dict {
+	const char	*d_name;
+	int		d_value;
+};
+
+static struct dict subjectnames[] = {
+	{ "process", RCTL_SUBJECT_TYPE_PROCESS },
+	{ "user", RCTL_SUBJECT_TYPE_USER },
+	{ "loginclass", RCTL_SUBJECT_TYPE_LOGINCLASS },
+	{ "jail", RCTL_SUBJECT_TYPE_JAIL },
+	{ NULL, -1 }};
+
+static struct dict resourcenames[] = {
+	{ "cpu", RACCT_CPU },
+	{ "fsize", RACCT_FSIZE },
+	{ "data", RACCT_DATA },
+	{ "stack", RACCT_STACK },
+	{ "core", RACCT_CORE },
+	{ "rss", RACCT_RSS },
+	{ "memlock", RACCT_MEMLOCK },
+	{ "nproc", RACCT_NPROC },
+	{ "nofile", RACCT_NOFILE },
+	{ "sbsize", RACCT_SBSIZE },
+	{ "vmem", RACCT_VMEM },
+	{ "npts", RACCT_NPTS },
+	{ "swap", RACCT_SWAP },
+	{ "nthr", RACCT_NTHR },
+	{ "msgqqueued", RACCT_MSGQQUEUED },
+	{ "msgqsize", RACCT_MSGQSIZE },
+	{ "nmsgq", RACCT_NMSGQ },
+	{ "nsem", RACCT_NSEM },
+	{ "nsemop", RACCT_NSEMOP },
+	{ "nshm", RACCT_NSHM },
+	{ "shmsize", RACCT_SHMSIZE },
+	{ "wallclock", RACCT_WALLCLOCK },
+	{ NULL, -1 }};
+
+static struct dict actionnames[] = {
+	{ "sighup", RCTL_ACTION_SIGHUP },
+	{ "sigint", RCTL_ACTION_SIGINT },
+	{ "sigquit", RCTL_ACTION_SIGQUIT },
+	{ "sigill", RCTL_ACTION_SIGILL },
+	{ "sigtrap", RCTL_ACTION_SIGTRAP },
+	{ "sigabrt", RCTL_ACTION_SIGABRT },
+	{ "sigemt", RCTL_ACTION_SIGEMT },
+	{ "sigfpe", RCTL_ACTION_SIGFPE },
+	{ "sigkill", RCTL_ACTION_SIGKILL },
+	{ "sigbus", RCTL_ACTION_SIGBUS },
+	{ "sigsegv", RCTL_ACTION_SIGSEGV },
+	{ "sigsys", RCTL_ACTION_SIGSYS },
+	{ "sigpipe", RCTL_ACTION_SIGPIPE },
+	{ "sigalrm", RCTL_ACTION_SIGALRM },
+	{ "sigterm", RCTL_ACTION_SIGTERM },
+	{ "sigurg", RCTL_ACTION_SIGURG },
+	{ "sigstop", RCTL_ACTION_SIGSTOP },
+	{ "sigtstp", RCTL_ACTION_SIGTSTP },
+	{ "sigchld", RCTL_ACTION_SIGCHLD },
+	{ "sigttin", RCTL_ACTION_SIGTTIN },
+	{ "sigttou", RCTL_ACTION_SIGTTOU },
+	{ "sigio", RCTL_ACTION_SIGIO },
+	{ "sigxcpu", RCTL_ACTION_SIGXCPU },
+	{ "sigxfsz", RCTL_ACTION_SIGXFSZ },
+	{ "sigvtalrm", RCTL_ACTION_SIGVTALRM },
+	{ "sigprof", RCTL_ACTION_SIGPROF },
+	{ "sigwinch", RCTL_ACTION_SIGWINCH },
+	{ "siginfo", RCTL_ACTION_SIGINFO },
+	{ "sigusr1", RCTL_ACTION_SIGUSR1 },
+	{ "sigusr2", RCTL_ACTION_SIGUSR2 },
+	{ "sigthr", RCTL_ACTION_SIGTHR },
+	{ "deny", RCTL_ACTION_DENY },
+	{ "log", RCTL_ACTION_LOG },
+	{ "devctl", RCTL_ACTION_DEVCTL },
+	{ NULL, -1 }};
+
+static void rctl_init(void);
+SYSINIT(rctl, SI_SUB_RACCT, SI_ORDER_FIRST, rctl_init, NULL);
+
+static uma_zone_t rctl_rule_link_zone;
+static uma_zone_t rctl_rule_zone;
+static struct rwlock rctl_lock;
+RW_SYSINIT(rctl_lock, &rctl_lock, "RCTL lock");
+
+static int rctl_rule_fully_specified(const struct rctl_rule *rule);
+static void rctl_rule_to_sbuf(struct sbuf *sb, const struct rctl_rule *rule);
+
+MALLOC_DEFINE(M_RCTL, "rctl", "Resource Limits");
+
+/*
+ * Translate a subject type value into its name, using the subjectnames
+ * table.  Panics when the value is not in the table.
+ */
+static const char *
+rctl_subject_type_name(int subject)
+{
+	const struct dict *entry;
+
+	for (entry = subjectnames; entry->d_name != NULL; entry++) {
+		if (entry->d_value != subject)
+			continue;
+		return (entry->d_name);
+	}
+
+	panic("rctl_subject_type_name: unknown subject type %d", subject);
+}
+
+/*
+ * Translate an action value into its name, using the actionnames table.
+ * Panics when the value is not in the table.
+ */
+static const char *
+rctl_action_name(int action)
+{
+	const struct dict *entry;
+
+	for (entry = actionnames; entry->d_name != NULL; entry++) {
+		if (entry->d_value != action)
+			continue;
+		return (entry->d_name);
+	}
+
+	panic("rctl_action_name: unknown action %d", action);
+}
+
+/*
+ * Translate a resource value into its name, using the resourcenames
+ * table.  Panics when the value is not in the table.
+ */
+const char *
+rctl_resource_name(int resource)
+{
+	const struct dict *entry;
+
+	for (entry = resourcenames; entry->d_name != NULL; entry++) {
+		if (entry->d_value != resource)
+			continue;
+		return (entry->d_name);
+	}
+
+	panic("rctl_resource_name: unknown resource %d", resource);
+}
+
+/*
+ * Return the amount of resource that can be allocated by 'p' before
+ * hitting 'rule'.
+ *
+ * The current usage is taken from the racct selected by the "per" field
+ * of the rule: the process itself, its real uid, its login class or its
+ * jail.  The result is negative when the usage is already above the
+ * amount specified by the rule.  The rctl_lock must be held.
+ */
+static int64_t
+rctl_available_resource(const struct proc *p, const struct rctl_rule *rule)
+{
+	int resource;
+	int64_t available = INT64_MAX;
+	struct ucred *cred = p->p_ucred;
+
+	rw_assert(&rctl_lock, RA_LOCKED);
+
+	resource = rule->rr_resource;
+	switch (rule->rr_per) {
+	case RCTL_SUBJECT_TYPE_PROCESS:
+		available = rule->rr_amount -
+		    p->p_racct->r_resources[resource];
+		break;
+	case RCTL_SUBJECT_TYPE_USER:
+		available = rule->rr_amount -
+		    cred->cr_ruidinfo->ui_racct->r_resources[resource];
+		break;
+	case RCTL_SUBJECT_TYPE_LOGINCLASS:
+		available = rule->rr_amount -
+		    cred->cr_loginclass->lc_racct->r_resources[resource];
+		break;
+	case RCTL_SUBJECT_TYPE_JAIL:
+		available = rule->rr_amount -
+		    cred->cr_prison->pr_racct->r_resources[resource];
+		break;
+	default:
+		/* Name the function that actually panicked. */
+		panic("rctl_available_resource: unknown per %d",
+		    rule->rr_per);
+	}
+
+	return (available);
+}
+
+/*
+ * Tell whether proc 'p' allocating 'amount' more would go over the
+ * limit set by 'rule'; returns 1 if so and 0 if the allocation fits.
+ */
+static int
+rctl_would_exceed(const struct proc *p, const struct rctl_rule *rule,
+    int64_t amount)
+{
+
+	rw_assert(&rctl_lock, RA_LOCKED);
+
+	return (rctl_available_resource(p, rule) < amount ? 1 : 0);
+}
+
+/*
+ * Check whether the proc 'p' can allocate 'amount' of 'resource' in addition
+ * to what it keeps allocated now.  Returns non-zero if the allocation should
+ * be denied, 0 otherwise.
+ *
+ * Every rule linked to the racct of the process that covers 'resource' and
+ * would be exceeded has its action carried out: "log" prints a message
+ * (rate-limited with ppsratecheck()), "devctl" sends a devctl notification
+ * and the remaining actions deliver a signal to the process.  Those actions
+ * are taken once per link; rrl_exceeded remembers that it was done and is
+ * cleared again when the rule is found not to be exceeded.  "deny" rules
+ * are only noted while walking the list; the non-zero return value is
+ * produced after all the links were examined.
+ */
+int
+rctl_enforce(struct proc *p, int resource, uint64_t amount)
+{
+	struct rctl_rule *rule;
+	struct rctl_rule_link *link;
+	struct sbuf sb;
+	int should_deny = 0;
+	char *buf;
+	static int curtime = 0;
+	static struct timeval lasttime;
+
+	rw_rlock(&rctl_lock);
+
+	/*
+	 * There may be more than one matching rule; go through all of them.
+	 * Denial should be done last, after logging and sending signals.
+	 */
+	LIST_FOREACH(link, &p->p_racct->r_rule_links, rrl_next) {
+		rule = link->rrl_rule;
+		if (rule->rr_resource != resource)
+			continue;
+		if (!rctl_would_exceed(p, rule, amount)) {
+			link->rrl_exceeded = 0;
+			continue;
+		}
+
+		switch (rule->rr_action) {
+		case RCTL_ACTION_DENY:
+			should_deny = 1;
+			continue;
+		case RCTL_ACTION_LOG:
+			/*
+			 * If rrl_exceeded != 0, it means we've already
+			 * logged a warning for this process.
+			 */
+			if (link->rrl_exceeded != 0)
+				continue;
+
+			if (!ppsratecheck(&lasttime, &curtime, 10))
+				continue;
+
+			buf = malloc(RCTL_LOG_BUFSIZE, M_RCTL, M_NOWAIT);
+			if (buf == NULL) {
+				printf("rctl_enforce: out of memory\n");
+				continue;
+			}
+			sbuf_new(&sb, buf, RCTL_LOG_BUFSIZE, SBUF_FIXEDLEN);
+			rctl_rule_to_sbuf(&sb, rule);
+			sbuf_finish(&sb);
+			printf("rctl: rule \"%s\" matched by pid %d "
+			    "(%s), uid %d, jail %s\n", sbuf_data(&sb),
+			    p->p_pid, p->p_comm, p->p_ucred->cr_uid,
+			    p->p_ucred->cr_prison->pr_name);
+			sbuf_delete(&sb);
+			free(buf, M_RCTL);
+			link->rrl_exceeded = 1;
+			continue;
+		case RCTL_ACTION_DEVCTL:
+			if (link->rrl_exceeded != 0)
+				continue;
+
+			buf = malloc(RCTL_LOG_BUFSIZE, M_RCTL, M_NOWAIT);
+			if (buf == NULL) {
+				printf("rctl_enforce: out of memory\n");
+				continue;
+			}
+			sbuf_new(&sb, buf, RCTL_LOG_BUFSIZE, SBUF_FIXEDLEN);
+			sbuf_printf(&sb, "rule=");
+			rctl_rule_to_sbuf(&sb, rule);
+			sbuf_printf(&sb, " pid=%d ruid=%d jail=%s",
+			    p->p_pid, p->p_ucred->cr_ruid,
+			    p->p_ucred->cr_prison->pr_name);
+			sbuf_finish(&sb);
+			devctl_notify_f("RCTL", "rule", "matched",
+			    sbuf_data(&sb), M_NOWAIT);
+			sbuf_delete(&sb);
+			free(buf, M_RCTL);
+			link->rrl_exceeded = 1;
+			continue;
+		default:
+			if (link->rrl_exceeded != 0)
+				continue;
+
+			KASSERT(rule->rr_action > 0 &&
+			    rule->rr_action <= RCTL_ACTION_SIGNAL_MAX,
+			    ("rctl_enforce: unknown action %d",
+			     rule->rr_action));
+
+			/*
+			 * We're using the fact that RCTL_ACTION_SIG* values
+			 * are equal to their counterparts from sys/signal.h.
+			 */
+			psignal(p, rule->rr_action);
+			link->rrl_exceeded = 1;
+			continue;
+		}
+	}
+
+	rw_runlock(&rctl_lock);
+
+	if (should_deny) {
+		/*
+		 * Return fake error code; the caller should change it
+		 * into one proper for the situation - EFSIZ, ENOMEM etc.
+		 */
+		return (EDOOFUS);
+	}
+
+	return (0);
+}
+
+uint64_t
+rctl_get_limit(struct proc *p, int resource)
+{
+	struct rctl_rule *rule;
+	struct rctl_rule_link *link;
+	uint64_t amount = UINT64_MAX;
+
+	rw_rlock(&rctl_lock);
+
+	/*
+	 * There may be more than one matching rule; go through all of them
+	 * and pick the lowest amount.  Only "deny" rules for 'resource' are
+	 * taken into account; UINT64_MAX is returned when there are none.
+	 */
+	LIST_FOREACH(link, &p->p_racct->r_rule_links, rrl_next) {
+		rule = link->rrl_rule;
+		if (rule->rr_resource != resource)
+			continue;
+		if (rule->rr_action != RCTL_ACTION_DENY)
+			continue;
+		if (rule->rr_amount < amount)
+			amount = rule->rr_amount;
+	}
+
+	rw_runlock(&rctl_lock);
+
+	return (amount);
+}
+
+uint64_t
+rctl_get_available(struct proc *p, int resource)
+{
+	struct rctl_rule *rule;
+	struct rctl_rule_link *link;
+	int64_t available, minavailable, allocated;
+
+	minavailable = INT64_MAX;
+
+	rw_rlock(&rctl_lock);
+
+	/*
+	 * There may be more than one matching rule; go through all of them
+	 * and find the smallest amount still available.  Only "deny" rules
+	 * for 'resource' are taken into account.
+	 */
+	LIST_FOREACH(link, &p->p_racct->r_rule_links, rrl_next) {
+		rule = link->rrl_rule;
+		if (rule->rr_resource != resource)
+			continue;
+		if (rule->rr_action != RCTL_ACTION_DENY)
+			continue;
+		available = rctl_available_resource(p, rule);
+		if (available < minavailable)
+			minavailable = available;
+	}
+
+	rw_runlock(&rctl_lock);
+
+	/*
+	 * XXX: Think about this _hard_.
+	 *
+	 * What the process has allocated already is added back to the
+	 * remaining headroom, unless the addition would overflow, and
+	 * the result is never allowed to be negative.
+	 */
+	allocated = p->p_racct->r_resources[resource];
+	if (minavailable < INT64_MAX - allocated)
+		minavailable += allocated;
+	if (minavailable < 0)
+		minavailable = 0;
+	return (minavailable);
+}
+
+/*
+ * Return non-zero if 'rule' matches 'filter'.  Fields left undefined in
+ * the filter, including a NULL subject, match any value in the rule.
+ */
+static int
+rctl_rule_matches(const struct rctl_rule *rule, const struct rctl_rule *filter)
+{
+
+	if (filter->rr_subject_type != RCTL_SUBJECT_TYPE_UNDEFINED) {
+		if (filter->rr_subject_type != rule->rr_subject_type)
+			return (0);
+
+		switch (filter->rr_subject_type) {
+		case RCTL_SUBJECT_TYPE_PROCESS:
+			if (filter->rr_subject.rs_proc != NULL &&
+			    filter->rr_subject.rs_proc !=
+			    rule->rr_subject.rs_proc)
+				return (0);
+			break;
+		case RCTL_SUBJECT_TYPE_USER:
+			if (filter->rr_subject.rs_uip != NULL &&
+			    filter->rr_subject.rs_uip !=
+			    rule->rr_subject.rs_uip)
+				return (0);
+			break;
+		case RCTL_SUBJECT_TYPE_LOGINCLASS:
+			if (filter->rr_subject.hr_loginclass != NULL &&
+			    filter->rr_subject.hr_loginclass !=
+			    rule->rr_subject.hr_loginclass)
+				return (0);
+			break;
+		case RCTL_SUBJECT_TYPE_JAIL:
+			if (filter->rr_subject.rs_prison != NULL &&
+			    filter->rr_subject.rs_prison !=
+			    rule->rr_subject.rs_prison)
+				return (0);
+			break;
+		default:
+			panic("rctl_rule_matches: unknown subject type %d",
+			    filter->rr_subject_type);
+		}
+	}
+
+	if (filter->rr_resource != RACCT_UNDEFINED &&
+	    filter->rr_resource != rule->rr_resource)
+		return (0);
+
+	if (filter->rr_action != RCTL_ACTION_UNDEFINED &&
+	    filter->rr_action != rule->rr_action)
+		return (0);
+
+	if (filter->rr_amount != RCTL_AMOUNT_UNDEFINED &&
+	    filter->rr_amount != rule->rr_amount)
+		return (0);
+
+	if (filter->rr_per != RCTL_SUBJECT_TYPE_UNDEFINED &&
+	    filter->rr_per != rule->rr_per)
+		return (0);
+
+	return (1);
+}
+
+/*
+ * Look 'str' up, ignoring case, in the NULL-terminated 'table' and store
+ * the associated value in '*value'.  Returns 0 on success and EINVAL when
+ * the name is not in the table or 'value' is NULL.
+ */
+static int
+str2value(const char *str, int *value, struct dict *table)
+{
+	struct dict *entry;
+
+	if (value == NULL)
+		return (EINVAL);
+
+	for (entry = table; entry->d_name != NULL; entry++) {
+		if (strcasecmp(entry->d_name, str) != 0)
+			continue;
+		*value = entry->d_value;
+		return (0);
+	}
+
+	return (EINVAL);
+}
+
+/*
+ * Parse 'str' as a decimal number and store it in '*value'.  Returns
+ * EINVAL if 'str' is NULL or is followed by anything but the number.
+ */
+static int
+str2id(const char *str, id_t *value)
+{
+	char *endp;
+
+	if (str == NULL)
+		return (EINVAL);
+
+	*value = strtoul(str, &endp, 10);
+
+	/* The whole string must have been consumed by the conversion. */
+	if (*endp != '\0')
+		return (EINVAL);
+
+	return (0);
+}
+
+/*
+ * Parse 'str' as a decimal number and store it in '*value'.  Returns
+ * EINVAL if 'str' is NULL or is followed by anything but the number.
+ */
+static int
+str2int64(const char *str, int64_t *value)
+{
+	char *end;
+
+	if (str == NULL)
+		return (EINVAL);
+
+	/*
+	 * Use the 64-bit conversion; strtoul() works on unsigned long,
+	 * which is only 32 bits wide on ILP32 platforms and would not
+	 * let amounts above 4G be specified there.
+	 */
+	*value = strtoq(str, &end, 10);
+	if (*end != '\0')
+		return (EINVAL);
+
+	return (0);
+}
+
+/*
+ * Link 'rule' to 'racct'; the link holds its own reference on the rule.
+ * The link is allocated with M_WAITOK and the rctl_lock is taken here
+ * for the list insertion.
+ */
+static void
+rctl_racct_add_rule(struct racct *racct, struct rctl_rule *rule)
+{
+	struct rctl_rule_link *newlink;
+
+	KASSERT(rctl_rule_fully_specified(rule), ("rule not fully specified"));
+
+	newlink = uma_zalloc(rctl_rule_link_zone, M_WAITOK);
+	rctl_rule_acquire(rule);
+	newlink->rrl_exceeded = 0;
+	newlink->rrl_rule = rule;
+
+	rw_wlock(&rctl_lock);
+	LIST_INSERT_HEAD(&racct->r_rule_links, newlink, rrl_next);
+	rw_wunlock(&rctl_lock);
+}
+
+/*
+ * Variant of rctl_racct_add_rule() for callers that already hold the
+ * rctl_lock for writing.  The link is allocated with M_NOWAIT; ENOMEM
+ * is returned, and no reference is taken, when that fails.
+ */
+static int
+rctl_racct_add_rule_locked(struct racct *racct, struct rctl_rule *rule)
+{
+	struct rctl_rule_link *newlink;
+
+	KASSERT(rctl_rule_fully_specified(rule), ("rule not fully specified"));
+	rw_assert(&rctl_lock, RA_WLOCKED);
+
+	newlink = uma_zalloc(rctl_rule_link_zone, M_NOWAIT);
+	if (newlink == NULL)
+		return (ENOMEM);
+
+	rctl_rule_acquire(rule);
+	newlink->rrl_exceeded = 0;
+	newlink->rrl_rule = rule;
+	LIST_INSERT_HEAD(&racct->r_rule_links, newlink, rrl_next);
+
+	return (0);
+}
+
+/*
+ * Remove the links for the rules matching the filter from 'racct' and
+ * release the references they held on the rules, possibly freeing them.
+ * Returns the number of links removed.  The rctl_lock must be held
+ * for writing.
+ */
+static int
+rctl_racct_remove_rules(struct racct *racct,
+    const struct rctl_rule *filter)
+{
+	int removed = 0;
+	struct rctl_rule_link *link, *linktmp;
+
+	rw_assert(&rctl_lock, RA_WLOCKED);
+
+	LIST_FOREACH_SAFE(link, &racct->r_rule_links, rrl_next, linktmp) {
+		if (!rctl_rule_matches(link->rrl_rule, filter))
+			continue;
+
+		LIST_REMOVE(link, rrl_next);
+		rctl_rule_release(link->rrl_rule);
+		uma_zfree(rctl_rule_link_zone, link);
+		removed++;
+	}
+	return (removed);
+}
+
+/*
+ * Take a reference on the uidinfo or the loginclass the rule points at,
+ * if there is one.  Nothing is done for the other subject types.
+ */
+static void
+rctl_rule_acquire_subject(struct rctl_rule *rule)
+{
+
+	switch (rule->rr_subject_type) {
+	case RCTL_SUBJECT_TYPE_USER:
+		if (rule->rr_subject.rs_uip != NULL)
+			uihold(rule->rr_subject.rs_uip);
+		return;
+	case RCTL_SUBJECT_TYPE_LOGINCLASS:
+		if (rule->rr_subject.hr_loginclass != NULL)
+			loginclass_hold(rule->rr_subject.hr_loginclass);
+		return;
+	case RCTL_SUBJECT_TYPE_UNDEFINED:
+	case RCTL_SUBJECT_TYPE_PROCESS:
+	case RCTL_SUBJECT_TYPE_JAIL:
+		return;
+	default:
+		panic("rctl_rule_acquire_subject: unknown subject type %d",
+		    rule->rr_subject_type);
+	}
+}
+
+/*
+ * Drop the reference on the uidinfo or the loginclass the rule points
+ * at, if there is one.  Nothing is done for the other subject types.
+ */
+static void
+rctl_rule_release_subject(struct rctl_rule *rule)
+{
+
+	switch (rule->rr_subject_type) {
+	case RCTL_SUBJECT_TYPE_USER:
+		if (rule->rr_subject.rs_uip != NULL)
+			uifree(rule->rr_subject.rs_uip);
+		return;
+	case RCTL_SUBJECT_TYPE_LOGINCLASS:
+		if (rule->rr_subject.hr_loginclass != NULL)
+			loginclass_free(rule->rr_subject.hr_loginclass);
+		return;
+	case RCTL_SUBJECT_TYPE_UNDEFINED:
+	case RCTL_SUBJECT_TYPE_PROCESS:
+	case RCTL_SUBJECT_TYPE_JAIL:
+		return;
+	default:
+		panic("rctl_rule_release_subject: unknown subject type %d",
+		    rule->rr_subject_type);
+	}
+}
+
+/*
+ * Allocate a rule with every field undefined and a reference count
+ * of one.  'flags' is passed to uma_zalloc(); NULL is returned when
+ * the allocation fails.
+ */
+struct rctl_rule *
+rctl_rule_alloc(int flags)
+{
+	struct rctl_rule *newrule;
+
+	newrule = uma_zalloc(rctl_rule_zone, flags);
+	if (newrule == NULL)
+		return (NULL);
+
+	/* No subject yet. */
+	newrule->rr_subject_type = RCTL_SUBJECT_TYPE_UNDEFINED;
+	newrule->rr_subject.rs_proc = NULL;
+	newrule->rr_subject.rs_uip = NULL;
+	newrule->rr_subject.hr_loginclass = NULL;
+	newrule->rr_subject.rs_prison = NULL;
+
+	/* No limit yet, either. */
+	newrule->rr_per = RCTL_SUBJECT_TYPE_UNDEFINED;
+	newrule->rr_resource = RACCT_UNDEFINED;
+	newrule->rr_action = RCTL_ACTION_UNDEFINED;
+	newrule->rr_amount = RCTL_AMOUNT_UNDEFINED;
+
+	refcount_init(&newrule->rr_refcount, 1);
+
+	return (newrule);
+}
+
+/*
+ * Return a copy of 'rule' with a reference count of one.  The copy takes
+ * its own reference on the subject.  'flags' is passed to uma_zalloc();
+ * NULL is returned when the allocation fails.
+ */
+struct rctl_rule *
+rctl_rule_duplicate(const struct rctl_rule *rule, int flags)
+{
+	struct rctl_rule *dup;
+
+	dup = uma_zalloc(rctl_rule_zone, flags);
+	if (dup == NULL)
+		return (NULL);
+
+	dup->rr_subject_type = rule->rr_subject_type;
+	dup->rr_subject.rs_proc = rule->rr_subject.rs_proc;
+	dup->rr_subject.rs_uip = rule->rr_subject.rs_uip;
+	dup->rr_subject.hr_loginclass = rule->rr_subject.hr_loginclass;
+	dup->rr_subject.rs_prison = rule->rr_subject.rs_prison;
+
+	dup->rr_per = rule->rr_per;
+	dup->rr_resource = rule->rr_resource;
+	dup->rr_action = rule->rr_action;
+	dup->rr_amount = rule->rr_amount;
+
+	refcount_init(&dup->rr_refcount, 1);
+	rctl_rule_acquire_subject(dup);
+
+	return (dup);
+}
+
+/*
+ * Take an additional reference on a rule that is already referenced.
+ */
+void
+rctl_rule_acquire(struct rctl_rule *rule)
+{
+
+	KASSERT(rule->rr_refcount > 0, ("rule->rr_refcount <= 0"));
+	refcount_acquire(&rule->rr_refcount);
+}
+
+/*
+ * Task handler queued by rctl_rule_release() when the last reference is
+ * dropped; 'context' is the rule to free.  Releases the subject and
+ * returns the rule to its zone.
+ */
+static void
+rctl_rule_free(void *context, int pending)
+{
+	struct rctl_rule *rule = context;
+
+	KASSERT(rule->rr_refcount == 0, ("rule->rr_refcount != 0"));
+
+	/*
+	 * No locking is required at this point, as nothing else can
+	 * reach the rule anymore.
+	 */
+	rctl_rule_release_subject(rule);
+	uma_zfree(rctl_rule_zone, rule);
+}
+
+/*
+ * Drop a reference on the rule; once the last one is gone, the rule
+ * is handed to rctl_rule_free() through a taskqueue.
+ */
+void
+rctl_rule_release(struct rctl_rule *rule)
+{
+
+	KASSERT(rule->rr_refcount > 0, ("rule->rr_refcount <= 0"));
+
+	if (!refcount_release(&rule->rr_refcount))
+		return;
+
+	/*
+	 * This function tends to be called while walking all the
+	 * uidinfo structures in the system with uihashtbl_lock held.
+	 * rctl_rule_free() may call uifree(), which would recurse on
+	 * that lock, so the actual freeing is deferred to a taskqueue.
+	 */
+	TASK_INIT(&rule->rr_task, 0, rctl_rule_free, rule);
+	taskqueue_enqueue(taskqueue_thread, &rule->rr_task);
+}
+
+/*
+ * Return non-zero if none of the fields of the rule - subject type,
+ * subject, resource, action, amount and "per" - was left undefined.
+ */
+static int
+rctl_rule_fully_specified(const struct rctl_rule *rule)
+{
+
+	switch (rule->rr_subject_type) {
+	case RCTL_SUBJECT_TYPE_UNDEFINED:
+		return (0);
+	case RCTL_SUBJECT_TYPE_PROCESS:
+		if (rule->rr_subject.rs_proc == NULL)
+			return (0);
+		break;
+	case RCTL_SUBJECT_TYPE_USER:
+		if (rule->rr_subject.rs_uip == NULL)
+			return (0);
+		break;
+	case RCTL_SUBJECT_TYPE_LOGINCLASS:
+		if (rule->rr_subject.hr_loginclass == NULL)
+			return (0);
+		break;
+	case RCTL_SUBJECT_TYPE_JAIL:
+		if (rule->rr_subject.rs_prison == NULL)
+			return (0);
+		break;
+	default:
+		panic("rctl_rule_fully_specified: unknown subject type %d",
+		    rule->rr_subject_type);
+	}
+
+	/* The subject is there; the rest of the rule has to be, too. */
+	return (rule->rr_resource != RACCT_UNDEFINED &&
+	    rule->rr_action != RCTL_ACTION_UNDEFINED &&
+	    rule->rr_amount != RCTL_AMOUNT_UNDEFINED &&
+	    rule->rr_per != RCTL_SUBJECT_TYPE_UNDEFINED);
+}
+
+static int
+rctl_string_to_rule(char *rulestr, struct rctl_rule **rulep)
+{
+	int error = 0;
+	char *subjectstr, *subject_idstr, *resourcestr, *actionstr,
+	     *amountstr, *perstr;
+	struct rctl_rule *rule;
+	id_t id;
+
+	rule = rctl_rule_alloc(M_WAITOK);
+
+	subjectstr = strsep(&rulestr, ":");
+	subject_idstr = strsep(&rulestr, ":");
+	resourcestr = strsep(&rulestr, ":");
+	actionstr = strsep(&rulestr, "=/");
+	amountstr = strsep(&rulestr, "/");
+	perstr = rulestr;
+
+	if (subjectstr == NULL || subjectstr[0] == '\0')
+		rule->rr_subject_type = RCTL_SUBJECT_TYPE_UNDEFINED;
+	else {
+		error = str2value(subjectstr, &rule->rr_subject_type, subjectnames);
+		if (error != 0)
+			goto out;
+	}
+
+	if (subject_idstr == NULL || subject_idstr[0] == '\0') {
+		rule->rr_subject.rs_proc = NULL;
+		rule->rr_subject.rs_uip = NULL;
+		rule->rr_subject.hr_loginclass = NULL;
+		rule->rr_subject.rs_prison = NULL;
+	} else {
+		switch (rule->rr_subject_type) {
+		case RCTL_SUBJECT_TYPE_UNDEFINED:
+			error = EINVAL;
+			goto out;
+		case RCTL_SUBJECT_TYPE_PROCESS:
+			error = str2id(subject_idstr, &id);
+			if (error != 0)
+				goto out;
+			sx_assert(&allproc_lock, SA_LOCKED);
+			rule->rr_subject.rs_proc = pfind(id);
+			if (rule->rr_subject.rs_proc == NULL) {
+				error = ESRCH;
+				goto out;
+			}
+			PROC_UNLOCK(rule->rr_subject.rs_proc);
+			break;
+		case RCTL_SUBJECT_TYPE_USER:
+			error = str2id(subject_idstr, &id);
+			if (error != 0)
+				goto out;
+			rule->rr_subject.rs_uip = uifind(id);
+			break;
+		case RCTL_SUBJECT_TYPE_LOGINCLASS:
+			rule->rr_subject.hr_loginclass =
+			    loginclass_find(subject_idstr);
+			if (rule->rr_subject.hr_loginclass == NULL) {
+				error = ENAMETOOLONG;
+				goto out;
+			}
+			break;
+		case RCTL_SUBJECT_TYPE_JAIL:
+			rule->rr_subject.rs_prison =
+			    prison_find_name(&prison0, subject_idstr);
+			if (rule->rr_subject.rs_prison == NULL) {
+				/*
+				 * No jail with that name; try with the JID.
+				 */
+				error = str2id(subject_idstr, &id);
+				if (error != 0)
+					goto out;
+				rule->rr_subject.rs_prison = prison_find(id);
+				if (rule->rr_subject.rs_prison == NULL) {
+					error = ESRCH;
+					goto out;
+				}
+			}
+			/* prison_find() returns with mutex held. */
+			mtx_unlock(&rule->rr_subject.rs_prison->pr_mtx);
+			break;
+               default:
+                       panic("rctl_string_to_rule: unknown subject type %d",
+                           rule->rr_subject_type);
+               }
+	}
+
+	if (resourcestr == NULL || resourcestr[0] == '\0')
+		rule->rr_resource = RACCT_UNDEFINED;
+	else {
+		error = str2value(resourcestr, &rule->rr_resource,
+		    resourcenames);
+		if (error != 0)
+			goto out;
+	}
+
+	if (actionstr == NULL || actionstr[0] == '\0')
+		rule->rr_action = RCTL_ACTION_UNDEFINED;
+	else {
+		error = str2value(actionstr, &rule->rr_action, actionnames);
+		if (error != 0)
+			goto out;
+	}
+
+	if (amountstr == NULL || amountstr[0] == '\0')
+		rule->rr_amount = RCTL_AMOUNT_UNDEFINED;
+	else {
+		error = str2int64(amountstr, &rule->rr_amount);
+		if (error != 0)
+			goto out;
+		if (racct_is_in_thousands(rule->rr_resource))
+			rule->rr_amount *= 1000;
+	}
+
+	if (perstr == NULL || perstr[0] == '\0')
+		rule->rr_per = RCTL_SUBJECT_TYPE_UNDEFINED;
+	else {

*** DIFF OUTPUT TRUNCATED AT 1000 LINES ***



Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?201103301748.p2UHmF0g070602>