| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 1 | #ifndef _LINUX_CGROUP_H | 
 | 2 | #define _LINUX_CGROUP_H | 
 | 3 | /* | 
 | 4 |  *  cgroup interface | 
 | 5 |  * | 
 | 6 |  *  Copyright (C) 2003 BULL SA | 
 | 7 |  *  Copyright (C) 2004-2006 Silicon Graphics, Inc. | 
 | 8 |  * | 
 | 9 |  */ | 
 | 10 |  | 
 | 11 | #include <linux/sched.h> | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 12 | #include <linux/cpumask.h> | 
 | 13 | #include <linux/nodemask.h> | 
 | 14 | #include <linux/rcupdate.h> | 
| Balbir Singh | 846c7bb | 2007-10-18 23:39:44 -0700 | [diff] [blame] | 15 | #include <linux/cgroupstats.h> | 
| Cliff Wickman | 31a7df0 | 2008-02-07 00:14:42 -0800 | [diff] [blame] | 16 | #include <linux/prio_heap.h> | 
| Paul Menage | cc31edc | 2008-10-18 20:28:04 -0700 | [diff] [blame] | 17 | #include <linux/rwsem.h> | 
| KAMEZAWA Hiroyuki | 38460b4 | 2009-04-02 16:57:25 -0700 | [diff] [blame] | 18 | #include <linux/idr.h> | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 19 |  | 
 | 20 | #ifdef CONFIG_CGROUPS | 
 | 21 |  | 
 | 22 | struct cgroupfs_root; | 
 | 23 | struct cgroup_subsys; | 
 | 24 | struct inode; | 
| Paul Menage | 84eea84 | 2008-07-25 01:47:00 -0700 | [diff] [blame] | 25 | struct cgroup; | 
| KAMEZAWA Hiroyuki | 38460b4 | 2009-04-02 16:57:25 -0700 | [diff] [blame] | 26 | struct css_id; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 27 |  | 
 | 28 | extern int cgroup_init_early(void); | 
 | 29 | extern int cgroup_init(void); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 30 | extern void cgroup_lock(void); | 
| Paul Menage | 84eea84 | 2008-07-25 01:47:00 -0700 | [diff] [blame] | 31 | extern bool cgroup_lock_live_group(struct cgroup *cgrp); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 32 | extern void cgroup_unlock(void); | 
| Paul Menage | b4f48b6 | 2007-10-18 23:39:33 -0700 | [diff] [blame] | 33 | extern void cgroup_fork(struct task_struct *p); | 
 | 34 | extern void cgroup_fork_callbacks(struct task_struct *p); | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 35 | extern void cgroup_post_fork(struct task_struct *p); | 
| Paul Menage | b4f48b6 | 2007-10-18 23:39:33 -0700 | [diff] [blame] | 36 | extern void cgroup_exit(struct task_struct *p, int run_callbacks); | 
| Balbir Singh | 846c7bb | 2007-10-18 23:39:44 -0700 | [diff] [blame] | 37 | extern int cgroupstats_build(struct cgroupstats *stats, | 
 | 38 | 				struct dentry *dentry); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 39 |  | 
| Paul Menage | a424316 | 2007-10-18 23:39:35 -0700 | [diff] [blame] | 40 | extern struct file_operations proc_cgroup_operations; | 
 | 41 |  | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 42 | /* Define the enumeration of all cgroup subsystems */ | 
 | 43 | #define SUBSYS(_x) _x ## _subsys_id, | 
 | 44 | enum cgroup_subsys_id { | 
 | 45 | #include <linux/cgroup_subsys.h> | 
 | 46 | 	CGROUP_SUBSYS_COUNT | 
 | 47 | }; | 
 | 48 | #undef SUBSYS | 
 | 49 |  | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 50 | /* Per-subsystem/per-cgroup state maintained by the system. */ | 
 | 51 | struct cgroup_subsys_state { | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 52 | 	/* | 
 | 53 | 	 * The cgroup that this subsystem is attached to. Useful | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 54 | 	 * for subsystems that want to know about the cgroup | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 55 | 	 * hierarchy structure | 
 | 56 | 	 */ | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 57 | 	struct cgroup *cgroup; | 
 | 58 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 59 | 	/* | 
 | 60 | 	 * State maintained by the cgroup system to allow subsystems | 
| Paul Menage | e7c5ec9 | 2009-01-07 18:08:38 -0800 | [diff] [blame] | 61 | 	 * to be "busy". Should be accessed via css_get(), | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 62 | 	 * css_tryget() and and css_put(). | 
 | 63 | 	 */ | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 64 |  | 
 | 65 | 	atomic_t refcnt; | 
 | 66 |  | 
 | 67 | 	unsigned long flags; | 
| KAMEZAWA Hiroyuki | 38460b4 | 2009-04-02 16:57:25 -0700 | [diff] [blame] | 68 | 	/* ID for this css, if possible */ | 
 | 69 | 	struct css_id *id; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 70 | }; | 
 | 71 |  | 
 | 72 | /* bits in struct cgroup_subsys_state flags field */ | 
 | 73 | enum { | 
 | 74 | 	CSS_ROOT, /* This CSS is the root of the subsystem */ | 
| Paul Menage | e7c5ec9 | 2009-01-07 18:08:38 -0800 | [diff] [blame] | 75 | 	CSS_REMOVED, /* This CSS is dead */ | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 76 | }; | 
 | 77 |  | 
 | 78 | /* | 
| Paul Menage | e7c5ec9 | 2009-01-07 18:08:38 -0800 | [diff] [blame] | 79 |  * Call css_get() to hold a reference on the css; it can be used | 
 | 80 |  * for a reference obtained via: | 
 | 81 |  * - an existing ref-counted reference to the css | 
 | 82 |  * - task->cgroups for a locked task | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 83 |  */ | 
 | 84 |  | 
 | 85 | static inline void css_get(struct cgroup_subsys_state *css) | 
 | 86 | { | 
 | 87 | 	/* We don't need to reference count the root state */ | 
 | 88 | 	if (!test_bit(CSS_ROOT, &css->flags)) | 
 | 89 | 		atomic_inc(&css->refcnt); | 
 | 90 | } | 
| Paul Menage | e7c5ec9 | 2009-01-07 18:08:38 -0800 | [diff] [blame] | 91 |  | 
 | 92 | static inline bool css_is_removed(struct cgroup_subsys_state *css) | 
 | 93 | { | 
 | 94 | 	return test_bit(CSS_REMOVED, &css->flags); | 
 | 95 | } | 
 | 96 |  | 
 | 97 | /* | 
 | 98 |  * Call css_tryget() to take a reference on a css if your existing | 
 | 99 |  * (known-valid) reference isn't already ref-counted. Returns false if | 
 | 100 |  * the css has been destroyed. | 
 | 101 |  */ | 
 | 102 |  | 
 | 103 | static inline bool css_tryget(struct cgroup_subsys_state *css) | 
 | 104 | { | 
 | 105 | 	if (test_bit(CSS_ROOT, &css->flags)) | 
 | 106 | 		return true; | 
 | 107 | 	while (!atomic_inc_not_zero(&css->refcnt)) { | 
 | 108 | 		if (test_bit(CSS_REMOVED, &css->flags)) | 
 | 109 | 			return false; | 
| Paul Menage | 804b3c2 | 2009-01-29 14:25:21 -0800 | [diff] [blame] | 110 | 		cpu_relax(); | 
| Paul Menage | e7c5ec9 | 2009-01-07 18:08:38 -0800 | [diff] [blame] | 111 | 	} | 
 | 112 | 	return true; | 
 | 113 | } | 
 | 114 |  | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 115 | /* | 
 | 116 |  * css_put() should be called to release a reference taken by | 
| Paul Menage | e7c5ec9 | 2009-01-07 18:08:38 -0800 | [diff] [blame] | 117 |  * css_get() or css_tryget() | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 118 |  */ | 
 | 119 |  | 
| Paul Menage | 81a6a5c | 2007-10-18 23:39:38 -0700 | [diff] [blame] | 120 | extern void __css_put(struct cgroup_subsys_state *css); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 121 | static inline void css_put(struct cgroup_subsys_state *css) | 
 | 122 | { | 
 | 123 | 	if (!test_bit(CSS_ROOT, &css->flags)) | 
| Paul Menage | 81a6a5c | 2007-10-18 23:39:38 -0700 | [diff] [blame] | 124 | 		__css_put(css); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 125 | } | 
 | 126 |  | 
| Paul Menage | 3116f0e | 2008-04-29 01:00:04 -0700 | [diff] [blame] | 127 | /* bits in struct cgroup flags field */ | 
 | 128 | enum { | 
 | 129 | 	/* Control Group is dead */ | 
 | 130 | 	CGRP_REMOVED, | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 131 | 	/* | 
 | 132 | 	 * Control Group has previously had a child cgroup or a task, | 
 | 133 | 	 * but no longer (only if CGRP_NOTIFY_ON_RELEASE is set) | 
 | 134 | 	 */ | 
| Paul Menage | 3116f0e | 2008-04-29 01:00:04 -0700 | [diff] [blame] | 135 | 	CGRP_RELEASABLE, | 
 | 136 | 	/* Control Group requires release notifications to userspace */ | 
 | 137 | 	CGRP_NOTIFY_ON_RELEASE, | 
| KAMEZAWA Hiroyuki | ec64f51 | 2009-04-02 16:57:26 -0700 | [diff] [blame] | 138 | 	/* | 
 | 139 | 	 * A thread in rmdir() is wating for this cgroup. | 
 | 140 | 	 */ | 
 | 141 | 	CGRP_WAIT_ON_RMDIR, | 
| Paul Menage | 3116f0e | 2008-04-29 01:00:04 -0700 | [diff] [blame] | 142 | }; | 
 | 143 |  | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 144 | struct cgroup { | 
 | 145 | 	unsigned long flags;		/* "unsigned long" so bitops work */ | 
 | 146 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 147 | 	/* | 
 | 148 | 	 * count users of this cgroup. >0 means busy, but doesn't | 
 | 149 | 	 * necessarily indicate the number of tasks in the cgroup | 
 | 150 | 	 */ | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 151 | 	atomic_t count; | 
 | 152 |  | 
 | 153 | 	/* | 
 | 154 | 	 * We link our 'sibling' struct into our parent's 'children'. | 
 | 155 | 	 * Our children link their 'sibling' into our 'children'. | 
 | 156 | 	 */ | 
 | 157 | 	struct list_head sibling;	/* my parent's children */ | 
 | 158 | 	struct list_head children;	/* my children */ | 
 | 159 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 160 | 	struct cgroup *parent;		/* my parent */ | 
| Paul Menage | a47295e | 2009-01-07 18:07:44 -0800 | [diff] [blame] | 161 | 	struct dentry *dentry;	  	/* cgroup fs entry, RCU protected */ | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 162 |  | 
 | 163 | 	/* Private pointers for each registered subsystem */ | 
 | 164 | 	struct cgroup_subsys_state *subsys[CGROUP_SUBSYS_COUNT]; | 
 | 165 |  | 
 | 166 | 	struct cgroupfs_root *root; | 
 | 167 | 	struct cgroup *top_cgroup; | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 168 |  | 
 | 169 | 	/* | 
 | 170 | 	 * List of cg_cgroup_links pointing at css_sets with | 
 | 171 | 	 * tasks in this cgroup. Protected by css_set_lock | 
 | 172 | 	 */ | 
 | 173 | 	struct list_head css_sets; | 
| Paul Menage | 81a6a5c | 2007-10-18 23:39:38 -0700 | [diff] [blame] | 174 |  | 
 | 175 | 	/* | 
 | 176 | 	 * Linked list running through all cgroups that can | 
 | 177 | 	 * potentially be reaped by the release agent. Protected by | 
 | 178 | 	 * release_list_lock | 
 | 179 | 	 */ | 
 | 180 | 	struct list_head release_list; | 
| Paul Menage | cc31edc | 2008-10-18 20:28:04 -0700 | [diff] [blame] | 181 |  | 
 | 182 | 	/* pids_mutex protects the fields below */ | 
 | 183 | 	struct rw_semaphore pids_mutex; | 
 | 184 | 	/* Array of process ids in the cgroup */ | 
 | 185 | 	pid_t *tasks_pids; | 
 | 186 | 	/* How many files are using the current tasks_pids array */ | 
 | 187 | 	int pids_use_count; | 
 | 188 | 	/* Length of the current tasks_pids array */ | 
 | 189 | 	int pids_length; | 
| Paul Menage | a47295e | 2009-01-07 18:07:44 -0800 | [diff] [blame] | 190 |  | 
 | 191 | 	/* For RCU-protected deletion */ | 
 | 192 | 	struct rcu_head rcu_head; | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 193 | }; | 
 | 194 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 195 | /* | 
 | 196 |  * A css_set is a structure holding pointers to a set of | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 197 |  * cgroup_subsys_state objects. This saves space in the task struct | 
 | 198 |  * object and speeds up fork()/exit(), since a single inc/dec and a | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 199 |  * list_add()/del() can bump the reference count on the entire cgroup | 
 | 200 |  * set for a task. | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 201 |  */ | 
 | 202 |  | 
 | 203 | struct css_set { | 
 | 204 |  | 
 | 205 | 	/* Reference count */ | 
| Lai Jiangshan | 146aa1b | 2008-10-18 20:28:03 -0700 | [diff] [blame] | 206 | 	atomic_t refcount; | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 207 |  | 
 | 208 | 	/* | 
| Li Zefan | 472b105 | 2008-04-29 01:00:11 -0700 | [diff] [blame] | 209 | 	 * List running through all cgroup groups in the same hash | 
 | 210 | 	 * slot. Protected by css_set_lock | 
 | 211 | 	 */ | 
 | 212 | 	struct hlist_node hlist; | 
 | 213 |  | 
 | 214 | 	/* | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 215 | 	 * List running through all tasks using this cgroup | 
 | 216 | 	 * group. Protected by css_set_lock | 
 | 217 | 	 */ | 
 | 218 | 	struct list_head tasks; | 
 | 219 |  | 
 | 220 | 	/* | 
 | 221 | 	 * List of cg_cgroup_link objects on link chains from | 
 | 222 | 	 * cgroups referenced from this css_set. Protected by | 
 | 223 | 	 * css_set_lock | 
 | 224 | 	 */ | 
 | 225 | 	struct list_head cg_links; | 
 | 226 |  | 
 | 227 | 	/* | 
 | 228 | 	 * Set of subsystem states, one for each subsystem. This array | 
 | 229 | 	 * is immutable after creation apart from the init_css_set | 
 | 230 | 	 * during subsystem registration (at boot time). | 
 | 231 | 	 */ | 
 | 232 | 	struct cgroup_subsys_state *subsys[CGROUP_SUBSYS_COUNT]; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 233 | }; | 
 | 234 |  | 
| Paul Menage | 9179656 | 2008-04-29 01:00:01 -0700 | [diff] [blame] | 235 | /* | 
 | 236 |  * cgroup_map_cb is an abstract callback API for reporting map-valued | 
 | 237 |  * control files | 
 | 238 |  */ | 
 | 239 |  | 
 | 240 | struct cgroup_map_cb { | 
 | 241 | 	int (*fill)(struct cgroup_map_cb *cb, const char *key, u64 value); | 
 | 242 | 	void *state; | 
 | 243 | }; | 
 | 244 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 245 | /* | 
 | 246 |  * struct cftype: handler definitions for cgroup control files | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 247 |  * | 
 | 248 |  * When reading/writing to a file: | 
| Li Zefan | a043e3b | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 249 |  *	- the cgroup to use is file->f_dentry->d_parent->d_fsdata | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 250 |  *	- the 'cftype' of the file is file->f_dentry->d_fsdata | 
 | 251 |  */ | 
 | 252 |  | 
 | 253 | #define MAX_CFTYPE_NAME 64 | 
 | 254 | struct cftype { | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 255 | 	/* | 
 | 256 | 	 * By convention, the name should begin with the name of the | 
 | 257 | 	 * subsystem, followed by a period | 
 | 258 | 	 */ | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 259 | 	char name[MAX_CFTYPE_NAME]; | 
 | 260 | 	int private; | 
| Li Zefan | 099fca3 | 2009-04-02 16:57:29 -0700 | [diff] [blame] | 261 | 	/* | 
 | 262 | 	 * If not 0, file mode is set to this value, otherwise it will | 
 | 263 | 	 * be figured out automatically | 
 | 264 | 	 */ | 
 | 265 | 	mode_t mode; | 
| Paul Menage | db3b149 | 2008-07-25 01:46:58 -0700 | [diff] [blame] | 266 |  | 
 | 267 | 	/* | 
 | 268 | 	 * If non-zero, defines the maximum length of string that can | 
 | 269 | 	 * be passed to write_string; defaults to 64 | 
 | 270 | 	 */ | 
 | 271 | 	size_t max_write_len; | 
 | 272 |  | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 273 | 	int (*open)(struct inode *inode, struct file *file); | 
 | 274 | 	ssize_t (*read)(struct cgroup *cgrp, struct cftype *cft, | 
 | 275 | 			struct file *file, | 
 | 276 | 			char __user *buf, size_t nbytes, loff_t *ppos); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 277 | 	/* | 
| Paul Menage | f4c753b | 2008-04-29 00:59:56 -0700 | [diff] [blame] | 278 | 	 * read_u64() is a shortcut for the common case of returning a | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 279 | 	 * single integer. Use it in place of read() | 
 | 280 | 	 */ | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 281 | 	u64 (*read_u64)(struct cgroup *cgrp, struct cftype *cft); | 
| Paul Menage | 9179656 | 2008-04-29 01:00:01 -0700 | [diff] [blame] | 282 | 	/* | 
| Paul Menage | e73d2c6 | 2008-04-29 01:00:06 -0700 | [diff] [blame] | 283 | 	 * read_s64() is a signed version of read_u64() | 
 | 284 | 	 */ | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 285 | 	s64 (*read_s64)(struct cgroup *cgrp, struct cftype *cft); | 
| Paul Menage | e73d2c6 | 2008-04-29 01:00:06 -0700 | [diff] [blame] | 286 | 	/* | 
| Paul Menage | 9179656 | 2008-04-29 01:00:01 -0700 | [diff] [blame] | 287 | 	 * read_map() is used for defining a map of key/value | 
 | 288 | 	 * pairs. It should call cb->fill(cb, key, value) for each | 
 | 289 | 	 * entry. The key/value pairs (and their ordering) should not | 
 | 290 | 	 * change between reboots. | 
 | 291 | 	 */ | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 292 | 	int (*read_map)(struct cgroup *cont, struct cftype *cft, | 
 | 293 | 			struct cgroup_map_cb *cb); | 
| Serge E. Hallyn | 29486df | 2008-04-29 01:00:14 -0700 | [diff] [blame] | 294 | 	/* | 
 | 295 | 	 * read_seq_string() is used for outputting a simple sequence | 
 | 296 | 	 * using seqfile. | 
 | 297 | 	 */ | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 298 | 	int (*read_seq_string)(struct cgroup *cont, struct cftype *cft, | 
 | 299 | 			       struct seq_file *m); | 
| Paul Menage | 9179656 | 2008-04-29 01:00:01 -0700 | [diff] [blame] | 300 |  | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 301 | 	ssize_t (*write)(struct cgroup *cgrp, struct cftype *cft, | 
 | 302 | 			 struct file *file, | 
 | 303 | 			 const char __user *buf, size_t nbytes, loff_t *ppos); | 
| Paul Menage | 355e0c4 | 2007-10-18 23:39:33 -0700 | [diff] [blame] | 304 |  | 
 | 305 | 	/* | 
| Paul Menage | f4c753b | 2008-04-29 00:59:56 -0700 | [diff] [blame] | 306 | 	 * write_u64() is a shortcut for the common case of accepting | 
| Paul Menage | 355e0c4 | 2007-10-18 23:39:33 -0700 | [diff] [blame] | 307 | 	 * a single integer (as parsed by simple_strtoull) from | 
 | 308 | 	 * userspace. Use in place of write(); return 0 or error. | 
 | 309 | 	 */ | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 310 | 	int (*write_u64)(struct cgroup *cgrp, struct cftype *cft, u64 val); | 
| Paul Menage | e73d2c6 | 2008-04-29 01:00:06 -0700 | [diff] [blame] | 311 | 	/* | 
 | 312 | 	 * write_s64() is a signed version of write_u64() | 
 | 313 | 	 */ | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 314 | 	int (*write_s64)(struct cgroup *cgrp, struct cftype *cft, s64 val); | 
| Paul Menage | 355e0c4 | 2007-10-18 23:39:33 -0700 | [diff] [blame] | 315 |  | 
| Pavel Emelyanov | d447ea2 | 2008-04-29 01:00:08 -0700 | [diff] [blame] | 316 | 	/* | 
| Paul Menage | db3b149 | 2008-07-25 01:46:58 -0700 | [diff] [blame] | 317 | 	 * write_string() is passed a nul-terminated kernelspace | 
 | 318 | 	 * buffer of maximum length determined by max_write_len. | 
 | 319 | 	 * Returns 0 or -ve error code. | 
 | 320 | 	 */ | 
 | 321 | 	int (*write_string)(struct cgroup *cgrp, struct cftype *cft, | 
 | 322 | 			    const char *buffer); | 
 | 323 | 	/* | 
| Pavel Emelyanov | d447ea2 | 2008-04-29 01:00:08 -0700 | [diff] [blame] | 324 | 	 * trigger() callback can be used to get some kick from the | 
 | 325 | 	 * userspace, when the actual string written is not important | 
 | 326 | 	 * at all. The private field can be used to determine the | 
 | 327 | 	 * kick type for multiplexing. | 
 | 328 | 	 */ | 
 | 329 | 	int (*trigger)(struct cgroup *cgrp, unsigned int event); | 
 | 330 |  | 
| Paul Menage | ce16b49 | 2008-07-25 01:46:57 -0700 | [diff] [blame] | 331 | 	int (*release)(struct inode *inode, struct file *file); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 332 | }; | 
 | 333 |  | 
| Cliff Wickman | 31a7df0 | 2008-02-07 00:14:42 -0800 | [diff] [blame] | 334 | struct cgroup_scanner { | 
 | 335 | 	struct cgroup *cg; | 
 | 336 | 	int (*test_task)(struct task_struct *p, struct cgroup_scanner *scan); | 
 | 337 | 	void (*process_task)(struct task_struct *p, | 
 | 338 | 			struct cgroup_scanner *scan); | 
 | 339 | 	struct ptr_heap *heap; | 
| Li Zefan | bd1a8ab | 2009-04-02 16:57:50 -0700 | [diff] [blame] | 340 | 	void *data; | 
| Cliff Wickman | 31a7df0 | 2008-02-07 00:14:42 -0800 | [diff] [blame] | 341 | }; | 
 | 342 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 343 | /* | 
 | 344 |  * Add a new file to the given cgroup directory. Should only be | 
 | 345 |  * called by subsystems from within a populate() method | 
 | 346 |  */ | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 347 | int cgroup_add_file(struct cgroup *cgrp, struct cgroup_subsys *subsys, | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 348 | 		       const struct cftype *cft); | 
 | 349 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 350 | /* | 
 | 351 |  * Add a set of new files to the given cgroup directory. Should | 
 | 352 |  * only be called by subsystems from within a populate() method | 
 | 353 |  */ | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 354 | int cgroup_add_files(struct cgroup *cgrp, | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 355 | 			struct cgroup_subsys *subsys, | 
 | 356 | 			const struct cftype cft[], | 
 | 357 | 			int count); | 
 | 358 |  | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 359 | int cgroup_is_removed(const struct cgroup *cgrp); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 360 |  | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 361 | int cgroup_path(const struct cgroup *cgrp, char *buf, int buflen); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 362 |  | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 363 | int cgroup_task_count(const struct cgroup *cgrp); | 
| Paul Menage | bbcb81d | 2007-10-18 23:39:32 -0700 | [diff] [blame] | 364 |  | 
| Grzegorz Nosek | 313e924 | 2009-04-02 16:57:23 -0700 | [diff] [blame] | 365 | /* Return true if cgrp is a descendant of the task's cgroup */ | 
 | 366 | int cgroup_is_descendant(const struct cgroup *cgrp, struct task_struct *task); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 367 |  | 
| Thadeu Lima de Souza Cascardo | 21acb9c | 2009-02-04 10:12:08 +0100 | [diff] [blame] | 368 | /* | 
 | 369 |  * Control Group subsystem type. | 
 | 370 |  * See Documentation/cgroups/cgroups.txt for details | 
 | 371 |  */ | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 372 |  | 
 | 373 | struct cgroup_subsys { | 
 | 374 | 	struct cgroup_subsys_state *(*create)(struct cgroup_subsys *ss, | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 375 | 						  struct cgroup *cgrp); | 
| KAMEZAWA Hiroyuki | ec64f51 | 2009-04-02 16:57:26 -0700 | [diff] [blame] | 376 | 	int (*pre_destroy)(struct cgroup_subsys *ss, struct cgroup *cgrp); | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 377 | 	void (*destroy)(struct cgroup_subsys *ss, struct cgroup *cgrp); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 378 | 	int (*can_attach)(struct cgroup_subsys *ss, | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 379 | 			  struct cgroup *cgrp, struct task_struct *tsk); | 
 | 380 | 	void (*attach)(struct cgroup_subsys *ss, struct cgroup *cgrp, | 
 | 381 | 			struct cgroup *old_cgrp, struct task_struct *tsk); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 382 | 	void (*fork)(struct cgroup_subsys *ss, struct task_struct *task); | 
 | 383 | 	void (*exit)(struct cgroup_subsys *ss, struct task_struct *task); | 
 | 384 | 	int (*populate)(struct cgroup_subsys *ss, | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 385 | 			struct cgroup *cgrp); | 
 | 386 | 	void (*post_clone)(struct cgroup_subsys *ss, struct cgroup *cgrp); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 387 | 	void (*bind)(struct cgroup_subsys *ss, struct cgroup *root); | 
| Hugh Dickins | e599137 | 2009-01-06 14:39:22 -0800 | [diff] [blame] | 388 |  | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 389 | 	int subsys_id; | 
 | 390 | 	int active; | 
| Paul Menage | 8bab8dd | 2008-04-04 14:29:57 -0700 | [diff] [blame] | 391 | 	int disabled; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 392 | 	int early_init; | 
| KAMEZAWA Hiroyuki | 38460b4 | 2009-04-02 16:57:25 -0700 | [diff] [blame] | 393 | 	/* | 
 | 394 | 	 * True if this subsys uses ID. ID is not available before cgroup_init() | 
 | 395 | 	 * (not available in early_init time.) | 
 | 396 | 	 */ | 
 | 397 | 	bool use_id; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 398 | #define MAX_CGROUP_TYPE_NAMELEN 32 | 
 | 399 | 	const char *name; | 
 | 400 |  | 
| Paul Menage | 999cd8a | 2009-01-07 18:08:36 -0800 | [diff] [blame] | 401 | 	/* | 
 | 402 | 	 * Protects sibling/children links of cgroups in this | 
 | 403 | 	 * hierarchy, plus protects which hierarchy (or none) the | 
 | 404 | 	 * subsystem is a part of (i.e. root/sibling).  To avoid | 
 | 405 | 	 * potential deadlocks, the following operations should not be | 
 | 406 | 	 * undertaken while holding any hierarchy_mutex: | 
 | 407 | 	 * | 
 | 408 | 	 * - allocating memory | 
 | 409 | 	 * - initiating hotplug events | 
 | 410 | 	 */ | 
 | 411 | 	struct mutex hierarchy_mutex; | 
| Li Zefan | cfebe56 | 2009-02-11 13:04:36 -0800 | [diff] [blame] | 412 | 	struct lock_class_key subsys_key; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 413 |  | 
| Paul Menage | 999cd8a | 2009-01-07 18:08:36 -0800 | [diff] [blame] | 414 | 	/* | 
 | 415 | 	 * Link to parent, and list entry in parent's children. | 
 | 416 | 	 * Protected by this->hierarchy_mutex and cgroup_lock() | 
 | 417 | 	 */ | 
 | 418 | 	struct cgroupfs_root *root; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 419 | 	struct list_head sibling; | 
| KAMEZAWA Hiroyuki | 38460b4 | 2009-04-02 16:57:25 -0700 | [diff] [blame] | 420 | 	/* used when use_id == true */ | 
 | 421 | 	struct idr idr; | 
 | 422 | 	spinlock_t id_lock; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 423 | }; | 
 | 424 |  | 
 | 425 | #define SUBSYS(_x) extern struct cgroup_subsys _x ## _subsys; | 
 | 426 | #include <linux/cgroup_subsys.h> | 
 | 427 | #undef SUBSYS | 
 | 428 |  | 
 | 429 | static inline struct cgroup_subsys_state *cgroup_subsys_state( | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 430 | 	struct cgroup *cgrp, int subsys_id) | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 431 | { | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 432 | 	return cgrp->subsys[subsys_id]; | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 433 | } | 
 | 434 |  | 
 | 435 | static inline struct cgroup_subsys_state *task_subsys_state( | 
 | 436 | 	struct task_struct *task, int subsys_id) | 
 | 437 | { | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 438 | 	return rcu_dereference(task->cgroups->subsys[subsys_id]); | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 439 | } | 
 | 440 |  | 
 | 441 | static inline struct cgroup* task_cgroup(struct task_struct *task, | 
 | 442 | 					       int subsys_id) | 
 | 443 | { | 
 | 444 | 	return task_subsys_state(task, subsys_id)->cgroup; | 
 | 445 | } | 
 | 446 |  | 
| Serge E. Hallyn | e885dcd | 2008-07-25 01:47:06 -0700 | [diff] [blame] | 447 | int cgroup_clone(struct task_struct *tsk, struct cgroup_subsys *ss, | 
 | 448 | 							char *nodename); | 
| Paul Menage | 697f416 | 2007-10-18 23:39:34 -0700 | [diff] [blame] | 449 |  | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 450 | /* A cgroup_iter should be treated as an opaque object */ | 
 | 451 | struct cgroup_iter { | 
 | 452 | 	struct list_head *cg_link; | 
 | 453 | 	struct list_head *task; | 
 | 454 | }; | 
 | 455 |  | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 456 | /* | 
 | 457 |  * To iterate across the tasks in a cgroup: | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 458 |  * | 
 | 459 |  * 1) call cgroup_iter_start to intialize an iterator | 
 | 460 |  * | 
 | 461 |  * 2) call cgroup_iter_next() to retrieve member tasks until it | 
 | 462 |  *    returns NULL or until you want to end the iteration | 
 | 463 |  * | 
 | 464 |  * 3) call cgroup_iter_end() to destroy the iterator. | 
| Cliff Wickman | 31a7df0 | 2008-02-07 00:14:42 -0800 | [diff] [blame] | 465 |  * | 
| Paul Menage | d20a390 | 2009-04-02 16:57:22 -0700 | [diff] [blame] | 466 |  * Or, call cgroup_scan_tasks() to iterate through every task in a | 
 | 467 |  * cgroup - cgroup_scan_tasks() holds the css_set_lock when calling | 
 | 468 |  * the test_task() callback, but not while calling the process_task() | 
 | 469 |  * callback. | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 470 |  */ | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 471 | void cgroup_iter_start(struct cgroup *cgrp, struct cgroup_iter *it); | 
 | 472 | struct task_struct *cgroup_iter_next(struct cgroup *cgrp, | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 473 | 					struct cgroup_iter *it); | 
| Li Zefan | ffd2d88 | 2008-02-23 15:24:09 -0800 | [diff] [blame] | 474 | void cgroup_iter_end(struct cgroup *cgrp, struct cgroup_iter *it); | 
| Cliff Wickman | 31a7df0 | 2008-02-07 00:14:42 -0800 | [diff] [blame] | 475 | int cgroup_scan_tasks(struct cgroup_scanner *scan); | 
| Cliff Wickman | 956db3c | 2008-02-07 00:14:43 -0800 | [diff] [blame] | 476 | int cgroup_attach_task(struct cgroup *, struct task_struct *); | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 477 |  | 
| KAMEZAWA Hiroyuki | 38460b4 | 2009-04-02 16:57:25 -0700 | [diff] [blame] | 478 | /* | 
 | 479 |  * CSS ID is ID for cgroup_subsys_state structs under subsys. This only works | 
 | 480 |  * if cgroup_subsys.use_id == true. It can be used for looking up and scanning. | 
 | 481 |  * CSS ID is assigned at cgroup allocation (create) automatically | 
 | 482 |  * and removed when subsys calls free_css_id() function. This is because | 
 | 483 |  * the lifetime of cgroup_subsys_state is subsys's matter. | 
 | 484 |  * | 
 | 485 |  * Looking up and scanning function should be called under rcu_read_lock(). | 
 | 486 |  * Taking cgroup_mutex()/hierarchy_mutex() is not necessary for following calls. | 
 | 487 |  * But the css returned by this routine can be "not populated yet" or "being | 
 | 488 |  * destroyed". The caller should check css and cgroup's status. | 
 | 489 |  */ | 
 | 490 |  | 
 | 491 | /* | 
 | 492 |  * Typically Called at ->destroy(), or somewhere the subsys frees | 
 | 493 |  * cgroup_subsys_state. | 
 | 494 |  */ | 
 | 495 | void free_css_id(struct cgroup_subsys *ss, struct cgroup_subsys_state *css); | 
 | 496 |  | 
 | 497 | /* Find a cgroup_subsys_state which has given ID */ | 
 | 498 |  | 
 | 499 | struct cgroup_subsys_state *css_lookup(struct cgroup_subsys *ss, int id); | 
 | 500 |  | 
 | 501 | /* | 
 | 502 |  * Get a cgroup whose id is greater than or equal to id under tree of root. | 
 | 503 |  * Returning a cgroup_subsys_state or NULL. | 
 | 504 |  */ | 
 | 505 | struct cgroup_subsys_state *css_get_next(struct cgroup_subsys *ss, int id, | 
 | 506 | 		struct cgroup_subsys_state *root, int *foundid); | 
 | 507 |  | 
 | 508 | /* Returns true if root is ancestor of cg */ | 
 | 509 | bool css_is_ancestor(struct cgroup_subsys_state *cg, | 
| KAMEZAWA Hiroyuki | 0b7f569 | 2009-04-02 16:57:38 -0700 | [diff] [blame] | 510 | 		     const struct cgroup_subsys_state *root); | 
| KAMEZAWA Hiroyuki | 38460b4 | 2009-04-02 16:57:25 -0700 | [diff] [blame] | 511 |  | 
 | 512 | /* Get id and depth of css */ | 
 | 513 | unsigned short css_id(struct cgroup_subsys_state *css); | 
 | 514 | unsigned short css_depth(struct cgroup_subsys_state *css); | 
 | 515 |  | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 516 | #else /* !CONFIG_CGROUPS */ | 
 | 517 |  | 
 | 518 | static inline int cgroup_init_early(void) { return 0; } | 
 | 519 | static inline int cgroup_init(void) { return 0; } | 
| Paul Menage | b4f48b6 | 2007-10-18 23:39:33 -0700 | [diff] [blame] | 520 | static inline void cgroup_fork(struct task_struct *p) {} | 
 | 521 | static inline void cgroup_fork_callbacks(struct task_struct *p) {} | 
| Paul Menage | 817929e | 2007-10-18 23:39:36 -0700 | [diff] [blame] | 522 | static inline void cgroup_post_fork(struct task_struct *p) {} | 
| Paul Menage | b4f48b6 | 2007-10-18 23:39:33 -0700 | [diff] [blame] | 523 | static inline void cgroup_exit(struct task_struct *p, int callbacks) {} | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 524 |  | 
 | 525 | static inline void cgroup_lock(void) {} | 
 | 526 | static inline void cgroup_unlock(void) {} | 
| Balbir Singh | 846c7bb | 2007-10-18 23:39:44 -0700 | [diff] [blame] | 527 | static inline int cgroupstats_build(struct cgroupstats *stats, | 
 | 528 | 					struct dentry *dentry) | 
 | 529 | { | 
 | 530 | 	return -EINVAL; | 
 | 531 | } | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 532 |  | 
 | 533 | #endif /* !CONFIG_CGROUPS */ | 
 | 534 |  | 
| Paul Menage | ddbcc7e | 2007-10-18 23:39:30 -0700 | [diff] [blame] | 535 | #endif /* _LINUX_CGROUP_H */ |