| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* Kernel thread helper functions. | 
|  | 2 | *   Copyright (C) 2004 IBM Corporation, Rusty Russell. | 
|  | 3 | * | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 4 | * Creation is done via kthreadd, so that we get a clean environment | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 5 | * even if we're invoked from userspace (think modprobe, hotplug cpu, | 
|  | 6 | * etc.). | 
|  | 7 | */ | 
|  | 8 | #include <linux/sched.h> | 
|  | 9 | #include <linux/kthread.h> | 
|  | 10 | #include <linux/completion.h> | 
|  | 11 | #include <linux/err.h> | 
|  | 12 | #include <linux/unistd.h> | 
|  | 13 | #include <linux/file.h> | 
|  | 14 | #include <linux/module.h> | 
| Arjan van de Ven | 97d1f15 | 2006-03-23 03:00:24 -0800 | [diff] [blame] | 15 | #include <linux/mutex.h> | 
| Mathieu Desnoyers | 0a16b60 | 2008-07-18 12:16:17 -0400 | [diff] [blame] | 16 | #include <trace/sched.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 17 |  | 
/* Nice level applied to kthreadd itself and to every thread it spawns. */
#define KTHREAD_NICE_LEVEL (-5)

/*
 * Queue of pending creation requests.  kthread_create() appends to it,
 * kthreadd() removes entries; both do so under kthread_create_lock.
 */
static DEFINE_SPINLOCK(kthread_create_lock);
static LIST_HEAD(kthread_create_list);

/*
 * Task that kthread_create() wakes after queueing a request.  It is not
 * assigned anywhere in this file.
 */
struct task_struct *kthreadd_task;

/* Tracepoints fired by kthread_stop() on entry and just before it returns. */
DEFINE_TRACE(sched_kthread_stop);
DEFINE_TRACE(sched_kthread_stop_ret);
|  | 26 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 27 | struct kthread_create_info | 
|  | 28 | { | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 29 | /* Information passed to kthread() from kthreadd. */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 30 | int (*threadfn)(void *data); | 
|  | 31 | void *data; | 
|  | 32 | struct completion started; | 
|  | 33 |  | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 34 | /* Result passed back to kthread_create() from kthreadd. */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 | struct task_struct *result; | 
|  | 36 | struct completion done; | 
| David Howells | 65f27f3 | 2006-11-22 14:55:48 +0000 | [diff] [blame] | 37 |  | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 38 | struct list_head list; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 39 | }; | 
|  | 40 |  | 
|  | 41 | struct kthread_stop_info | 
|  | 42 | { | 
|  | 43 | struct task_struct *k; | 
|  | 44 | int err; | 
|  | 45 | struct completion done; | 
|  | 46 | }; | 
|  | 47 |  | 
|  | 48 | /* Thread stopping is done by setthing this var: lock serializes | 
|  | 49 | * multiple kthread_stop calls. */ | 
| Arjan van de Ven | 97d1f15 | 2006-03-23 03:00:24 -0800 | [diff] [blame] | 50 | static DEFINE_MUTEX(kthread_stop_lock); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 51 | static struct kthread_stop_info kthread_stop_info; | 
|  | 52 |  | 
| Randy Dunlap | 9e37bd3 | 2006-06-25 05:49:19 -0700 | [diff] [blame] | 53 | /** | 
|  | 54 | * kthread_should_stop - should this kthread return now? | 
|  | 55 | * | 
| Robert P. J. Day | 72fd4a3 | 2007-02-10 01:45:59 -0800 | [diff] [blame] | 56 | * When someone calls kthread_stop() on your kthread, it will be woken | 
| Randy Dunlap | 9e37bd3 | 2006-06-25 05:49:19 -0700 | [diff] [blame] | 57 | * and this will return true.  You should then return, and your return | 
|  | 58 | * value will be passed through to kthread_stop(). | 
|  | 59 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 60 | int kthread_should_stop(void) | 
|  | 61 | { | 
|  | 62 | return (kthread_stop_info.k == current); | 
|  | 63 | } | 
|  | 64 | EXPORT_SYMBOL(kthread_should_stop); | 
|  | 65 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 66 | static int kthread(void *_create) | 
|  | 67 | { | 
|  | 68 | struct kthread_create_info *create = _create; | 
|  | 69 | int (*threadfn)(void *data); | 
|  | 70 | void *data; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 71 | int ret = -EINTR; | 
|  | 72 |  | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 73 | /* Copy data: it's on kthread's stack */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 74 | threadfn = create->threadfn; | 
|  | 75 | data = create->data; | 
|  | 76 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 77 | /* OK, tell user we're spawned, wait for stop or wakeup */ | 
| Oleg Nesterov | a076e4b | 2007-05-23 13:57:27 -0700 | [diff] [blame] | 78 | __set_current_state(TASK_UNINTERRUPTIBLE); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 79 | complete(&create->started); | 
|  | 80 | schedule(); | 
|  | 81 |  | 
|  | 82 | if (!kthread_should_stop()) | 
|  | 83 | ret = threadfn(data); | 
|  | 84 |  | 
|  | 85 | /* It might have exited on its own, w/o kthread_stop.  Check. */ | 
|  | 86 | if (kthread_should_stop()) { | 
|  | 87 | kthread_stop_info.err = ret; | 
|  | 88 | complete(&kthread_stop_info.done); | 
|  | 89 | } | 
|  | 90 | return 0; | 
|  | 91 | } | 
|  | 92 |  | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 93 | static void create_kthread(struct kthread_create_info *create) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 94 | { | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 95 | int pid; | 
|  | 96 |  | 
|  | 97 | /* We want our own signal handler (we take no signals by default). */ | 
|  | 98 | pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD); | 
|  | 99 | if (pid < 0) { | 
|  | 100 | create->result = ERR_PTR(pid); | 
|  | 101 | } else { | 
| Michal Schmidt | 4f05b98 | 2008-01-25 21:08:33 +0100 | [diff] [blame] | 102 | struct sched_param param = { .sched_priority = 0 }; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 103 | wait_for_completion(&create->started); | 
| Andrew Morton | 05eeae2 | 2006-03-25 03:07:48 -0800 | [diff] [blame] | 104 | read_lock(&tasklist_lock); | 
| Pavel Emelyanov | 5cd2045 | 2008-04-30 00:54:24 -0700 | [diff] [blame] | 105 | create->result = find_task_by_pid_ns(pid, &init_pid_ns); | 
| Andrew Morton | 05eeae2 | 2006-03-25 03:07:48 -0800 | [diff] [blame] | 106 | read_unlock(&tasklist_lock); | 
| Michal Schmidt | 4f05b98 | 2008-01-25 21:08:33 +0100 | [diff] [blame] | 107 | /* | 
|  | 108 | * root may have changed our (kthreadd's) priority or CPU mask. | 
|  | 109 | * The kernel thread should not inherit these properties. | 
|  | 110 | */ | 
|  | 111 | sched_setscheduler(create->result, SCHED_NORMAL, ¶m); | 
|  | 112 | set_user_nice(create->result, KTHREAD_NICE_LEVEL); | 
| Rusty Russell | 1a2142a | 2009-03-30 22:05:10 -0600 | [diff] [blame] | 113 | set_cpus_allowed_ptr(create->result, cpu_all_mask); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 114 | } | 
|  | 115 | complete(&create->done); | 
|  | 116 | } | 
|  | 117 |  | 
| Randy Dunlap | 9e37bd3 | 2006-06-25 05:49:19 -0700 | [diff] [blame] | 118 | /** | 
|  | 119 | * kthread_create - create a kthread. | 
|  | 120 | * @threadfn: the function to run until signal_pending(current). | 
|  | 121 | * @data: data ptr for @threadfn. | 
|  | 122 | * @namefmt: printf-style name for the thread. | 
|  | 123 | * | 
|  | 124 | * Description: This helper function creates and names a kernel | 
|  | 125 | * thread.  The thread will be stopped: use wake_up_process() to start | 
|  | 126 | * it.  See also kthread_run(), kthread_create_on_cpu(). | 
|  | 127 | * | 
|  | 128 | * When woken, the thread will run @threadfn() with @data as its | 
| Robert P. J. Day | 72fd4a3 | 2007-02-10 01:45:59 -0800 | [diff] [blame] | 129 | * argument. @threadfn() can either call do_exit() directly if it is a | 
| Randy Dunlap | 9e37bd3 | 2006-06-25 05:49:19 -0700 | [diff] [blame] | 130 | * standalone thread for which noone will call kthread_stop(), or | 
|  | 131 | * return when 'kthread_should_stop()' is true (which means | 
|  | 132 | * kthread_stop() has been called).  The return value should be zero | 
|  | 133 | * or a negative error number; it will be passed to kthread_stop(). | 
|  | 134 | * | 
|  | 135 | * Returns a task_struct or ERR_PTR(-ENOMEM). | 
|  | 136 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 137 | struct task_struct *kthread_create(int (*threadfn)(void *data), | 
|  | 138 | void *data, | 
|  | 139 | const char namefmt[], | 
|  | 140 | ...) | 
|  | 141 | { | 
|  | 142 | struct kthread_create_info create; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 143 |  | 
|  | 144 | create.threadfn = threadfn; | 
|  | 145 | create.data = data; | 
|  | 146 | init_completion(&create.started); | 
|  | 147 | init_completion(&create.done); | 
|  | 148 |  | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 149 | spin_lock(&kthread_create_lock); | 
|  | 150 | list_add_tail(&create.list, &kthread_create_list); | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 151 | spin_unlock(&kthread_create_lock); | 
|  | 152 |  | 
| Dmitry Adamushko | cbd9b67 | 2008-04-29 00:59:23 -0700 | [diff] [blame] | 153 | wake_up_process(kthreadd_task); | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 154 | wait_for_completion(&create.done); | 
|  | 155 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 156 | if (!IS_ERR(create.result)) { | 
|  | 157 | va_list args; | 
|  | 158 | va_start(args, namefmt); | 
|  | 159 | vsnprintf(create.result->comm, sizeof(create.result->comm), | 
|  | 160 | namefmt, args); | 
|  | 161 | va_end(args); | 
|  | 162 | } | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 163 | return create.result; | 
|  | 164 | } | 
|  | 165 | EXPORT_SYMBOL(kthread_create); | 
|  | 166 |  | 
| Randy Dunlap | 9e37bd3 | 2006-06-25 05:49:19 -0700 | [diff] [blame] | 167 | /** | 
|  | 168 | * kthread_bind - bind a just-created kthread to a cpu. | 
|  | 169 | * @k: thread created by kthread_create(). | 
|  | 170 | * @cpu: cpu (might not be online, must be possible) for @k to run on. | 
|  | 171 | * | 
|  | 172 | * Description: This function is equivalent to set_cpus_allowed(), | 
|  | 173 | * except that @cpu doesn't need to be online, and the thread must be | 
| Robert P. J. Day | 72fd4a3 | 2007-02-10 01:45:59 -0800 | [diff] [blame] | 174 | * stopped (i.e., just returned from kthread_create()). | 
| Randy Dunlap | 9e37bd3 | 2006-06-25 05:49:19 -0700 | [diff] [blame] | 175 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 176 | void kthread_bind(struct task_struct *k, unsigned int cpu) | 
|  | 177 | { | 
| Oleg Nesterov | 293adee | 2008-10-18 20:28:24 -0700 | [diff] [blame] | 178 | /* Must have done schedule() in kthread() before we set_task_cpu */ | 
|  | 179 | if (!wait_task_inactive(k, TASK_UNINTERRUPTIBLE)) { | 
| Oleg Nesterov | a076e4b | 2007-05-23 13:57:27 -0700 | [diff] [blame] | 180 | WARN_ON(1); | 
|  | 181 | return; | 
|  | 182 | } | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 183 | set_task_cpu(k, cpu); | 
|  | 184 | k->cpus_allowed = cpumask_of_cpu(cpu); | 
| Gregory Haskins | 9f0e738 | 2008-02-12 13:30:05 -0500 | [diff] [blame] | 185 | k->rt.nr_cpus_allowed = 1; | 
| David Rientjes | 9985b0b | 2008-06-05 12:57:11 -0700 | [diff] [blame] | 186 | k->flags |= PF_THREAD_BOUND; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 187 | } | 
|  | 188 | EXPORT_SYMBOL(kthread_bind); | 
|  | 189 |  | 
| Randy Dunlap | 9e37bd3 | 2006-06-25 05:49:19 -0700 | [diff] [blame] | 190 | /** | 
|  | 191 | * kthread_stop - stop a thread created by kthread_create(). | 
|  | 192 | * @k: thread created by kthread_create(). | 
|  | 193 | * | 
|  | 194 | * Sets kthread_should_stop() for @k to return true, wakes it, and | 
|  | 195 | * waits for it to exit.  Your threadfn() must not call do_exit() | 
|  | 196 | * itself if you use this function!  This can also be called after | 
|  | 197 | * kthread_create() instead of calling wake_up_process(): the thread | 
|  | 198 | * will exit without calling threadfn(). | 
|  | 199 | * | 
|  | 200 | * Returns the result of threadfn(), or %-EINTR if wake_up_process() | 
|  | 201 | * was never called. | 
|  | 202 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 203 | int kthread_stop(struct task_struct *k) | 
|  | 204 | { | 
|  | 205 | int ret; | 
|  | 206 |  | 
| Arjan van de Ven | 97d1f15 | 2006-03-23 03:00:24 -0800 | [diff] [blame] | 207 | mutex_lock(&kthread_stop_lock); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 208 |  | 
|  | 209 | /* It could exit after stop_info.k set, but before wake_up_process. */ | 
|  | 210 | get_task_struct(k); | 
|  | 211 |  | 
| Mathieu Desnoyers | 0a16b60 | 2008-07-18 12:16:17 -0400 | [diff] [blame] | 212 | trace_sched_kthread_stop(k); | 
|  | 213 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 214 | /* Must init completion *before* thread sees kthread_stop_info.k */ | 
|  | 215 | init_completion(&kthread_stop_info.done); | 
| akpm@osdl.org | d59dd46 | 2005-05-01 08:58:47 -0700 | [diff] [blame] | 216 | smp_wmb(); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 217 |  | 
|  | 218 | /* Now set kthread_should_stop() to true, and wake it up. */ | 
|  | 219 | kthread_stop_info.k = k; | 
| Adrian Bunk | 52e92e5 | 2006-07-14 00:24:05 -0700 | [diff] [blame] | 220 | wake_up_process(k); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 221 | put_task_struct(k); | 
|  | 222 |  | 
|  | 223 | /* Once it dies, reset stop ptr, gather result and we're done. */ | 
|  | 224 | wait_for_completion(&kthread_stop_info.done); | 
|  | 225 | kthread_stop_info.k = NULL; | 
|  | 226 | ret = kthread_stop_info.err; | 
| Arjan van de Ven | 97d1f15 | 2006-03-23 03:00:24 -0800 | [diff] [blame] | 227 | mutex_unlock(&kthread_stop_lock); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 228 |  | 
| Mathieu Desnoyers | 0a16b60 | 2008-07-18 12:16:17 -0400 | [diff] [blame] | 229 | trace_sched_kthread_stop_ret(ret); | 
|  | 230 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 231 | return ret; | 
|  | 232 | } | 
| Adrian Bunk | 52e92e5 | 2006-07-14 00:24:05 -0700 | [diff] [blame] | 233 | EXPORT_SYMBOL(kthread_stop); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 234 |  | 
| Satyam Sharma | e804a4a | 2007-07-31 00:39:16 -0700 | [diff] [blame] | 235 | int kthreadd(void *unused) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 236 | { | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 237 | struct task_struct *tsk = current; | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 238 |  | 
| Satyam Sharma | e804a4a | 2007-07-31 00:39:16 -0700 | [diff] [blame] | 239 | /* Setup a clean context for our children to inherit. */ | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 240 | set_task_comm(tsk, "kthreadd"); | 
| Oleg Nesterov | 10ab825 | 2007-05-09 02:34:37 -0700 | [diff] [blame] | 241 | ignore_signals(tsk); | 
| Michal Schmidt | 4f05b98 | 2008-01-25 21:08:33 +0100 | [diff] [blame] | 242 | set_user_nice(tsk, KTHREAD_NICE_LEVEL); | 
| Rusty Russell | 1a2142a | 2009-03-30 22:05:10 -0600 | [diff] [blame] | 243 | set_cpus_allowed_ptr(tsk, cpu_all_mask); | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 244 |  | 
| Rafael J. Wysocki | ebb12db | 2008-06-11 22:04:29 +0200 | [diff] [blame] | 245 | current->flags |= PF_NOFREEZE | PF_FREEZER_NOSIG; | 
| Eric W. Biederman | 73c2799 | 2007-05-09 02:34:32 -0700 | [diff] [blame] | 246 |  | 
|  | 247 | for (;;) { | 
|  | 248 | set_current_state(TASK_INTERRUPTIBLE); | 
|  | 249 | if (list_empty(&kthread_create_list)) | 
|  | 250 | schedule(); | 
|  | 251 | __set_current_state(TASK_RUNNING); | 
|  | 252 |  | 
|  | 253 | spin_lock(&kthread_create_lock); | 
|  | 254 | while (!list_empty(&kthread_create_list)) { | 
|  | 255 | struct kthread_create_info *create; | 
|  | 256 |  | 
|  | 257 | create = list_entry(kthread_create_list.next, | 
|  | 258 | struct kthread_create_info, list); | 
|  | 259 | list_del_init(&create->list); | 
|  | 260 | spin_unlock(&kthread_create_lock); | 
|  | 261 |  | 
|  | 262 | create_kthread(create); | 
|  | 263 |  | 
|  | 264 | spin_lock(&kthread_create_lock); | 
|  | 265 | } | 
|  | 266 | spin_unlock(&kthread_create_lock); | 
|  | 267 | } | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 268 |  | 
|  | 269 | return 0; | 
|  | 270 | } |