Commit f400e198 authored by Sukadev Bhattiprolu's avatar Sukadev Bhattiprolu Committed by Linus Torvalds

[PATCH] pidspace: is_init()

This is an updated version of Eric Biederman's is_init() patch.
(http://lkml.org/lkml/2006/2/6/280).  It applies cleanly to 2.6.18-rc3 and
replaces a few more instances of ->pid == 1 with is_init().

Further, is_init() checks pid and thus removes dependency on Eric's other
patches for now.

Eric's original description:

	There are a lot of places in the kernel where we test for init
	because we give it special properties.  Most  significantly init
	must not die.  This results in code all over the kernel test
	->pid == 1.

	Introduce is_init to capture this case.

	With multiple pid spaces for all of the cases affected we are
	looking for only the first process on the system, not some other
	process that has pid == 1.
Signed-off-by: default avatarEric W. Biederman <ebiederm@xmission.com>
Signed-off-by: default avatarSukadev Bhattiprolu <sukadev@us.ibm.com>
Cc: Dave Hansen <haveblue@us.ibm.com>
Cc: Serge Hallyn <serue@us.ibm.com>
Cc: Cedric Le Goater <clg@fr.ibm.com>
Cc: <lxc-devel@lists.sourceforge.net>
Acked-by: default avatarPaul Mackerras <paulus@samba.org>
Signed-off-by: default avatarAndrew Morton <akpm@osdl.org>
Signed-off-by: default avatarLinus Torvalds <torvalds@osdl.org>
parent 959ed340
...@@ -193,7 +193,7 @@ do_page_fault(unsigned long address, unsigned long mmcsr, ...@@ -193,7 +193,7 @@ do_page_fault(unsigned long address, unsigned long mmcsr,
/* We ran out of memory, or some other thing happened to us that /* We ran out of memory, or some other thing happened to us that
made us unable to handle the page fault gracefully. */ made us unable to handle the page fault gracefully. */
out_of_memory: out_of_memory:
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -198,7 +198,7 @@ survive: ...@@ -198,7 +198,7 @@ survive:
return fault; return fault;
} }
if (tsk->pid != 1) if (!is_init(tsk))
goto out; goto out;
/* /*
......
...@@ -185,7 +185,7 @@ survive: ...@@ -185,7 +185,7 @@ survive:
} }
fault = -3; /* out of memory */ fault = -3; /* out of memory */
if (tsk->pid != 1) if (!is_init(tsk))
goto out; goto out;
/* /*
......
...@@ -739,7 +739,7 @@ survive: ...@@ -739,7 +739,7 @@ survive:
retval = get_user_pages(current, current->mm, retval = get_user_pages(current, current->mm,
(unsigned long )to, 1, 1, 0, &pg, NULL); (unsigned long )to, 1, 1, 0, &pg, NULL);
if (retval == -ENOMEM && current->pid == 1) { if (retval == -ENOMEM && is_init(current)) {
up_read(&current->mm->mmap_sem); up_read(&current->mm->mmap_sem);
blk_congestion_wait(WRITE, HZ/50); blk_congestion_wait(WRITE, HZ/50);
goto survive; goto survive;
......
...@@ -589,7 +589,7 @@ no_context: ...@@ -589,7 +589,7 @@ no_context:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (tsk->pid == 1) { if (is_init(tsk)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -280,7 +280,7 @@ ia64_do_page_fault (unsigned long address, unsigned long isr, struct pt_regs *re ...@@ -280,7 +280,7 @@ ia64_do_page_fault (unsigned long address, unsigned long isr, struct pt_regs *re
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -299,7 +299,7 @@ no_context: ...@@ -299,7 +299,7 @@ no_context:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (tsk->pid == 1) { if (is_init(tsk)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -181,7 +181,7 @@ good_area: ...@@ -181,7 +181,7 @@ good_area:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -171,7 +171,7 @@ no_context: ...@@ -171,7 +171,7 @@ no_context:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (tsk->pid == 1) { if (is_init(tsk)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -386,7 +386,7 @@ bad_area_nosemaphore: ...@@ -386,7 +386,7 @@ bad_area_nosemaphore:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -337,7 +337,7 @@ static int recover_mce(struct pt_regs *regs, struct rtas_error_log * err) ...@@ -337,7 +337,7 @@ static int recover_mce(struct pt_regs *regs, struct rtas_error_log * err)
err->disposition == RTAS_DISP_NOT_RECOVERED && err->disposition == RTAS_DISP_NOT_RECOVERED &&
err->target == RTAS_TARGET_MEMORY && err->target == RTAS_TARGET_MEMORY &&
err->type == RTAS_TYPE_ECC_UNCORR && err->type == RTAS_TYPE_ECC_UNCORR &&
!(current->pid == 0 || current->pid == 1)) { !(current->pid == 0 || is_init(current))) {
/* Kill off a user process with an ECC error */ /* Kill off a user process with an ECC error */
printk(KERN_ERR "MCE: uncorrectable ecc error for pid %d\n", printk(KERN_ERR "MCE: uncorrectable ecc error for pid %d\n",
current->pid); current->pid);
......
...@@ -119,7 +119,7 @@ void _exception(int signr, struct pt_regs *regs, int code, unsigned long addr) ...@@ -119,7 +119,7 @@ void _exception(int signr, struct pt_regs *regs, int code, unsigned long addr)
* generate the same exception over and over again and we get * generate the same exception over and over again and we get
* nowhere. Better to kill it and let the kernel panic. * nowhere. Better to kill it and let the kernel panic.
*/ */
if (current->pid == 1) { if (is_init(current)) {
__sighandler_t handler; __sighandler_t handler;
spin_lock_irq(&current->sighand->siglock); spin_lock_irq(&current->sighand->siglock);
......
...@@ -291,7 +291,7 @@ bad_area: ...@@ -291,7 +291,7 @@ bad_area:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -353,7 +353,7 @@ no_context: ...@@ -353,7 +353,7 @@ no_context:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (tsk->pid == 1) { if (is_init(tsk)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -149,7 +149,7 @@ no_context: ...@@ -149,7 +149,7 @@ no_context:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -277,7 +277,7 @@ bad_area: ...@@ -277,7 +277,7 @@ bad_area:
show_regs(regs); show_regs(regs);
#endif #endif
} }
if (tsk->pid == 1) { if (is_init(tsk)) {
panic("INIT had user mode bad_area\n"); panic("INIT had user mode bad_area\n");
} }
tsk->thread.address = address; tsk->thread.address = address;
...@@ -319,14 +319,14 @@ no_context: ...@@ -319,14 +319,14 @@ no_context:
* us unable to handle the page fault gracefully. * us unable to handle the page fault gracefully.
*/ */
out_of_memory: out_of_memory:
if (current->pid == 1) { if (is_init(current)) {
panic("INIT out of memory\n"); panic("INIT out of memory\n");
yield(); yield();
goto survive; goto survive;
} }
printk("fault:Out of memory\n"); printk("fault:Out of memory\n");
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -120,7 +120,7 @@ out_nosemaphore: ...@@ -120,7 +120,7 @@ out_nosemaphore:
* us unable to handle the page fault gracefully. * us unable to handle the page fault gracefully.
*/ */
out_of_memory: out_of_memory:
if (current->pid == 1) { if (is_init(current)) {
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
......
...@@ -244,7 +244,7 @@ static int is_errata93(struct pt_regs *regs, unsigned long address) ...@@ -244,7 +244,7 @@ static int is_errata93(struct pt_regs *regs, unsigned long address)
int unhandled_signal(struct task_struct *tsk, int sig) int unhandled_signal(struct task_struct *tsk, int sig)
{ {
if (tsk->pid == 1) if (is_init(tsk))
return 1; return 1;
if (tsk->ptrace & PT_PTRACED) if (tsk->ptrace & PT_PTRACED)
return 0; return 0;
...@@ -580,7 +580,7 @@ no_context: ...@@ -580,7 +580,7 @@ no_context:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
goto again; goto again;
} }
......
...@@ -144,7 +144,7 @@ bad_area: ...@@ -144,7 +144,7 @@ bad_area:
*/ */
out_of_memory: out_of_memory:
up_read(&mm->mmap_sem); up_read(&mm->mmap_sem);
if (current->pid == 1) { if (is_init(current)) {
yield(); yield();
down_read(&mm->mmap_sem); down_read(&mm->mmap_sem);
goto survive; goto survive;
......
...@@ -208,7 +208,7 @@ static void send_sig_all(int sig) ...@@ -208,7 +208,7 @@ static void send_sig_all(int sig)
struct task_struct *p; struct task_struct *p;
for_each_process(p) { for_each_process(p) {
if (p->mm && p->pid != 1) if (p->mm && !is_init(p))
/* Not swapper, init nor kernel thread */ /* Not swapper, init nor kernel thread */
force_sig(sig, p); force_sig(sig, p);
} }
......
...@@ -1033,6 +1033,16 @@ static inline int pid_alive(struct task_struct *p) ...@@ -1033,6 +1033,16 @@ static inline int pid_alive(struct task_struct *p)
return p->pids[PIDTYPE_PID].pid != NULL; return p->pids[PIDTYPE_PID].pid != NULL;
} }
/**
* is_init - check if a task structure is the first user space
* task the kernel created.
* @p: Task structure to be checked.
*/
static inline int is_init(struct task_struct *tsk)
{
return tsk->pid == 1;
}
extern void free_task(struct task_struct *tsk); extern void free_task(struct task_struct *tsk);
#define get_task_struct(tsk) do { atomic_inc(&(tsk)->usage); } while(0) #define get_task_struct(tsk) do { atomic_inc(&(tsk)->usage); } while(0)
......
...@@ -133,7 +133,7 @@ static inline int cap_set_all(kernel_cap_t *effective, ...@@ -133,7 +133,7 @@ static inline int cap_set_all(kernel_cap_t *effective,
int found = 0; int found = 0;
do_each_thread(g, target) { do_each_thread(g, target) {
if (target == current || target->pid == 1) if (target == current || is_init(target))
continue; continue;
found = 1; found = 1;
if (security_capset_check(target, effective, inheritable, if (security_capset_check(target, effective, inheritable,
......
...@@ -240,7 +240,7 @@ static struct super_block *cpuset_sb; ...@@ -240,7 +240,7 @@ static struct super_block *cpuset_sb;
* A cpuset can only be deleted if both its 'count' of using tasks * A cpuset can only be deleted if both its 'count' of using tasks
* is zero, and its list of 'children' cpusets is empty. Since all * is zero, and its list of 'children' cpusets is empty. Since all
* tasks in the system use _some_ cpuset, and since there is always at * tasks in the system use _some_ cpuset, and since there is always at
* least one task in the system (init, pid == 1), therefore, top_cpuset * least one task in the system (init), therefore, top_cpuset
* always has either children cpusets and/or using tasks. So we don't * always has either children cpusets and/or using tasks. So we don't
* need a special hack to ensure that top_cpuset cannot be deleted. * need a special hack to ensure that top_cpuset cannot be deleted.
* *
......
...@@ -219,7 +219,7 @@ static int will_become_orphaned_pgrp(int pgrp, struct task_struct *ignored_task) ...@@ -219,7 +219,7 @@ static int will_become_orphaned_pgrp(int pgrp, struct task_struct *ignored_task)
do_each_task_pid(pgrp, PIDTYPE_PGID, p) { do_each_task_pid(pgrp, PIDTYPE_PGID, p) {
if (p == ignored_task if (p == ignored_task
|| p->exit_state || p->exit_state
|| p->real_parent->pid == 1) || is_init(p->real_parent))
continue; continue;
if (process_group(p->real_parent) != pgrp if (process_group(p->real_parent) != pgrp
&& p->real_parent->signal->session == p->signal->session) { && p->real_parent->signal->session == p->signal->session) {
......
...@@ -40,7 +40,7 @@ struct resource crashk_res = { ...@@ -40,7 +40,7 @@ struct resource crashk_res = {
int kexec_should_crash(struct task_struct *p) int kexec_should_crash(struct task_struct *p)
{ {
if (in_interrupt() || !p->pid || p->pid == 1 || panic_on_oops) if (in_interrupt() || !p->pid || is_init(p) || panic_on_oops)
return 1; return 1;
return 0; return 0;
} }
......
...@@ -440,6 +440,7 @@ struct task_struct *ptrace_get_task_struct(pid_t pid) ...@@ -440,6 +440,7 @@ struct task_struct *ptrace_get_task_struct(pid_t pid)
child = find_task_by_pid(pid); child = find_task_by_pid(pid);
if (child) if (child)
get_task_struct(child); get_task_struct(child);
read_unlock(&tasklist_lock); read_unlock(&tasklist_lock);
if (!child) if (!child)
return ERR_PTR(-ESRCH); return ERR_PTR(-ESRCH);
......
...@@ -1915,7 +1915,7 @@ int proc_dointvec_bset(ctl_table *table, int write, struct file *filp, ...@@ -1915,7 +1915,7 @@ int proc_dointvec_bset(ctl_table *table, int write, struct file *filp,
return -EPERM; return -EPERM;
} }
op = (current->pid == 1) ? OP_SET : OP_AND; op = is_init(current) ? OP_SET : OP_AND;
return do_proc_dointvec(table,write,filp,buffer,lenp,ppos, return do_proc_dointvec(table,write,filp,buffer,lenp,ppos,
do_proc_dointvec_bset_conv,&op); do_proc_dointvec_bset_conv,&op);
} }
......
...@@ -255,7 +255,7 @@ static struct task_struct *select_bad_process(unsigned long *ppoints) ...@@ -255,7 +255,7 @@ static struct task_struct *select_bad_process(unsigned long *ppoints)
*/ */
static void __oom_kill_task(struct task_struct *p, const char *message) static void __oom_kill_task(struct task_struct *p, const char *message)
{ {
if (p->pid == 1) { if (is_init(p)) {
WARN_ON(1); WARN_ON(1);
printk(KERN_WARNING "tried to kill init!\n"); printk(KERN_WARNING "tried to kill init!\n");
return; return;
......
...@@ -169,7 +169,7 @@ void cap_bprm_apply_creds (struct linux_binprm *bprm, int unsafe) ...@@ -169,7 +169,7 @@ void cap_bprm_apply_creds (struct linux_binprm *bprm, int unsafe)
/* For init, we want to retain the capabilities set /* For init, we want to retain the capabilities set
* in the init_task struct. Thus we skip the usual * in the init_task struct. Thus we skip the usual
* capability rules */ * capability rules */
if (current->pid != 1) { if (!is_init(current)) {
current->cap_permitted = new_permitted; current->cap_permitted = new_permitted;
current->cap_effective = current->cap_effective =
cap_intersect (new_permitted, bprm->cap_effective); cap_intersect (new_permitted, bprm->cap_effective);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment