mirror of
https://github.com/torvalds/linux
synced 2024-11-05 18:23:50 +00:00
fork: report pid reservation failure properly
copy_process will report any failure in alloc_pid as ENOMEM currently which is misleading because the pid allocation might fail not only when the memory is short but also when the pid space is consumed already. The current man page even mentions this case: : EAGAIN : : A system-imposed limit on the number of threads was encountered. : There are a number of limits that may trigger this error: the : RLIMIT_NPROC soft resource limit (set via setrlimit(2)), which : limits the number of processes and threads for a real user ID, was : reached; the kernel's system-wide limit on the number of processes : and threads, /proc/sys/kernel/threads-max, was reached (see : proc(5)); or the maximum number of PIDs, /proc/sys/kernel/pid_max, : was reached (see proc(5)). So the current behavior is also incorrect with respect to the documentation. The POSIX man page also suggests returning EAGAIN when the process count limit is reached. This patch simply propagates the error code from alloc_pid and makes sure we return -EAGAIN due to reservation failure. This will make the behavior of fork closer to both our documentation and POSIX. alloc_pid might also fail when the reaper in the pid namespace is dead (the namespace basically disallows all new processes) and there is no good error code which would match the documented ones. We have traditionally returned ENOMEM for this case which is misleading as well but as per Eric W. Biederman this behavior is documented in man pid_namespaces(7) : If the "init" process of a PID namespace terminates, the kernel : terminates all of the processes in the namespace via a SIGKILL signal. : This behavior reflects the fact that the "init" process is essential for : the correct operation of a PID namespace. In this case, a subsequent : fork(2) into this PID namespace will fail with the error ENOMEM; it is : not possible to create a new processes in a PID namespace whose "init" : process has terminated. 
and introducing a new error code would be too risky so let's stick to ENOMEM for this case. Signed-off-by: Michal Hocko <mhocko@suse.cz> Cc: Oleg Nesterov <oleg@redhat.com> Cc: "Eric W. Biederman" <ebiederm@xmission.com> Cc: Michael Kerrisk <mtk.manpages@gmail.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
This commit is contained in:
parent
69828dce7a
commit
35f71bc0a0
2 changed files with 11 additions and 9 deletions
|
@ -1403,10 +1403,11 @@ static struct task_struct *copy_process(unsigned long clone_flags,
|
|||
goto bad_fork_cleanup_io;
|
||||
|
||||
if (pid != &init_struct_pid) {
|
||||
retval = -ENOMEM;
|
||||
pid = alloc_pid(p->nsproxy->pid_ns_for_children);
|
||||
if (!pid)
|
||||
if (IS_ERR(pid)) {
|
||||
retval = PTR_ERR(pid);
|
||||
goto bad_fork_cleanup_io;
|
||||
}
|
||||
}
|
||||
|
||||
p->set_child_tid = (clone_flags & CLONE_CHILD_SETTID) ? child_tidptr : NULL;
|
||||
|
|
15
kernel/pid.c
15
kernel/pid.c
|
@ -182,7 +182,7 @@ static int alloc_pidmap(struct pid_namespace *pid_ns)
|
|||
spin_unlock_irq(&pidmap_lock);
|
||||
kfree(page);
|
||||
if (unlikely(!map->page))
|
||||
break;
|
||||
return -ENOMEM;
|
||||
}
|
||||
if (likely(atomic_read(&map->nr_free))) {
|
||||
for ( ; ; ) {
|
||||
|
@ -210,7 +210,7 @@ static int alloc_pidmap(struct pid_namespace *pid_ns)
|
|||
}
|
||||
pid = mk_pid(pid_ns, map, offset);
|
||||
}
|
||||
return -1;
|
||||
return -EAGAIN;
|
||||
}
|
||||
|
||||
int next_pidmap(struct pid_namespace *pid_ns, unsigned int last)
|
||||
|
@ -301,17 +301,20 @@ struct pid *alloc_pid(struct pid_namespace *ns)
|
|||
int i, nr;
|
||||
struct pid_namespace *tmp;
|
||||
struct upid *upid;
|
||||
int retval = -ENOMEM;
|
||||
|
||||
pid = kmem_cache_alloc(ns->pid_cachep, GFP_KERNEL);
|
||||
if (!pid)
|
||||
goto out;
|
||||
return ERR_PTR(retval);
|
||||
|
||||
tmp = ns;
|
||||
pid->level = ns->level;
|
||||
for (i = ns->level; i >= 0; i--) {
|
||||
nr = alloc_pidmap(tmp);
|
||||
if (nr < 0)
|
||||
if (IS_ERR_VALUE(nr)) {
|
||||
retval = nr;
|
||||
goto out_free;
|
||||
}
|
||||
|
||||
pid->numbers[i].nr = nr;
|
||||
pid->numbers[i].ns = tmp;
|
||||
|
@ -339,7 +342,6 @@ struct pid *alloc_pid(struct pid_namespace *ns)
|
|||
}
|
||||
spin_unlock_irq(&pidmap_lock);
|
||||
|
||||
out:
|
||||
return pid;
|
||||
|
||||
out_unlock:
|
||||
|
@ -351,8 +353,7 @@ struct pid *alloc_pid(struct pid_namespace *ns)
|
|||
free_pidmap(pid->numbers + i);
|
||||
|
||||
kmem_cache_free(ns->pid_cachep, pid);
|
||||
pid = NULL;
|
||||
goto out;
|
||||
return ERR_PTR(retval);
|
||||
}
|
||||
|
||||
void disable_pid_allocation(struct pid_namespace *ns)
|
||||
|
|
Loading…
Reference in a new issue