Merge tag 'vfs-6.16-rc1.pidfs' of git://git.kernel.org/pub/scm/linux/kernel/git/vfs/vfs (7d7a103d) · Commits · git / linux-net

fs/coredump.c

+59 −6

Original line number	Diff line number	Diff line
		@@ -43,6 +43,8 @@
		#include <linux/timekeeping.h>
		#include <linux/sysctl.h>
		#include <linux/elf.h>
		#include <linux/pidfs.h>
		#include <uapi/linux/pidfd.h>

		#include <linux/uaccess.h>
		#include <asm/mmu_context.h>
		@@ -60,6 +62,12 @@ static void free_vma_snapshot(struct coredump_params *cprm);
		/* Default for the core file note size limit (4 * 1024 * 1024). */
		#define CORE_FILE_NOTE_SIZE_DEFAULT (4*1024*1024)
		/* Define a reasonable max cap */
		#define CORE_FILE_NOTE_SIZE_MAX (16*1024*1024)
		/*
		 * File descriptor number for the pidfd for the thread-group leader of
		 * the coredumping task installed into the usermode helper's file
		 * descriptor table.
		 */
		#define COREDUMP_PIDFD_NUMBER 3

		static int core_uses_pid;
		static unsigned int core_pipe_limit;
		@@ -339,6 +347,27 @@ static int format_corename(struct core_name *cn, struct coredump_params *cprm,
		case 'C':
		err = cn_printf(cn, "%d", cprm->cpu);
		break;
		/* pidfd number */
		case 'F': {
		/*
		* Installing a pidfd only makes sense if
		* we actually spawn a usermode helper.
		*/
		if (!ispipe)
		break;

		/*
		* Note that we'll install a pidfd for the
		* thread-group leader. We know that task
		* linkage hasn't been removed yet and even if
		* this @current isn't the actual thread-group
		* leader we know that the thread-group leader
		* cannot be reaped until @current has exited.
		*/
		cprm->pid = task_tgid(current);
		err = cn_printf(cn, "%d", COREDUMP_PIDFD_NUMBER);
		break;
		}
		default:
		break;
		}
		@@ -493,7 +522,7 @@ static void wait_for_dump_helpers(struct file *file)
		}

		/*
		* umh_pipe_setup
		* umh_coredump_setup
		* helper function to customize the process used
		* to collect the core in userspace. Specifically
		* it sets up a pipe and installs it as fd 0 (stdin)
		@@ -503,11 +532,32 @@ static void wait_for_dump_helpers(struct file *file)
		* is a special value that we use to trap recursive
		* core dumps
		*/
		static int umh_pipe_setup(struct subprocess_info *info, struct cred *new)
		static int umh_coredump_setup(struct subprocess_info *info, struct cred *new)
		{
		struct file *files[2];
		struct coredump_params *cp = (struct coredump_params *)info->data;
		int err = create_pipe_files(files, 0);
		int err;

		if (cp->pid) {
		struct file *pidfs_file __free(fput) = NULL;

		pidfs_file = pidfs_alloc_file(cp->pid, 0);
		if (IS_ERR(pidfs_file))
		return PTR_ERR(pidfs_file);

		/*
		* Usermode helpers are children of either
		* system_unbound_wq or of kthreadd. So we know that
		* we're starting off with a clean file descriptor
		* table. So we should always be able to use
		* COREDUMP_PIDFD_NUMBER as our file descriptor value.
		*/
		err = replace_fd(COREDUMP_PIDFD_NUMBER, pidfs_file, 0);
		if (err < 0)
		return err;
		}

		err = create_pipe_files(files, 0);
		if (err)
		return err;

		@@ -515,10 +565,13 @@ static int umh_pipe_setup(struct subprocess_info *info, struct cred *new)

		err = replace_fd(0, files[0], 0);
		fput(files[0]);
		if (err < 0)
		return err;

		/* and disallow core files too */
		current->signal->rlim[RLIMIT_CORE] = (struct rlimit){1, 1};

		return err;
		return 0;
		}

		void do_coredump(const kernel_siginfo_t *siginfo)
		@@ -593,7 +646,7 @@ void do_coredump(const kernel_siginfo_t *siginfo)
		}

		if (cprm.limit == 1) {
		/* See umh_pipe_setup() which sets RLIMIT_CORE = 1.
		/* See umh_coredump_setup() which sets RLIMIT_CORE = 1.
		*
		* Normally core limits are irrelevant to pipes, since
		* we're not writing to the file system, but we use
		@@ -632,7 +685,7 @@ void do_coredump(const kernel_siginfo_t *siginfo)
		retval = -ENOMEM;
		sub_info = call_usermodehelper_setup(helper_argv[0],
		helper_argv, NULL, GFP_KERNEL,
		umh_pipe_setup, NULL, &cprm);
		umh_coredump_setup, NULL, &cprm);
		if (sub_info)
		retval = call_usermodehelper_exec(sub_info,
		UMH_WAIT_EXEC);

fs/pidfs.c

+73 −9

Original line number	Diff line number	Diff line
		@@ -746,7 +746,7 @@ static inline bool pidfs_pid_valid(struct pid *pid, const struct path *path,
		{
		enum pid_type type;

		if (flags & PIDFD_CLONE)
		if (flags & PIDFD_STALE)
		return true;

		/*
		@@ -755,10 +755,14 @@ static inline bool pidfs_pid_valid(struct pid *pid, const struct path *path,
		* pidfd has been allocated perform another check that the pid
		* is still alive. If it is exit information is available even
		* if the task gets reaped before the pidfd is returned to
		* userspace. The only exception is PIDFD_CLONE where no task
		* linkage has been established for @pid yet and the kernel is
		* in the middle of process creation so there's nothing for
		* pidfs to miss.
		* userspace. The only exceptions are indicated by PIDFD_STALE:
		*
		* (1) The kernel is in the middle of task creation and thus no
		* task linkage has been established yet.
		* (2) The caller knows @pid has been registered in pidfs at a
		* time when the task was still alive.
		*
		* In both cases exit information will have been reported.
		*/
		if (flags & PIDFD_THREAD)
		type = PIDTYPE_PID;
		@@ -852,11 +856,11 @@ struct file *pidfs_alloc_file(struct pid *pid, unsigned int flags)
		int ret;

		/*
		* Ensure that PIDFD_CLONE can be passed as a flag without
		* Ensure that PIDFD_STALE can be passed as a flag without
		* overloading other uapi pidfd flags.
		*/
		BUILD_BUG_ON(PIDFD_CLONE == PIDFD_THREAD);
		BUILD_BUG_ON(PIDFD_CLONE == PIDFD_NONBLOCK);
		BUILD_BUG_ON(PIDFD_STALE == PIDFD_THREAD);
		BUILD_BUG_ON(PIDFD_STALE == PIDFD_NONBLOCK);

		ret = path_from_stashed(&pid->stashed, pidfs_mnt, get_pid(pid), &path);
		if (ret < 0)
		@@ -865,7 +869,8 @@ struct file *pidfs_alloc_file(struct pid *pid, unsigned int flags)
		if (!pidfs_pid_valid(pid, &path, flags))
		return ERR_PTR(-ESRCH);

		flags &= ~PIDFD_CLONE;
		flags &= ~PIDFD_STALE;
		flags |= O_RDWR;
		pidfd_file = dentry_open(&path, flags, current_cred());
		/* Raise PIDFD_THREAD explicitly as do_dentry_open() strips it. */
		if (!IS_ERR(pidfd_file))
		@@ -874,6 +879,65 @@ struct file *pidfs_alloc_file(struct pid *pid, unsigned int flags)
		return pidfd_file;
		}

		/**
		 * pidfs_register_pid - register a struct pid in pidfs
		 * @pid: pid to pin; a NULL @pid is accepted and treated as success
		 *
		 * Register a struct pid in pidfs. Needs to be paired with
		 * pidfs_put_pid() to not risk leaking the pidfs dentry and inode.
		 *
		 * Annotated with might_sleep(), so it must not be called from a
		 * context that cannot sleep.
		 *
		 * Return: On success (or when @pid is NULL) zero, on error the
		 * negative error code from path_from_stashed() is returned.
		 */
		int pidfs_register_pid(struct pid *pid)
		{
		/* path_put is run on @path automatically when it goes out of scope. */
		struct path path __free(path_put) = {};
		int ret;

		might_sleep();

		if (!pid)
		return 0;

		ret = path_from_stashed(&pid->stashed, pidfs_mnt, get_pid(pid), &path);
		if (unlikely(ret))
		return ret;
		/*
		 * Keep the dentry and only put the reference to the mount: the
		 * dentry pointer is cleared before the scope-exit cleanup runs.
		 */
		path.dentry = NULL;
		return 0;
		}

		/**
		 * pidfs_get_pid - pin a struct pid through pidfs
		 * @pid: pid to pin, may be NULL
		 *
		 * Counterpart to pidfs_register_pid() that is only valid when the
		 * caller already knows @pid is referenced through a dentry that
		 * cannot go away. A NULL @pid is ignored. Warns once if
		 * stashed_dentry_get() does not hand back a dentry.
		 */
		void pidfs_get_pid(struct pid *pid)
		{
			if (pid) {
				WARN_ON_ONCE(!stashed_dentry_get(&pid->stashed));
			}
		}

		/**
		 * pidfs_put_pid - drop a pidfs reference
		 * @pid: pid to drop, may be NULL
		 *
		 * Drops the reference to @pid held via its stashed pidfs dentry.
		 * This is only safe if the reference has been taken via
		 * pidfs_get_pid(). Annotated with might_sleep(); a NULL @pid is
		 * ignored after that annotation.
		 */
		void pidfs_put_pid(struct pid *pid)
		{
			might_sleep();

			if (pid) {
				/* A missing stashed dentry here indicates unbalanced use. */
				VFS_WARN_ON_ONCE(!pid->stashed);
				dput(pid->stashed);
			}
		}

		static void pidfs_inode_init_once(void *data)
		{
		struct pidfs_inode *pi = data;

include/linux/coredump.h

+1 −0

Original line number	Diff line number	Diff line
		@@ -28,6 +28,7 @@ struct coredump_params {
		int vma_count;
		size_t vma_data_size;
		struct core_vma_metadata *vma_meta;
		struct pid *pid;
		};

		extern unsigned int core_file_note_size_limit;

include/linux/pid.h

+1 −1

Original line number	Diff line number	Diff line
		@@ -77,7 +77,7 @@ struct file;
		struct pid *pidfd_pid(const struct file *file);
		struct pid *pidfd_get_pid(unsigned int fd, unsigned int *flags);
		struct task_struct *pidfd_get_task(int pidfd, unsigned int *flags);
		int pidfd_prepare(struct pid *pid, unsigned int flags, struct file **ret);
		int pidfd_prepare(struct pid *pid, unsigned int flags, struct file **ret_file);
		void do_notify_pidfd(struct task_struct *task);

		static inline struct pid *get_pid(struct pid *pid)

include/linux/pidfs.h

+3 −0

Original line number	Diff line number	Diff line
		@@ -8,5 +8,8 @@ void pidfs_add_pid(struct pid *pid);
		void pidfs_remove_pid(struct pid *pid);
		void pidfs_exit(struct task_struct *tsk);
		extern const struct dentry_operations pidfs_dentry_operations;
		int pidfs_register_pid(struct pid *pid);
		void pidfs_get_pid(struct pid *pid);
		void pidfs_put_pid(struct pid *pid);

		#endif /* _LINUX_PID_FS_H */

Original line number	Diff line number	Diff line
		@@ -77,7 +77,7 @@ struct file;
		struct pid *pidfd_pid(const struct file *file);
		struct pid *pidfd_get_pid(unsigned int fd, unsigned int *flags);
		struct task_struct *pidfd_get_task(int pidfd, unsigned int *flags);
		int pidfd_prepare(struct pid *pid, unsigned int flags, struct file **ret);
		int pidfd_prepare(struct pid *pid, unsigned int flags, struct file **ret_file);
		void do_notify_pidfd(struct task_struct *task);

		static inline struct pid *get_pid(struct pid *pid)