mirror of
				https://github.com/torvalds/linux.git
				synced 2025-11-04 02:30:34 +02:00 
			
		
		
		
	fs/proc, core/debug: Don't expose absolute kernel addresses via wchan
So the /proc/PID/stat 'wchan' field (the 30th field, which contains
the absolute kernel address of the kernel function a task is blocked in)
leaks absolute kernel addresses to unprivileged user-space:
        seq_put_decimal_ull(m, ' ', wchan);
The absolute address might also leak via /proc/PID/wchan as well, if
KALLSYMS is turned off or if the symbol lookup fails for some reason:
static int proc_pid_wchan(struct seq_file *m, struct pid_namespace *ns,
                          struct pid *pid, struct task_struct *task)
{
        unsigned long wchan;
        char symname[KSYM_NAME_LEN];
        wchan = get_wchan(task);
        if (lookup_symbol_name(wchan, symname) < 0) {
                if (!ptrace_may_access(task, PTRACE_MODE_READ))
                        return 0;
                seq_printf(m, "%lu", wchan);
        } else {
                seq_printf(m, "%s", symname);
        }
        return 0;
}
This isn't ideal, because for example it trivially leaks the KASLR offset
to any local attacker:
  fomalhaut:~> printf "%016lx\n" $(cat /proc/$$/stat | cut -d' ' -f35)
  ffffffff8123b380
Most real-life uses of wchan are symbolic:
  ps -eo pid:10,tid:10,wchan:30,comm
and procps uses /proc/PID/wchan, not the absolute address in /proc/PID/stat:
  triton:~/tip> strace -f ps -eo pid:10,tid:10,wchan:30,comm 2>&1 | grep wchan | tail -1
  open("/proc/30833/wchan", O_RDONLY)     = 6
There's one compatibility quirk here: procps relies on whether the
absolute value is non-zero - and we can provide that functionality
by outputing "0" or "1" depending on whether the task is blocked
(whether there's a wchan address).
These days there appears to be very little legitimate reason
user-space would be interested in  the absolute address. The
absolute address is mostly historic: from the days when we
didn't have kallsyms and user-space procps had to do the
decoding itself via the System.map.
So this patch sets all numeric output to "0" or "1" and keeps only
symbolic output, in /proc/PID/wchan.
( The absolute sleep address can generally still be profiled via
  perf, by tasks with sufficient privileges. )
Reviewed-by: Thomas Gleixner <tglx@linutronix.de>
Acked-by: Kees Cook <keescook@chromium.org>
Acked-by: Linus Torvalds <torvalds@linux-foundation.org>
Cc: <stable@vger.kernel.org>
Cc: Al Viro <viro@zeniv.linux.org.uk>
Cc: Alexander Potapenko <glider@google.com>
Cc: Andrey Konovalov <andreyknvl@google.com>
Cc: Andrey Ryabinin <ryabinin.a.a@gmail.com>
Cc: Andy Lutomirski <luto@amacapital.net>
Cc: Andy Lutomirski <luto@kernel.org>
Cc: Borislav Petkov <bp@alien8.de>
Cc: Denys Vlasenko <dvlasenk@redhat.com>
Cc: Dmitry Vyukov <dvyukov@google.com>
Cc: Kostya Serebryany <kcc@google.com>
Cc: Mike Galbraith <efault@gmx.de>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Sasha Levin <sasha.levin@oracle.com>
Cc: kasan-dev <kasan-dev@googlegroups.com>
Cc: linux-kernel@vger.kernel.org
Link: http://lkml.kernel.org/r/20150930135917.GA3285@gmail.com
Signed-off-by: Ingo Molnar <mingo@kernel.org>
			
			
This commit is contained in:
		
							parent
							
								
									3225031fbe
								
							
						
					
					
						commit
						b2f73922d1
					
				
					 3 changed files with 20 additions and 10 deletions
				
			
		| 
						 | 
					@ -140,7 +140,8 @@ Table 1-1: Process specific entries in /proc
 | 
				
			||||||
 stat		Process status
 | 
					 stat		Process status
 | 
				
			||||||
 statm		Process memory status information
 | 
					 statm		Process memory status information
 | 
				
			||||||
 status		Process status in human readable form
 | 
					 status		Process status in human readable form
 | 
				
			||||||
 wchan		If CONFIG_KALLSYMS is set, a pre-decoded wchan
 | 
					 wchan		Present with CONFIG_KALLSYMS=y: it shows the kernel function
 | 
				
			||||||
 | 
							symbol the task is blocked in - or "0" if not blocked.
 | 
				
			||||||
 pagemap	Page table
 | 
					 pagemap	Page table
 | 
				
			||||||
 stack		Report full stack trace, enable via CONFIG_STACKTRACE
 | 
					 stack		Report full stack trace, enable via CONFIG_STACKTRACE
 | 
				
			||||||
 smaps		a extension based on maps, showing the memory consumption of
 | 
					 smaps		a extension based on maps, showing the memory consumption of
 | 
				
			||||||
| 
						 | 
					@ -310,7 +311,7 @@ Table 1-4: Contents of the stat files (as of 2.6.30-rc7)
 | 
				
			||||||
  blocked       bitmap of blocked signals
 | 
					  blocked       bitmap of blocked signals
 | 
				
			||||||
  sigign        bitmap of ignored signals
 | 
					  sigign        bitmap of ignored signals
 | 
				
			||||||
  sigcatch      bitmap of caught signals
 | 
					  sigcatch      bitmap of caught signals
 | 
				
			||||||
  wchan         address where process went to sleep
 | 
					  0		(place holder, used to be the wchan address, use /proc/PID/wchan instead)
 | 
				
			||||||
  0             (place holder)
 | 
					  0             (place holder)
 | 
				
			||||||
  0             (place holder)
 | 
					  0             (place holder)
 | 
				
			||||||
  exit_signal   signal to send to parent thread on exit
 | 
					  exit_signal   signal to send to parent thread on exit
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -375,7 +375,7 @@ int proc_pid_status(struct seq_file *m, struct pid_namespace *ns,
 | 
				
			||||||
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
 | 
					static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
 | 
				
			||||||
			struct pid *pid, struct task_struct *task, int whole)
 | 
								struct pid *pid, struct task_struct *task, int whole)
 | 
				
			||||||
{
 | 
					{
 | 
				
			||||||
	unsigned long vsize, eip, esp, wchan = ~0UL;
 | 
						unsigned long vsize, eip, esp, wchan = 0;
 | 
				
			||||||
	int priority, nice;
 | 
						int priority, nice;
 | 
				
			||||||
	int tty_pgrp = -1, tty_nr = 0;
 | 
						int tty_pgrp = -1, tty_nr = 0;
 | 
				
			||||||
	sigset_t sigign, sigcatch;
 | 
						sigset_t sigign, sigcatch;
 | 
				
			||||||
| 
						 | 
					@ -507,7 +507,19 @@ static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
 | 
				
			||||||
	seq_put_decimal_ull(m, ' ', task->blocked.sig[0] & 0x7fffffffUL);
 | 
						seq_put_decimal_ull(m, ' ', task->blocked.sig[0] & 0x7fffffffUL);
 | 
				
			||||||
	seq_put_decimal_ull(m, ' ', sigign.sig[0] & 0x7fffffffUL);
 | 
						seq_put_decimal_ull(m, ' ', sigign.sig[0] & 0x7fffffffUL);
 | 
				
			||||||
	seq_put_decimal_ull(m, ' ', sigcatch.sig[0] & 0x7fffffffUL);
 | 
						seq_put_decimal_ull(m, ' ', sigcatch.sig[0] & 0x7fffffffUL);
 | 
				
			||||||
	seq_put_decimal_ull(m, ' ', wchan);
 | 
					
 | 
				
			||||||
 | 
						/*
 | 
				
			||||||
 | 
						 * We used to output the absolute kernel address, but that's an
 | 
				
			||||||
 | 
						 * information leak - so instead we show a 0/1 flag here, to signal
 | 
				
			||||||
 | 
						 * to user-space whether there's a wchan field in /proc/PID/wchan.
 | 
				
			||||||
 | 
						 *
 | 
				
			||||||
 | 
						 * This works with older implementations of procps as well.
 | 
				
			||||||
 | 
						 */
 | 
				
			||||||
 | 
						if (wchan)
 | 
				
			||||||
 | 
							seq_puts(m, " 1");
 | 
				
			||||||
 | 
						else
 | 
				
			||||||
 | 
							seq_puts(m, " 0");
 | 
				
			||||||
 | 
					
 | 
				
			||||||
	seq_put_decimal_ull(m, ' ', 0);
 | 
						seq_put_decimal_ull(m, ' ', 0);
 | 
				
			||||||
	seq_put_decimal_ull(m, ' ', 0);
 | 
						seq_put_decimal_ull(m, ' ', 0);
 | 
				
			||||||
	seq_put_decimal_ll(m, ' ', task->exit_signal);
 | 
						seq_put_decimal_ll(m, ' ', task->exit_signal);
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -430,13 +430,10 @@ static int proc_pid_wchan(struct seq_file *m, struct pid_namespace *ns,
 | 
				
			||||||
 | 
					
 | 
				
			||||||
	wchan = get_wchan(task);
 | 
						wchan = get_wchan(task);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
	if (lookup_symbol_name(wchan, symname) < 0) {
 | 
						if (wchan && ptrace_may_access(task, PTRACE_MODE_READ) && !lookup_symbol_name(wchan, symname))
 | 
				
			||||||
		if (!ptrace_may_access(task, PTRACE_MODE_READ))
 | 
					 | 
				
			||||||
			return 0;
 | 
					 | 
				
			||||||
		seq_printf(m, "%lu", wchan);
 | 
					 | 
				
			||||||
	} else {
 | 
					 | 
				
			||||||
		seq_printf(m, "%s", symname);
 | 
							seq_printf(m, "%s", symname);
 | 
				
			||||||
	}
 | 
						else
 | 
				
			||||||
 | 
							seq_putc(m, '0');
 | 
				
			||||||
 | 
					
 | 
				
			||||||
	return 0;
 | 
						return 0;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in a new issue