2016-04-19 00:42:14 +08:00
|
|
|
/*
|
|
|
|
* kaslr.c
|
|
|
|
*
|
|
|
|
* This contains the routines needed to generate a reasonable level of
|
|
|
|
* entropy to choose a randomized kernel base address offset in support
|
|
|
|
* of Kernel Address Space Layout Randomization (KASLR). Additionally
|
|
|
|
* handles walking the physical memory maps (and tracking memory regions
|
|
|
|
* to avoid) in order to select a physical memory location that can
|
|
|
|
* contain the entire properly aligned running kernel image.
|
|
|
|
*
|
|
|
|
*/
|
2013-10-11 08:18:14 +08:00
|
|
|
#include "misc.h"
|
|
|
|
|
2013-10-11 08:18:15 +08:00
|
|
|
#include <asm/msr.h>
|
|
|
|
#include <asm/archrandom.h>
|
2013-10-11 08:18:16 +08:00
|
|
|
#include <asm/e820.h>
|
2013-10-11 08:18:15 +08:00
|
|
|
|
2013-11-12 06:28:39 +08:00
|
|
|
#include <generated/compile.h>
|
|
|
|
#include <linux/module.h>
|
|
|
|
#include <linux/uts.h>
|
|
|
|
#include <linux/utsname.h>
|
|
|
|
#include <generated/utsrelease.h>
|
|
|
|
|
|
|
|
/* Simplified build-specific string for starting entropy. */
|
2013-11-13 00:56:07 +08:00
|
|
|
static const char build_str[] = UTS_RELEASE " (" LINUX_COMPILE_BY "@"
|
2013-11-12 06:28:39 +08:00
|
|
|
LINUX_COMPILE_HOST ") (" LINUX_COMPILER ") " UTS_VERSION;
|
|
|
|
|
2013-10-11 08:18:15 +08:00
|
|
|
#define I8254_PORT_CONTROL 0x43
|
|
|
|
#define I8254_PORT_COUNTER0 0x40
|
|
|
|
#define I8254_CMD_READBACK 0xC0
|
|
|
|
#define I8254_SELECT_COUNTER0 0x02
|
|
|
|
#define I8254_STATUS_NOTREADY 0x40
|
|
|
|
static inline u16 i8254(void)
|
|
|
|
{
|
|
|
|
u16 status, timer;
|
|
|
|
|
|
|
|
do {
|
|
|
|
outb(I8254_PORT_CONTROL,
|
|
|
|
I8254_CMD_READBACK | I8254_SELECT_COUNTER0);
|
|
|
|
status = inb(I8254_PORT_COUNTER0);
|
|
|
|
timer = inb(I8254_PORT_COUNTER0);
|
|
|
|
timer |= inb(I8254_PORT_COUNTER0) << 8;
|
|
|
|
} while (status & I8254_STATUS_NOTREADY);
|
|
|
|
|
|
|
|
return timer;
|
|
|
|
}
|
|
|
|
|
2013-11-12 06:28:39 +08:00
|
|
|
static unsigned long rotate_xor(unsigned long hash, const void *area,
|
|
|
|
size_t size)
|
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
unsigned long *ptr = (unsigned long *)area;
|
|
|
|
|
|
|
|
for (i = 0; i < size / sizeof(hash); i++) {
|
|
|
|
/* Rotate by odd number of bits and XOR. */
|
|
|
|
hash = (hash << ((sizeof(hash) * 8) - 7)) | (hash >> 7);
|
|
|
|
hash ^= ptr[i];
|
|
|
|
}
|
|
|
|
|
|
|
|
return hash;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Attempt to create a simple but unpredictable starting entropy. */
|
|
|
|
static unsigned long get_random_boot(void)
|
|
|
|
{
|
|
|
|
unsigned long hash = 0;
|
|
|
|
|
|
|
|
hash = rotate_xor(hash, build_str, sizeof(build_str));
|
2016-04-19 00:42:12 +08:00
|
|
|
hash = rotate_xor(hash, boot_params, sizeof(*boot_params));
|
2013-11-12 06:28:39 +08:00
|
|
|
|
|
|
|
return hash;
|
|
|
|
}
|
|
|
|
|
2013-10-11 08:18:15 +08:00
|
|
|
static unsigned long get_random_long(void)
|
|
|
|
{
|
2013-11-12 14:45:20 +08:00
|
|
|
#ifdef CONFIG_X86_64
|
|
|
|
const unsigned long mix_const = 0x5d6008cbf3848dd3UL;
|
|
|
|
#else
|
|
|
|
const unsigned long mix_const = 0x3f39e593UL;
|
|
|
|
#endif
|
2013-11-12 06:28:39 +08:00
|
|
|
unsigned long raw, random = get_random_boot();
|
|
|
|
bool use_i8254 = true;
|
|
|
|
|
|
|
|
debug_putstr("KASLR using");
|
2013-10-11 08:18:15 +08:00
|
|
|
|
|
|
|
if (has_cpuflag(X86_FEATURE_RDRAND)) {
|
2013-11-12 06:28:39 +08:00
|
|
|
debug_putstr(" RDRAND");
|
|
|
|
if (rdrand_long(&raw)) {
|
|
|
|
random ^= raw;
|
|
|
|
use_i8254 = false;
|
|
|
|
}
|
2013-10-11 08:18:15 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (has_cpuflag(X86_FEATURE_TSC)) {
|
2013-11-12 06:28:39 +08:00
|
|
|
debug_putstr(" RDTSC");
|
2015-06-26 00:44:07 +08:00
|
|
|
raw = rdtsc();
|
2013-10-11 08:18:15 +08:00
|
|
|
|
2013-11-12 06:28:39 +08:00
|
|
|
random ^= raw;
|
|
|
|
use_i8254 = false;
|
|
|
|
}
|
2013-10-11 08:18:15 +08:00
|
|
|
|
2013-11-12 06:28:39 +08:00
|
|
|
if (use_i8254) {
|
|
|
|
debug_putstr(" i8254");
|
|
|
|
random ^= i8254();
|
2013-10-11 08:18:15 +08:00
|
|
|
}
|
|
|
|
|
2013-11-12 14:45:20 +08:00
|
|
|
/* Circular multiply for better bit diffusion */
|
|
|
|
asm("mul %3"
|
|
|
|
: "=a" (random), "=d" (raw)
|
|
|
|
: "a" (random), "rm" (mix_const));
|
|
|
|
random += raw;
|
|
|
|
|
2013-11-12 06:28:39 +08:00
|
|
|
debug_putstr("...\n");
|
|
|
|
|
2013-10-11 08:18:15 +08:00
|
|
|
return random;
|
|
|
|
}
|
2013-10-11 08:18:14 +08:00
|
|
|
|
2013-10-11 08:18:16 +08:00
|
|
|
struct mem_vector {
|
|
|
|
unsigned long start;
|
|
|
|
unsigned long size;
|
|
|
|
};
|
|
|
|
|
|
|
|
#define MEM_AVOID_MAX 5
|
2014-02-10 05:56:44 +08:00
|
|
|
static struct mem_vector mem_avoid[MEM_AVOID_MAX];
|
2013-10-11 08:18:16 +08:00
|
|
|
|
|
|
|
static bool mem_contains(struct mem_vector *region, struct mem_vector *item)
|
|
|
|
{
|
|
|
|
/* Item at least partially before region. */
|
|
|
|
if (item->start < region->start)
|
|
|
|
return false;
|
|
|
|
/* Item at least partially after region. */
|
|
|
|
if (item->start + item->size > region->start + region->size)
|
|
|
|
return false;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool mem_overlaps(struct mem_vector *one, struct mem_vector *two)
|
|
|
|
{
|
|
|
|
/* Item one is entirely before item two. */
|
|
|
|
if (one->start + one->size <= two->start)
|
|
|
|
return false;
|
|
|
|
/* Item one is entirely after item two. */
|
|
|
|
if (one->start >= two->start + two->size)
|
|
|
|
return false;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mem_avoid_init(unsigned long input, unsigned long input_size,
|
|
|
|
unsigned long output, unsigned long output_size)
|
|
|
|
{
|
|
|
|
u64 initrd_start, initrd_size;
|
|
|
|
u64 cmd_line, cmd_line_size;
|
|
|
|
unsigned long unsafe, unsafe_len;
|
|
|
|
char *ptr;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Avoid the region that is unsafe to overlap during
|
x86/KASLR: Update description for decompressor worst case size
The comment that describes the analysis for the size of the decompressor
code only took gzip into account (there are currently 6 other decompressors
that could be used). The actual z_extract_offset calculation in code was
already handling the correct maximum size, but this documentation hadn't
been updated. This updates the documentation, fixes several typos, moves
the comment to header.S, updates references, and adds a note at the end
of the decompressor include list to remind us about updating the comment
in the future.
(Instead of moving the comment to mkpiggy.c, where the calculation
is currently happening, it is being moved to header.S because
the calculations in mkpiggy.c will be removed in favor of header.S
calculations in a following patch, and it seemed like overkill to move
the giant comment twice, especially when there's already reference to
z_extract_offset in header.S.)
Signed-off-by: Baoquan He <bhe@redhat.com>
[ Rewrote changelog, cleaned up comment style, moved comments around. ]
Signed-off-by: Kees Cook <keescook@chromium.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Cc: Andrey Ryabinin <aryabinin@virtuozzo.com>
Cc: Andy Lutomirski <luto@amacapital.net>
Cc: Andy Lutomirski <luto@kernel.org>
Cc: Borislav Petkov <bp@alien8.de>
Cc: Borislav Petkov <bp@suse.de>
Cc: Brian Gerst <brgerst@gmail.com>
Cc: Denys Vlasenko <dvlasenk@redhat.com>
Cc: Dmitry Vyukov <dvyukov@google.com>
Cc: H. Peter Anvin <hpa@zytor.com>
Cc: H.J. Lu <hjl.tools@gmail.com>
Cc: Josh Poimboeuf <jpoimboe@redhat.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Yinghai Lu <yinghai@kernel.org>
Link: http://lkml.kernel.org/r/1461185746-8017-2-git-send-email-keescook@chromium.org
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2016-04-21 04:55:42 +08:00
|
|
|
* decompression (see calculations in ../header.S).
|
2013-10-11 08:18:16 +08:00
|
|
|
*/
|
|
|
|
unsafe_len = (output_size >> 12) + 32768 + 18;
|
|
|
|
unsafe = (unsigned long)input + input_size - unsafe_len;
|
|
|
|
mem_avoid[0].start = unsafe;
|
|
|
|
mem_avoid[0].size = unsafe_len;
|
|
|
|
|
|
|
|
/* Avoid initrd. */
|
2016-04-19 00:42:12 +08:00
|
|
|
initrd_start = (u64)boot_params->ext_ramdisk_image << 32;
|
|
|
|
initrd_start |= boot_params->hdr.ramdisk_image;
|
|
|
|
initrd_size = (u64)boot_params->ext_ramdisk_size << 32;
|
|
|
|
initrd_size |= boot_params->hdr.ramdisk_size;
|
2013-10-11 08:18:16 +08:00
|
|
|
mem_avoid[1].start = initrd_start;
|
|
|
|
mem_avoid[1].size = initrd_size;
|
|
|
|
|
|
|
|
/* Avoid kernel command line. */
|
2016-04-19 00:42:12 +08:00
|
|
|
cmd_line = (u64)boot_params->ext_cmd_line_ptr << 32;
|
|
|
|
cmd_line |= boot_params->hdr.cmd_line_ptr;
|
2013-10-11 08:18:16 +08:00
|
|
|
/* Calculate size of cmd_line. */
|
|
|
|
ptr = (char *)(unsigned long)cmd_line;
|
|
|
|
for (cmd_line_size = 0; ptr[cmd_line_size++]; )
|
|
|
|
;
|
|
|
|
mem_avoid[2].start = cmd_line;
|
|
|
|
mem_avoid[2].size = cmd_line_size;
|
|
|
|
|
|
|
|
/* Avoid heap memory. */
|
|
|
|
mem_avoid[3].start = (unsigned long)free_mem_ptr;
|
|
|
|
mem_avoid[3].size = BOOT_HEAP_SIZE;
|
|
|
|
|
|
|
|
/* Avoid stack memory. */
|
|
|
|
mem_avoid[4].start = (unsigned long)free_mem_end_ptr;
|
|
|
|
mem_avoid[4].size = BOOT_STACK_SIZE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Does this memory vector overlap a known avoided area? */
|
2014-02-10 05:56:44 +08:00
|
|
|
static bool mem_avoid_overlap(struct mem_vector *img)
|
2013-10-11 08:18:16 +08:00
|
|
|
{
|
|
|
|
int i;
|
2014-09-12 00:19:31 +08:00
|
|
|
struct setup_data *ptr;
|
2013-10-11 08:18:16 +08:00
|
|
|
|
|
|
|
for (i = 0; i < MEM_AVOID_MAX; i++) {
|
|
|
|
if (mem_overlaps(img, &mem_avoid[i]))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2014-09-12 00:19:31 +08:00
|
|
|
/* Avoid all entries in the setup_data linked list. */
|
2016-04-19 00:42:12 +08:00
|
|
|
ptr = (struct setup_data *)(unsigned long)boot_params->hdr.setup_data;
|
2014-09-12 00:19:31 +08:00
|
|
|
while (ptr) {
|
|
|
|
struct mem_vector avoid;
|
|
|
|
|
2014-10-02 02:36:32 +08:00
|
|
|
avoid.start = (unsigned long)ptr;
|
2014-09-12 00:19:31 +08:00
|
|
|
avoid.size = sizeof(*ptr) + ptr->len;
|
|
|
|
|
|
|
|
if (mem_overlaps(img, &avoid))
|
|
|
|
return true;
|
|
|
|
|
|
|
|
ptr = (struct setup_data *)(unsigned long)ptr->next;
|
|
|
|
}
|
|
|
|
|
2013-10-11 08:18:16 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-04-21 04:55:43 +08:00
|
|
|
static unsigned long slots[KERNEL_IMAGE_SIZE / CONFIG_PHYSICAL_ALIGN];
|
2014-02-10 05:56:44 +08:00
|
|
|
static unsigned long slot_max;
|
2013-10-11 08:18:16 +08:00
|
|
|
|
|
|
|
static void slots_append(unsigned long addr)
|
|
|
|
{
|
|
|
|
/* Overflowing the slots list should be impossible. */
|
2016-04-21 04:55:43 +08:00
|
|
|
if (slot_max >= KERNEL_IMAGE_SIZE / CONFIG_PHYSICAL_ALIGN)
|
2013-10-11 08:18:16 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
slots[slot_max++] = addr;
|
|
|
|
}
|
|
|
|
|
|
|
|
static unsigned long slots_fetch_random(void)
|
|
|
|
{
|
|
|
|
/* Handle case of no slots stored. */
|
|
|
|
if (slot_max == 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
return slots[get_random_long() % slot_max];
|
|
|
|
}
|
|
|
|
|
|
|
|
static void process_e820_entry(struct e820entry *entry,
|
|
|
|
unsigned long minimum,
|
|
|
|
unsigned long image_size)
|
|
|
|
{
|
|
|
|
struct mem_vector region, img;
|
|
|
|
|
|
|
|
/* Skip non-RAM entries. */
|
|
|
|
if (entry->type != E820_RAM)
|
|
|
|
return;
|
|
|
|
|
|
|
|
/* Ignore entries entirely above our maximum. */
|
2016-04-21 04:55:43 +08:00
|
|
|
if (entry->addr >= KERNEL_IMAGE_SIZE)
|
2013-10-11 08:18:16 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
/* Ignore entries entirely below our minimum. */
|
|
|
|
if (entry->addr + entry->size < minimum)
|
|
|
|
return;
|
|
|
|
|
|
|
|
region.start = entry->addr;
|
|
|
|
region.size = entry->size;
|
|
|
|
|
|
|
|
/* Potentially raise address to minimum location. */
|
|
|
|
if (region.start < minimum)
|
|
|
|
region.start = minimum;
|
|
|
|
|
|
|
|
/* Potentially raise address to meet alignment requirements. */
|
|
|
|
region.start = ALIGN(region.start, CONFIG_PHYSICAL_ALIGN);
|
|
|
|
|
|
|
|
/* Did we raise the address above the bounds of this e820 region? */
|
|
|
|
if (region.start > entry->addr + entry->size)
|
|
|
|
return;
|
|
|
|
|
|
|
|
/* Reduce size by any delta from the original address. */
|
|
|
|
region.size -= region.start - entry->addr;
|
|
|
|
|
|
|
|
/* Reduce maximum size to fit end of image within maximum limit. */
|
2016-04-21 04:55:43 +08:00
|
|
|
if (region.start + region.size > KERNEL_IMAGE_SIZE)
|
|
|
|
region.size = KERNEL_IMAGE_SIZE - region.start;
|
2013-10-11 08:18:16 +08:00
|
|
|
|
|
|
|
/* Walk each aligned slot and check for avoided areas. */
|
|
|
|
for (img.start = region.start, img.size = image_size ;
|
|
|
|
mem_contains(®ion, &img) ;
|
|
|
|
img.start += CONFIG_PHYSICAL_ALIGN) {
|
|
|
|
if (mem_avoid_overlap(&img))
|
|
|
|
continue;
|
|
|
|
slots_append(img.start);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static unsigned long find_random_addr(unsigned long minimum,
|
|
|
|
unsigned long size)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
unsigned long addr;
|
|
|
|
|
|
|
|
/* Make sure minimum is aligned. */
|
|
|
|
minimum = ALIGN(minimum, CONFIG_PHYSICAL_ALIGN);
|
|
|
|
|
|
|
|
/* Verify potential e820 positions, appending to slots list. */
|
2016-04-19 00:42:12 +08:00
|
|
|
for (i = 0; i < boot_params->e820_entries; i++) {
|
|
|
|
process_e820_entry(&boot_params->e820_map[i], minimum, size);
|
2013-10-11 08:18:16 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return slots_fetch_random();
|
|
|
|
}
|
|
|
|
|
2016-04-19 00:42:14 +08:00
|
|
|
unsigned char *choose_random_location(unsigned char *input,
|
2013-10-11 08:18:14 +08:00
|
|
|
unsigned long input_size,
|
|
|
|
unsigned char *output,
|
|
|
|
unsigned long output_size)
|
|
|
|
{
|
|
|
|
unsigned long choice = (unsigned long)output;
|
2016-04-19 00:42:15 +08:00
|
|
|
unsigned long random_addr;
|
2013-10-11 08:18:14 +08:00
|
|
|
|
2014-06-14 04:30:36 +08:00
|
|
|
#ifdef CONFIG_HIBERNATION
|
|
|
|
if (!cmdline_find_option_bool("kaslr")) {
|
|
|
|
debug_putstr("KASLR disabled by default...\n");
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
#else
|
2013-10-11 08:18:14 +08:00
|
|
|
if (cmdline_find_option_bool("nokaslr")) {
|
2014-06-14 04:30:36 +08:00
|
|
|
debug_putstr("KASLR disabled by cmdline...\n");
|
2013-10-11 08:18:14 +08:00
|
|
|
goto out;
|
|
|
|
}
|
2014-06-14 04:30:36 +08:00
|
|
|
#endif
|
2013-10-11 08:18:14 +08:00
|
|
|
|
2016-04-19 00:42:12 +08:00
|
|
|
boot_params->hdr.loadflags |= KASLR_FLAG;
|
2015-04-01 18:49:52 +08:00
|
|
|
|
2013-10-11 08:18:16 +08:00
|
|
|
/* Record the various known unsafe memory ranges. */
|
|
|
|
mem_avoid_init((unsigned long)input, input_size,
|
|
|
|
(unsigned long)output, output_size);
|
|
|
|
|
|
|
|
/* Walk e820 and find a random address. */
|
2016-04-19 00:42:15 +08:00
|
|
|
random_addr = find_random_addr(choice, output_size);
|
|
|
|
if (!random_addr) {
|
2013-10-11 08:18:16 +08:00
|
|
|
debug_putstr("KASLR could not find suitable E820 region...\n");
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Always enforce the minimum. */
|
2016-04-19 00:42:15 +08:00
|
|
|
if (random_addr < choice)
|
2013-10-11 08:18:16 +08:00
|
|
|
goto out;
|
2013-10-11 08:18:14 +08:00
|
|
|
|
2016-04-19 00:42:15 +08:00
|
|
|
choice = random_addr;
|
2013-10-11 08:18:14 +08:00
|
|
|
out:
|
|
|
|
return (unsigned char *)choice;
|
|
|
|
}
|