2008-03-22 02:37:08 +03:00
|
|
|
/*
|
|
|
|
* Hypervisor-assisted dump
|
|
|
|
*
|
|
|
|
* Linas Vepstas, Manish Ahuja 2008
|
|
|
|
* Copyright 2008 IBM Corp.
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License
|
|
|
|
* as published by the Free Software Foundation; either version
|
|
|
|
* 2 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/init.h>
|
2008-03-22 02:39:17 +03:00
|
|
|
#include <linux/kobject.h>
|
2008-03-22 02:37:08 +03:00
|
|
|
#include <linux/mm.h>
|
2008-03-22 02:39:17 +03:00
|
|
|
#include <linux/of.h>
|
2008-03-22 02:37:08 +03:00
|
|
|
#include <linux/pfn.h>
|
|
|
|
#include <linux/swap.h>
|
2008-03-22 02:39:17 +03:00
|
|
|
#include <linux/sysfs.h>
|
2008-03-22 02:37:08 +03:00
|
|
|
|
|
|
|
#include <asm/page.h>
|
|
|
|
#include <asm/phyp_dump.h>
|
|
|
|
#include <asm/machdep.h>
|
|
|
|
#include <asm/prom.h>
|
2008-03-22 02:39:17 +03:00
|
|
|
#include <asm/rtas.h>
|
2008-03-22 02:37:08 +03:00
|
|
|
|
|
|
|
/* Variables, used to communicate data between early boot and late boot */
|
|
|
|
static struct phyp_dump phyp_dump_vars;
|
|
|
|
struct phyp_dump *phyp_dump_info = &phyp_dump_vars;
|
|
|
|
|
2008-03-22 02:43:15 +03:00
|
|
|
static int ibm_configure_kernel_dump;
|
|
|
|
/* ------------------------------------------------- */
|
|
|
|
/* RTAS interfaces to declare the dump regions */
|
|
|
|
|
|
|
|
struct dump_section {
|
|
|
|
u32 dump_flags;
|
|
|
|
u16 source_type;
|
|
|
|
u16 error_flags;
|
|
|
|
u64 source_address;
|
|
|
|
u64 source_length;
|
|
|
|
u64 length_copied;
|
|
|
|
u64 destination_address;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct phyp_dump_header {
|
|
|
|
u32 version;
|
|
|
|
u16 num_of_sections;
|
|
|
|
u16 status;
|
|
|
|
|
|
|
|
u32 first_offset_section;
|
|
|
|
u32 dump_disk_section;
|
|
|
|
u64 block_num_dd;
|
|
|
|
u64 num_of_blocks_dd;
|
|
|
|
u32 offset_dd;
|
|
|
|
u32 maxtime_to_auto;
|
|
|
|
/* No dump disk path string used */
|
|
|
|
|
|
|
|
struct dump_section cpu_data;
|
|
|
|
struct dump_section hpte_data;
|
|
|
|
struct dump_section kernel_data;
|
|
|
|
};
|
|
|
|
|
|
|
|
/* The dump header *must be* in low memory, so .bss it */
|
|
|
|
static struct phyp_dump_header phdr;
|
|
|
|
|
|
|
|
#define NUM_DUMP_SECTIONS 3
|
|
|
|
#define DUMP_HEADER_VERSION 0x1
|
|
|
|
#define DUMP_REQUEST_FLAG 0x1
|
|
|
|
#define DUMP_SOURCE_CPU 0x0001
|
|
|
|
#define DUMP_SOURCE_HPTE 0x0002
|
|
|
|
#define DUMP_SOURCE_RMO 0x0011
|
|
|
|
|
|
|
|
/**
|
|
|
|
* init_dump_header() - initialize the header declaring a dump
|
|
|
|
* Returns: length of dump save area.
|
|
|
|
*
|
|
|
|
* When the hypervisor saves crashed state, it needs to put
|
|
|
|
* it somewhere. The dump header tells the hypervisor where
|
|
|
|
* the data can be saved.
|
|
|
|
*/
|
|
|
|
static unsigned long init_dump_header(struct phyp_dump_header *ph)
|
|
|
|
{
|
|
|
|
unsigned long addr_offset = 0;
|
|
|
|
|
|
|
|
/* Set up the dump header */
|
|
|
|
ph->version = DUMP_HEADER_VERSION;
|
|
|
|
ph->num_of_sections = NUM_DUMP_SECTIONS;
|
|
|
|
ph->status = 0;
|
|
|
|
|
|
|
|
ph->first_offset_section =
|
|
|
|
(u32)offsetof(struct phyp_dump_header, cpu_data);
|
|
|
|
ph->dump_disk_section = 0;
|
|
|
|
ph->block_num_dd = 0;
|
|
|
|
ph->num_of_blocks_dd = 0;
|
|
|
|
ph->offset_dd = 0;
|
|
|
|
|
|
|
|
ph->maxtime_to_auto = 0; /* disabled */
|
|
|
|
|
|
|
|
/* The first two sections are mandatory */
|
|
|
|
ph->cpu_data.dump_flags = DUMP_REQUEST_FLAG;
|
|
|
|
ph->cpu_data.source_type = DUMP_SOURCE_CPU;
|
|
|
|
ph->cpu_data.source_address = 0;
|
|
|
|
ph->cpu_data.source_length = phyp_dump_info->cpu_state_size;
|
|
|
|
ph->cpu_data.destination_address = addr_offset;
|
|
|
|
addr_offset += phyp_dump_info->cpu_state_size;
|
|
|
|
|
|
|
|
ph->hpte_data.dump_flags = DUMP_REQUEST_FLAG;
|
|
|
|
ph->hpte_data.source_type = DUMP_SOURCE_HPTE;
|
|
|
|
ph->hpte_data.source_address = 0;
|
|
|
|
ph->hpte_data.source_length = phyp_dump_info->hpte_region_size;
|
|
|
|
ph->hpte_data.destination_address = addr_offset;
|
|
|
|
addr_offset += phyp_dump_info->hpte_region_size;
|
|
|
|
|
|
|
|
/* This section describes the low kernel region */
|
|
|
|
ph->kernel_data.dump_flags = DUMP_REQUEST_FLAG;
|
|
|
|
ph->kernel_data.source_type = DUMP_SOURCE_RMO;
|
|
|
|
ph->kernel_data.source_address = PHYP_DUMP_RMR_START;
|
|
|
|
ph->kernel_data.source_length = PHYP_DUMP_RMR_END;
|
|
|
|
ph->kernel_data.destination_address = addr_offset;
|
|
|
|
addr_offset += ph->kernel_data.source_length;
|
|
|
|
|
|
|
|
return addr_offset;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void register_dump_area(struct phyp_dump_header *ph, unsigned long addr)
|
|
|
|
{
|
|
|
|
int rc;
|
|
|
|
ph->cpu_data.destination_address += addr;
|
|
|
|
ph->hpte_data.destination_address += addr;
|
|
|
|
ph->kernel_data.destination_address += addr;
|
|
|
|
|
|
|
|
do {
|
|
|
|
rc = rtas_call(ibm_configure_kernel_dump, 3, 1, NULL,
|
|
|
|
1, ph, sizeof(struct phyp_dump_header));
|
|
|
|
} while (rtas_busy_delay(rc));
|
|
|
|
|
|
|
|
if (rc)
|
|
|
|
printk(KERN_ERR "phyp-dump: unexpected error (%d) on "
|
|
|
|
"register\n", rc);
|
|
|
|
}
|
|
|
|
|
2008-03-22 02:39:17 +03:00
|
|
|
/* ------------------------------------------------- */
|
2008-03-22 02:37:08 +03:00
|
|
|
/**
|
|
|
|
* release_memory_range -- release memory previously lmb_reserved
|
|
|
|
* @start_pfn: starting physical frame number
|
|
|
|
* @nr_pages: number of pages to free.
|
|
|
|
*
|
|
|
|
* This routine will release memory that had been previously
|
|
|
|
* lmb_reserved in early boot. The released memory becomes
|
|
|
|
* available for genreal use.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
release_memory_range(unsigned long start_pfn, unsigned long nr_pages)
|
|
|
|
{
|
|
|
|
struct page *rpage;
|
|
|
|
unsigned long end_pfn;
|
|
|
|
long i;
|
|
|
|
|
|
|
|
end_pfn = start_pfn + nr_pages;
|
|
|
|
|
|
|
|
for (i = start_pfn; i <= end_pfn; i++) {
|
|
|
|
rpage = pfn_to_page(i);
|
|
|
|
if (PageReserved(rpage)) {
|
|
|
|
ClearPageReserved(rpage);
|
|
|
|
init_page_count(rpage);
|
|
|
|
__free_page(rpage);
|
|
|
|
totalram_pages++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2008-03-22 02:39:17 +03:00
|
|
|
/* ------------------------------------------------- */
|
|
|
|
/**
|
|
|
|
* sysfs_release_region -- sysfs interface to release memory range.
|
|
|
|
*
|
|
|
|
* Usage:
|
|
|
|
* "echo <start addr> <length> > /sys/kernel/release_region"
|
|
|
|
*
|
|
|
|
* Example:
|
|
|
|
* "echo 0x40000000 0x10000000 > /sys/kernel/release_region"
|
|
|
|
*
|
|
|
|
* will release 256MB starting at 1GB.
|
|
|
|
*/
|
|
|
|
static ssize_t store_release_region(struct kobject *kobj,
|
|
|
|
struct kobj_attribute *attr,
|
|
|
|
const char *buf, size_t count)
|
2008-03-22 02:37:08 +03:00
|
|
|
{
|
2008-03-22 02:39:17 +03:00
|
|
|
unsigned long start_addr, length, end_addr;
|
2008-03-22 02:37:08 +03:00
|
|
|
unsigned long start_pfn, nr_pages;
|
2008-03-22 02:39:17 +03:00
|
|
|
ssize_t ret;
|
|
|
|
|
|
|
|
ret = sscanf(buf, "%lx %lx", &start_addr, &length);
|
|
|
|
if (ret != 2)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
/* Range-check - don't free any reserved memory that
|
|
|
|
* wasn't reserved for phyp-dump */
|
|
|
|
if (start_addr < phyp_dump_info->init_reserve_start)
|
|
|
|
start_addr = phyp_dump_info->init_reserve_start;
|
|
|
|
|
|
|
|
end_addr = phyp_dump_info->init_reserve_start +
|
|
|
|
phyp_dump_info->init_reserve_size;
|
|
|
|
if (start_addr+length > end_addr)
|
|
|
|
length = end_addr - start_addr;
|
|
|
|
|
|
|
|
/* Release the region of memory assed in by user */
|
|
|
|
start_pfn = PFN_DOWN(start_addr);
|
|
|
|
nr_pages = PFN_DOWN(length);
|
|
|
|
release_memory_range(start_pfn, nr_pages);
|
|
|
|
|
|
|
|
return count;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct kobj_attribute rr = __ATTR(release_region, 0600,
|
|
|
|
NULL, store_release_region);
|
|
|
|
|
|
|
|
/**
 * phyp_dump_setup() - late-boot setup for hypervisor-assisted dump
 *
 * Nothing is done if early boot reserved no memory.  Otherwise the
 * /rtas node is checked for an "ibm,kernel-dump" property:
 *
 *  - absent: no dump data is waiting, so a new dump area is registered
 *    with firmware, starting at the page-aligned beginning of the
 *    reserved memory;
 *  - present: dump data is waiting, so the release_region sysfs file is
 *    created to let the reserved memory be handed back.
 *
 * Returns: 0 on success or when there is nothing to do, -ENOSYS if
 * phyp dump is not configured or the RTAS service needed to register a
 * dump area is missing.
 */
static int __init phyp_dump_setup(void)
{
	struct device_node *rtas;
	const struct phyp_dump_header *dump_header = NULL;
	unsigned long dump_area_start;
	int rc;

	/* If no memory was reserved in early boot, there is nothing to do */
	if (phyp_dump_info->init_reserve_size == 0)
		return 0;

	/* Return if phyp dump not supported */
	if (!phyp_dump_info->phyp_dump_configured)
		return -ENOSYS;

	/* Is there dump data waiting for us? If there isn't,
	 * then register a new dump area.
	 *
	 * The /rtas/ibm,kernel-dump rtas node is present only
	 * if there is dump data waiting for us.
	 */
	rtas = of_find_node_by_path("/rtas");
	if (rtas) {
		/* Only the presence of the property matters here */
		dump_header = of_get_property(rtas, "ibm,kernel-dump", NULL);
		of_node_put(rtas);
	}

	/*
	 * Look up the RTAS token that register_dump_area() passes to
	 * rtas_call(); without this the call would be made with token 0.
	 */
	ibm_configure_kernel_dump = rtas_token("ibm,configure-kernel-dump");

	/* Fill in the header; its section offsets are rebased below */
	init_dump_header(&phdr);

	/* align down */
	dump_area_start = phyp_dump_info->init_reserve_start & PAGE_MASK;

	if (dump_header == NULL) {
		if (ibm_configure_kernel_dump == RTAS_UNKNOWN_SERVICE)
			return -ENOSYS;
		register_dump_area(&phdr, dump_area_start);
		return 0;
	}

	/* Should we create a dump_subsys, analogous to s390/ipl.c ? */
	rc = sysfs_create_file(kernel_kobj, &rr.attr);
	if (rc)
		printk(KERN_ERR "phyp-dump: unable to create sysfs file (%d)\n",
		       rc);

	/* ToDo: re-register the dump area, for next time. */
	return 0;
}
machine_subsys_initcall(pseries, phyp_dump_setup);
|
|
|
|
|
|
|
|
/**
 * early_init_dt_scan_phyp_dump() - collect phyp-dump info from the
 * flat device tree
 * @node: flat device tree node being visited
 * @uname: name of that node
 * @depth: depth of that node in the tree
 * @data: unused
 *
 * Both phyp_dump_configured and phyp_dump_is_active are cleared at the
 * top of every call.  For the depth-1 node named "rtas" they are then
 * set from the presence of "ibm,configure-kernel-dump" and
 * "ibm,dump-kernel", and the CPU state and HPTE region sizes are read
 * from "ibm,configure-kernel-dump-sizes".
 *
 * That property is read as 32-bit cells: cell 0 is an id (1 selects
 * the CPU state size) followed by a 64-bit size in cells 1-2; cell 3
 * is an id (2 selects the HPTE region size) followed by a 64-bit size
 * in cells 4-5.
 *
 * Returns: 1 once the rtas node with a sizes property has been
 * processed, 0 otherwise (presumably telling the caller to keep
 * scanning - confirm against the flat device tree scan helper).
 */
int __init early_init_dt_scan_phyp_dump(unsigned long node,
		const char *uname, int depth, void *data)
{
	const unsigned int *sizes;
	unsigned long size;

	phyp_dump_info->phyp_dump_configured = 0;
	phyp_dump_info->phyp_dump_is_active = 0;

	if (depth != 1 || strcmp(uname, "rtas") != 0)
		return 0;

	if (of_get_flat_dt_prop(node, "ibm,configure-kernel-dump", NULL))
		phyp_dump_info->phyp_dump_configured++;

	if (of_get_flat_dt_prop(node, "ibm,dump-kernel", NULL))
		phyp_dump_info->phyp_dump_is_active++;

	/*
	 * NOTE(review): the property length is not checked; six cells
	 * are assumed to be present.
	 */
	sizes = of_get_flat_dt_prop(node, "ibm,configure-kernel-dump-sizes",
				    NULL);
	if (!sizes)
		return 0;

	/*
	 * The 64-bit sizes sit at cell offsets 1 and 4, which are only
	 * guaranteed to be 4-byte aligned.  Copy them out with memcpy()
	 * rather than dereferencing a cast pointer, which would also
	 * discard the const qualifier.
	 */
	if (sizes[0] == 1) {
		memcpy(&size, &sizes[1], sizeof(size));
		phyp_dump_info->cpu_state_size = size;
	}

	if (sizes[3] == 2) {
		memcpy(&size, &sizes[4], sizeof(size));
		phyp_dump_info->hpte_region_size = size;
	}

	return 1;
}
|