hotplug-memory.c 5.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12
/*
 * pseries Memory Hotplug infrastructure.
 *
 * Copyright (C) 2008 Badari Pulavarty, IBM Corporation
 *
 *      This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */

#include <linux/of.h>
Y
Yinghai Lu 已提交
13
#include <linux/memblock.h>
14
#include <linux/vmalloc.h>
15 16
#include <linux/memory.h>

17 18 19
#include <asm/firmware.h>
#include <asm/machdep.h>
#include <asm/pSeries_reconfig.h>
20
#include <asm/sparsemem.h>
21

22 23 24
static unsigned long get_memblock_size(void)
{
	struct device_node *np;
25 26
	unsigned int memblock_size = MIN_MEMORY_BLOCK_SIZE;
	struct resource r;
27 28 29

	np = of_find_node_by_path("/ibm,dynamic-reconfiguration-memory");
	if (np) {
30
		const __be64 *size;
31 32

		size = of_get_property(np, "ibm,lmb-size", NULL);
33 34
		if (size)
			memblock_size = be64_to_cpup(size);
35
		of_node_put(np);
36 37
	} else  if (machine_is(pseries)) {
		/* This fallback really only applies to pseries */
38 39 40 41
		unsigned int memzero_size = 0;

		np = of_find_node_by_path("/memory@0");
		if (np) {
42 43
			if (!of_address_to_resource(np, 0, &r))
				memzero_size = resource_size(&r);
44 45 46 47 48 49 50 51 52 53 54 55
			of_node_put(np);
		}

		if (memzero_size) {
			/* We now know the size of memory@0, use this to find
			 * the first memoryblock and get its size.
			 */
			char buf[64];

			sprintf(buf, "/memory@%x", memzero_size);
			np = of_find_node_by_path(buf);
			if (np) {
56 57
				if (!of_address_to_resource(np, 0, &r))
					memblock_size = resource_size(&r);
58 59 60 61 62 63 64
				of_node_put(np);
			}
		}
	}
	return memblock_size;
}

65 66 67 68 69 70
/* WARNING: This is going to override the generic definition whenever
 * pseries is built-in regardless of what platform is active at boot
 * time. This is fine for now as this is the only "option" and it
 * should work everywhere. If not, we'll have to turn this into a
 * ppc_md. callback
 */
71 72 73 74 75
/* Report the memory block size, in bytes, as computed by get_memblock_size(). */
unsigned long memory_block_size_bytes(void)
{
	unsigned long block_bytes = get_memblock_size();

	return block_bytes;
}

Y
Yinghai Lu 已提交
76
static int pseries_remove_memblock(unsigned long base, unsigned int memblock_size)
77
{
78
	unsigned long start, start_pfn;
79
	struct zone *zone;
80 81
	int i, ret;
	int sections_to_remove;
82

83
	start_pfn = base >> PAGE_SHIFT;
84 85

	if (!pfn_valid(start_pfn)) {
Y
Yinghai Lu 已提交
86
		memblock_remove(base, memblock_size);
87 88 89
		return 0;
	}

90 91 92 93 94 95 96 97 98 99 100
	zone = page_zone(pfn_to_page(start_pfn));

	/*
	 * Remove section mappings and sysfs entries for the
	 * section of the memory we are removing.
	 *
	 * NOTE: Ideally, this should be done in generic code like
	 * remove_memory(). But remove_memory() gets called by writing
	 * to sysfs "state" file and we can't remove sysfs entries
	 * while writing to it. So we have to defer it to here.
	 */
101 102 103 104 105 106 107
	sections_to_remove = (memblock_size >> PAGE_SHIFT) / PAGES_PER_SECTION;
	for (i = 0; i < sections_to_remove; i++) {
		unsigned long pfn = start_pfn + i * PAGES_PER_SECTION;
		ret = __remove_pages(zone, start_pfn,  PAGES_PER_SECTION);
		if (ret)
			return ret;
	}
108

109 110 111
	/*
	 * Update memory regions for memory remove
	 */
Y
Yinghai Lu 已提交
112
	memblock_remove(base, memblock_size);
113

114 115 116
	/*
	 * Remove htab bolted mappings for this section of memory
	 */
117
	start = (unsigned long)__va(base);
Y
Yinghai Lu 已提交
118
	ret = remove_section_mapping(start, start + memblock_size);
119 120 121 122 123 124

	/* Ensure all vmalloc mappings are flushed in case they also
	 * hit that section of memory
	 */
	vm_unmap_aliases();

125 126 127
	return ret;
}

128 129 130 131 132
static int pseries_remove_memory(struct device_node *np)
{
	const char *type;
	const unsigned int *regs;
	unsigned long base;
133
	unsigned int lmb_size;
134 135 136 137 138 139 140 141 142 143
	int ret = -EINVAL;

	/*
	 * Check to see if we are actually removing memory
	 */
	type = of_get_property(np, "device_type", NULL);
	if (type == NULL || strcmp(type, "memory") != 0)
		return 0;

	/*
Y
Yinghai Lu 已提交
144
	 * Find the bae address and size of the memblock
145 146 147 148 149 150
	 */
	regs = of_get_property(np, "reg", NULL);
	if (!regs)
		return ret;

	base = *(unsigned long *)regs;
151
	lmb_size = regs[3];
152

153
	ret = pseries_remove_memblock(base, lmb_size);
154 155 156
	return ret;
}

157 158 159 160
static int pseries_add_memory(struct device_node *np)
{
	const char *type;
	const unsigned int *regs;
161
	unsigned long base;
162
	unsigned int lmb_size;
163 164 165 166 167 168 169 170 171 172
	int ret = -EINVAL;

	/*
	 * Check to see if we are actually adding memory
	 */
	type = of_get_property(np, "device_type", NULL);
	if (type == NULL || strcmp(type, "memory") != 0)
		return 0;

	/*
Y
Yinghai Lu 已提交
173
	 * Find the base and size of the memblock
174 175 176 177 178
	 */
	regs = of_get_property(np, "reg", NULL);
	if (!regs)
		return ret;

179
	base = *(unsigned long *)regs;
180
	lmb_size = regs[3];
181 182 183 184

	/*
	 * Update memory region to represent the memory add
	 */
185
	ret = memblock_add(base, lmb_size);
186 187 188 189 190
	return (ret < 0) ? -EINVAL : 0;
}

/*
 * Add or remove a single memory block at address *@base, depending on
 * @action.  The block size comes from get_memblock_size().
 *
 * Returns 0 on success; -EINVAL when the block size is zero, when
 * memblock_add() fails or when @action is neither DRCONF value; for a
 * remove, the result of pseries_remove_memblock().
 */
static int pseries_drconf_memory(unsigned long *base, unsigned int action)
{
	unsigned long block_bytes = get_memblock_size();
	int status;

	if (!block_bytes)
		return -EINVAL;

	switch (action) {
	case PSERIES_DRCONF_MEM_ADD:
		status = memblock_add(*base, block_bytes);
		if (status < 0)
			return -EINVAL;
		return 0;
	case PSERIES_DRCONF_MEM_REMOVE:
		return pseries_remove_memblock(*base, block_bytes);
	default:
		return -EINVAL;
	}
}

210 211 212
static int pseries_memory_notifier(struct notifier_block *nb,
				unsigned long action, void *node)
{
213
	int err = 0;
214 215 216

	switch (action) {
	case PSERIES_RECONFIG_ADD:
217
		err = pseries_add_memory(node);
218 219
		break;
	case PSERIES_RECONFIG_REMOVE:
220
		err = pseries_remove_memory(node);
221
		break;
222 223
	case PSERIES_DRCONF_MEM_ADD:
	case PSERIES_DRCONF_MEM_REMOVE:
224
		err = pseries_drconf_memory(node, action);
225 226
		break;
	}
227
	return notifier_from_errno(err);
228 229 230 231 232 233 234 235 236 237 238 239 240 241
}

/*
 * Notifier block that routes reconfiguration events to
 * pseries_memory_notifier(); registered from pseries_memory_hotplug_init().
 */
static struct notifier_block pseries_mem_nb = {
	.notifier_call = pseries_memory_notifier,
};

/*
 * Init hook: register the memory reconfiguration notifier when the
 * firmware reports the LPAR feature.  Always returns 0.
 */
static int __init pseries_memory_hotplug_init(void)
{
	if (!firmware_has_feature(FW_FEATURE_LPAR))
		return 0;

	pSeries_reconfig_notifier_register(&pseries_mem_nb);
	return 0;
}
machine_device_initcall(pseries, pseries_memory_hotplug_init);