hotplug-memory.c 6.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12
/*
 * pseries Memory Hotplug infrastructure.
 *
 * Copyright (C) 2008 Badari Pulavarty, IBM Corporation
 *
 *      This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */

#include <linux/of.h>
Y
Yinghai Lu 已提交
13
#include <linux/memblock.h>
14
#include <linux/vmalloc.h>
15 16
#include <linux/memory.h>

17 18
#include <asm/firmware.h>
#include <asm/machdep.h>
19
#include <asm/sparsemem.h>
20

21 22 23
static unsigned long get_memblock_size(void)
{
	struct device_node *np;
24 25
	unsigned int memblock_size = MIN_MEMORY_BLOCK_SIZE;
	struct resource r;
26 27 28

	np = of_find_node_by_path("/ibm,dynamic-reconfiguration-memory");
	if (np) {
29
		const __be64 *size;
30 31

		size = of_get_property(np, "ibm,lmb-size", NULL);
32 33
		if (size)
			memblock_size = be64_to_cpup(size);
34
		of_node_put(np);
35 36
	} else  if (machine_is(pseries)) {
		/* This fallback really only applies to pseries */
37 38 39 40
		unsigned int memzero_size = 0;

		np = of_find_node_by_path("/memory@0");
		if (np) {
41 42
			if (!of_address_to_resource(np, 0, &r))
				memzero_size = resource_size(&r);
43 44 45 46 47 48 49 50 51 52 53 54
			of_node_put(np);
		}

		if (memzero_size) {
			/* We now know the size of memory@0, use this to find
			 * the first memoryblock and get its size.
			 */
			char buf[64];

			sprintf(buf, "/memory@%x", memzero_size);
			np = of_find_node_by_path(buf);
			if (np) {
55 56
				if (!of_address_to_resource(np, 0, &r))
					memblock_size = resource_size(&r);
57 58 59 60 61 62 63
				of_node_put(np);
			}
		}
	}
	return memblock_size;
}

64 65 66 67 68 69
/*
 * WARNING: Whenever pseries is built in, this definition overrides the
 * generic one, regardless of which platform is actually active at boot
 * time. That is acceptable for now because this is the only "option"
 * and it should work everywhere. If that stops being true, this will
 * have to become a ppc_md. callback.
 *
 * Returns the memory block size in bytes as reported by
 * get_memblock_size().
 */
unsigned long memory_block_size_bytes(void)
{
	unsigned long block_bytes = get_memblock_size();

	return block_bytes;
}

75
#ifdef CONFIG_MEMORY_HOTREMOVE
Y
Yinghai Lu 已提交
76
static int pseries_remove_memblock(unsigned long base, unsigned int memblock_size)
77
{
78
	unsigned long start, start_pfn;
79
	struct zone *zone;
80 81 82
	int ret;
	unsigned long section;
	unsigned long sections_to_remove;
83

84
	start_pfn = base >> PAGE_SHIFT;
85 86

	if (!pfn_valid(start_pfn)) {
Y
Yinghai Lu 已提交
87
		memblock_remove(base, memblock_size);
88 89 90
		return 0;
	}

91 92 93 94 95 96 97 98 99 100 101
	zone = page_zone(pfn_to_page(start_pfn));

	/*
	 * Remove section mappings and sysfs entries for the
	 * section of the memory we are removing.
	 *
	 * NOTE: Ideally, this should be done in generic code like
	 * remove_memory(). But remove_memory() gets called by writing
	 * to sysfs "state" file and we can't remove sysfs entries
	 * while writing to it. So we have to defer it to here.
	 */
102
	sections_to_remove = (memblock_size >> PAGE_SHIFT) / PAGES_PER_SECTION;
103 104
	for (section = 0; section < sections_to_remove; section++) {
		unsigned long pfn = start_pfn + section * PAGES_PER_SECTION;
105
		ret = __remove_pages(zone, pfn, PAGES_PER_SECTION);
106 107 108
		if (ret)
			return ret;
	}
109

110 111 112
	/*
	 * Update memory regions for memory remove
	 */
Y
Yinghai Lu 已提交
113
	memblock_remove(base, memblock_size);
114

115 116 117
	/*
	 * Remove htab bolted mappings for this section of memory
	 */
118
	start = (unsigned long)__va(base);
Y
Yinghai Lu 已提交
119
	ret = remove_section_mapping(start, start + memblock_size);
120 121 122 123 124 125

	/* Ensure all vmalloc mappings are flushed in case they also
	 * hit that section of memory
	 */
	vm_unmap_aliases();

126 127 128
	return ret;
}

129 130 131 132 133
static int pseries_remove_memory(struct device_node *np)
{
	const char *type;
	const unsigned int *regs;
	unsigned long base;
134
	unsigned int lmb_size;
135 136 137 138 139 140 141 142 143 144
	int ret = -EINVAL;

	/*
	 * Check to see if we are actually removing memory
	 */
	type = of_get_property(np, "device_type", NULL);
	if (type == NULL || strcmp(type, "memory") != 0)
		return 0;

	/*
Y
Yinghai Lu 已提交
145
	 * Find the bae address and size of the memblock
146 147 148 149 150 151
	 */
	regs = of_get_property(np, "reg", NULL);
	if (!regs)
		return ret;

	base = *(unsigned long *)regs;
152
	lmb_size = regs[3];
153

154
	ret = pseries_remove_memblock(base, lmb_size);
155 156
	return ret;
}
157 158 159 160 161 162 163 164 165 166 167
#else
/*
 * Stub used when CONFIG_MEMORY_HOTREMOVE is not set: removing a memory
 * block is not supported, so always report -EOPNOTSUPP.
 */
static inline int pseries_remove_memblock(unsigned long base,
					  unsigned int memblock_size)
{
	return -EOPNOTSUPP;
}
/*
 * Stub used when CONFIG_MEMORY_HOTREMOVE is not set: detaching a memory
 * node cannot remove memory, so always report -EOPNOTSUPP.
 */
static inline int pseries_remove_memory(struct device_node *np)
{
	return -EOPNOTSUPP;
}
#endif /* CONFIG_MEMORY_HOTREMOVE */
168

169 170 171 172
static int pseries_add_memory(struct device_node *np)
{
	const char *type;
	const unsigned int *regs;
173
	unsigned long base;
174
	unsigned int lmb_size;
175 176 177 178 179 180 181 182 183 184
	int ret = -EINVAL;

	/*
	 * Check to see if we are actually adding memory
	 */
	type = of_get_property(np, "device_type", NULL);
	if (type == NULL || strcmp(type, "memory") != 0)
		return 0;

	/*
Y
Yinghai Lu 已提交
185
	 * Find the base and size of the memblock
186 187 188 189 190
	 */
	regs = of_get_property(np, "reg", NULL);
	if (!regs)
		return ret;

191
	base = *(unsigned long *)regs;
192
	lmb_size = regs[3];
193 194 195 196

	/*
	 * Update memory region to represent the memory add
	 */
197
	ret = memblock_add(base, lmb_size);
198 199 200
	return (ret < 0) ? -EINVAL : 0;
}

201
static int pseries_update_drconf_memory(struct of_prop_reconfig *pr)
202
{
203
	struct of_drconf_cell *new_drmem, *old_drmem;
204
	unsigned long memblock_size;
205 206 207
	u32 entries;
	u32 *p;
	int i, rc = -EINVAL;
208

209 210
	memblock_size = get_memblock_size();
	if (!memblock_size)
211 212
		return -EINVAL;

213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241
	p = (u32 *)of_get_property(pr->dn, "ibm,dynamic-memory", NULL);
	if (!p)
		return -EINVAL;

	/* The first int of the property is the number of lmb's described
	 * by the property. This is followed by an array of of_drconf_cell
	 * entries. Get the niumber of entries and skip to the array of
	 * of_drconf_cell's.
	 */
	entries = *p++;
	old_drmem = (struct of_drconf_cell *)p;

	p = (u32 *)pr->prop->value;
	p++;
	new_drmem = (struct of_drconf_cell *)p;

	for (i = 0; i < entries; i++) {
		if ((old_drmem[i].flags & DRCONF_MEM_ASSIGNED) &&
		    (!(new_drmem[i].flags & DRCONF_MEM_ASSIGNED))) {
			rc = pseries_remove_memblock(old_drmem[i].base_addr,
						     memblock_size);
			break;
		} else if ((!(old_drmem[i].flags & DRCONF_MEM_ASSIGNED)) &&
			   (new_drmem[i].flags & DRCONF_MEM_ASSIGNED)) {
			rc = memblock_add(old_drmem[i].base_addr,
					  memblock_size);
			rc = (rc < 0) ? -EINVAL : 0;
			break;
		}
242 243 244
	}

	return rc;
245 246
}

247
static int pseries_memory_notifier(struct notifier_block *nb,
248
				   unsigned long action, void *node)
249
{
250
	struct of_prop_reconfig *pr;
251
	int err = 0;
252 253

	switch (action) {
254
	case OF_RECONFIG_ATTACH_NODE:
255
		err = pseries_add_memory(node);
256
		break;
257
	case OF_RECONFIG_DETACH_NODE:
258
		err = pseries_remove_memory(node);
259
		break;
260 261 262 263
	case OF_RECONFIG_UPDATE_PROPERTY:
		pr = (struct of_prop_reconfig *)node;
		if (!strcmp(pr->prop->name, "ibm,dynamic-memory"))
			err = pseries_update_drconf_memory(pr);
264 265
		break;
	}
266
	return notifier_from_errno(err);
267 268 269 270 271 272 273 274 275
}

/*
 * Notifier block whose callback is pseries_memory_notifier(); it is
 * registered from pseries_memory_hotplug_init().
 */
static struct notifier_block pseries_mem_nb = {
	.notifier_call = pseries_memory_notifier,
};

/*
 * Initcall: register the memory reconfiguration notifier, but only when
 * the firmware reports the LPAR feature.  Always returns 0; the result of
 * the registration itself is not checked.
 */
static int __init pseries_memory_hotplug_init(void)
{
	if (!firmware_has_feature(FW_FEATURE_LPAR))
		return 0;

	of_reconfig_notifier_register(&pseries_mem_nb);
	return 0;
}
machine_device_initcall(pseries, pseries_memory_hotplug_init);