context.c 8.7 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0-or-later
2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright 2014 IBM Corp.
 */

#include <linux/module.h>
#include <linux/kernel.h>
#include <linux/bitmap.h>
#include <linux/sched.h>
#include <linux/pid.h>
#include <linux/fs.h>
#include <linux/mm.h>
#include <linux/debugfs.h>
#include <linux/slab.h>
#include <linux/idr.h>
16
#include <linux/sched/mm.h>
17
#include <linux/mmu_context.h>
18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34
#include <asm/cputable.h>
#include <asm/current.h>
#include <asm/copro.h>

#include "cxl.h"

/*
 * Allocates space for a CXL context.
 */
struct cxl_context *cxl_context_alloc(void)
{
	return kzalloc(sizeof(struct cxl_context), GFP_KERNEL);
}

/*
 * Initialises a CXL context.
 */
35
int cxl_context_init(struct cxl_context *ctx, struct cxl_afu *afu, bool master)
36 37 38 39 40
{
	int i;

	ctx->afu = afu;
	ctx->master = master;
41
	ctx->pid = NULL; /* Set in start work ioctl */
42
	mutex_init(&ctx->mapping_lock);
43
	ctx->mapping = NULL;
44 45
	ctx->tidr = 0;
	ctx->assign_tidr = false;
46

47
	if (cxl_is_power8()) {
48 49 50 51 52 53 54
		spin_lock_init(&ctx->sste_lock);

		/*
		 * Allocate the segment table before we put it in the IDR so that we
		 * can always access it when dereferenced from IDR. For the same
		 * reason, the segment table is only destroyed after the context is
		 * removed from the IDR.  Access to this in the IOCTL is protected by
B
Bhaskar Chowdhury 已提交
55
		 * Linux filesystem semantics (can't IOCTL until open is complete).
56 57 58 59 60
		 */
		i = cxl_alloc_sst(ctx);
		if (i)
			return i;
	}
61 62 63 64 65 66 67 68 69 70 71

	INIT_WORK(&ctx->fault_work, cxl_handle_fault);

	init_waitqueue_head(&ctx->wq);
	spin_lock_init(&ctx->lock);

	ctx->irq_bitmap = NULL;
	ctx->pending_irq = false;
	ctx->pending_fault = false;
	ctx->pending_afu_err = false;

72 73
	INIT_LIST_HEAD(&ctx->irq_names);

74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91
	/*
	 * When we have to destroy all contexts in cxl_context_detach_all() we
	 * end up with afu_release_irqs() called from inside a
	 * idr_for_each_entry(). Hence we need to make sure that anything
	 * dereferenced from this IDR is ok before we allocate the IDR here.
	 * This clears out the IRQ ranges to ensure this.
	 */
	for (i = 0; i < CXL_IRQ_RANGES; i++)
		ctx->irqs.range[i] = 0;

	mutex_init(&ctx->status_mutex);

	ctx->status = OPENED;

	/*
	 * Allocating IDR! We better make sure everything's setup that
	 * dereferences from it.
	 */
92
	mutex_lock(&afu->contexts_lock);
93
	idr_preload(GFP_KERNEL);
94
	i = idr_alloc(&ctx->afu->contexts_idr, ctx, 0,
95 96
		      ctx->afu->num_procs, GFP_NOWAIT);
	idr_preload_end();
97
	mutex_unlock(&afu->contexts_lock);
98 99 100 101
	if (i < 0)
		return i;

	ctx->pe = i;
102
	if (cpu_has_feature(CPU_FTR_HVMODE)) {
103
		ctx->elem = &ctx->afu->native->spa[i];
104 105 106 107
		ctx->external_pe = ctx->pe;
	} else {
		ctx->external_pe = -1; /* assigned when attaching */
	}
108
	ctx->pe_inserted = false;
109 110 111 112 113 114

	/*
	 * take a ref on the afu so that it stays alive at-least till
	 * this context is reclaimed inside reclaim_ctx.
	 */
	cxl_afu_get(afu);
115 116 117
	return 0;
}

118 119 120 121 122 123 124 125
void cxl_context_set_mapping(struct cxl_context *ctx,
			struct address_space *mapping)
{
	mutex_lock(&ctx->mapping_lock);
	ctx->mapping = mapping;
	mutex_unlock(&ctx->mapping_lock);
}

126
static vm_fault_t cxl_mmap_fault(struct vm_fault *vmf)
127
{
128
	struct vm_area_struct *vma = vmf->vma;
129 130
	struct cxl_context *ctx = vma->vm_file->private_data;
	u64 area, offset;
131
	vm_fault_t ret;
132 133 134 135

	offset = vmf->pgoff << PAGE_SHIFT;

	pr_devel("%s: pe: %i address: 0x%lx offset: 0x%llx\n",
136
			__func__, ctx->pe, vmf->address, offset);
137 138 139

	if (ctx->afu->current_mode == CXL_MODE_DEDICATED) {
		area = ctx->afu->psn_phys;
140
		if (offset >= ctx->afu->adapter->ps_size)
141 142 143
			return VM_FAULT_SIGBUS;
	} else {
		area = ctx->psn_phys;
144
		if (offset >= ctx->psn_size)
145 146 147 148 149 150 151 152
			return VM_FAULT_SIGBUS;
	}

	mutex_lock(&ctx->status_mutex);

	if (ctx->status != STARTED) {
		mutex_unlock(&ctx->status_mutex);
		pr_devel("%s: Context not started, failing problem state access\n", __func__);
153 154 155 156 157 158 159 160 161 162 163 164
		if (ctx->mmio_err_ff) {
			if (!ctx->ff_page) {
				ctx->ff_page = alloc_page(GFP_USER);
				if (!ctx->ff_page)
					return VM_FAULT_OOM;
				memset(page_address(ctx->ff_page), 0xff, PAGE_SIZE);
			}
			get_page(ctx->ff_page);
			vmf->page = ctx->ff_page;
			vma->vm_page_prot = pgprot_cached(vma->vm_page_prot);
			return 0;
		}
165 166 167
		return VM_FAULT_SIGBUS;
	}

168
	ret = vmf_insert_pfn(vma, vmf->address, (area + offset) >> PAGE_SHIFT);
169 170 171

	mutex_unlock(&ctx->status_mutex);

172
	return ret;
173 174 175 176 177 178
}

static const struct vm_operations_struct cxl_mmap_vmops = {
	.fault = cxl_mmap_fault,
};

179 180 181 182 183
/*
 * Map a per-context mmio space into the given vma.
 */
int cxl_context_iomap(struct cxl_context *ctx, struct vm_area_struct *vma)
{
184
	u64 start = vma->vm_pgoff << PAGE_SHIFT;
185
	u64 len = vma->vm_end - vma->vm_start;
186 187 188 189

	if (ctx->afu->current_mode == CXL_MODE_DEDICATED) {
		if (start + len > ctx->afu->adapter->ps_size)
			return -EINVAL;
C
Christophe Lombard 已提交
190

191
		if (cxl_is_power9()) {
C
Christophe Lombard 已提交
192 193 194 195 196 197 198 199 200 201 202 203 204
			/*
			 * Make sure there is a valid problem state
			 * area space for this AFU.
			 */
			if (ctx->master && !ctx->afu->psa) {
				pr_devel("AFU doesn't support mmio space\n");
				return -EINVAL;
			}

			/* Can't mmap until the AFU is enabled */
			if (!ctx->afu->enabled)
				return -EBUSY;
		}
205 206 207
	} else {
		if (start + len > ctx->psn_size)
			return -EINVAL;
208

C
Christophe Lombard 已提交
209
		/* Make sure there is a valid per process space for this AFU */
210 211 212 213
		if ((ctx->master && !ctx->afu->psa) || (!ctx->afu->pp_psa)) {
			pr_devel("AFU doesn't support mmio space\n");
			return -EINVAL;
		}
214

215 216 217
		/* Can't mmap until the AFU is enabled */
		if (!ctx->afu->enabled)
			return -EBUSY;
218 219 220 221 222
	}

	pr_devel("%s: mmio physical: %llx pe: %i master:%i\n", __func__,
		 ctx->psn_phys, ctx->pe , ctx->master);

223
	vma->vm_flags |= VM_IO | VM_PFNMAP;
224
	vma->vm_page_prot = pgprot_noncached(vma->vm_page_prot);
225 226
	vma->vm_ops = &cxl_mmap_vmops;
	return 0;
227 228 229 230 231 232 233
}

/*
 * Detach a context from the hardware. This disables interrupts and doesn't
 * return until all outstanding interrupts for this context have completed. The
 * hardware should no longer access *ctx after this has returned.
 */
234
int __detach_context(struct cxl_context *ctx)
235 236 237 238 239 240 241 242
{
	enum cxl_context_status status;

	mutex_lock(&ctx->status_mutex);
	status = ctx->status;
	ctx->status = CLOSED;
	mutex_unlock(&ctx->status_mutex);
	if (status != STARTED)
243
		return -EBUSY;
244

245 246 247
	/* Only warn if we detached while the link was OK.
	 * If detach fails when hw is down, we don't care.
	 */
248
	WARN_ON(cxl_ops->detach_process(ctx) &&
249
		cxl_ops->link_ok(ctx->afu->adapter, ctx->afu));
M
Michael Neuling 已提交
250
	flush_work(&ctx->fault_work); /* Only needed for dedicated process */
251

252 253 254 255 256 257 258
	/*
	 * Wait until no further interrupts are presented by the PSL
	 * for this context.
	 */
	if (cxl_ops->irq_wait)
		cxl_ops->irq_wait(ctx);

259
	/* release the reference to the group leader and mm handling pid */
M
Michael Neuling 已提交
260
	put_pid(ctx->pid);
261

M
Michael Neuling 已提交
262
	cxl_ctx_put();
263 264 265

	/* Decrease the attached context count on the adapter */
	cxl_adapter_context_put(ctx->afu->adapter);
266 267 268

	/* Decrease the mm count on the context */
	cxl_context_mm_count_put(ctx);
269 270
	if (ctx->mm)
		mm_context_remove_copro(ctx->mm);
271 272
	ctx->mm = NULL;

273
	return 0;
274 275 276 277 278 279 280 281 282 283
}

/*
 * Detach the given context from the AFU. This doesn't actually
 * free the context but it should stop the context running in hardware
 * (ie. prevent this context from generating any further interrupts
 * so that it can be freed).
 */
void cxl_context_detach(struct cxl_context *ctx)
{
284 285 286 287 288 289 290 291
	int rc;

	rc = __detach_context(ctx);
	if (rc)
		return;

	afu_release_irqs(ctx, ctx);
	wake_up_all(&ctx->wq);
292 293 294 295 296 297 298 299 300 301
}

/*
 * Detach all contexts on the given AFU.
 */
void cxl_context_detach_all(struct cxl_afu *afu)
{
	struct cxl_context *ctx;
	int tmp;

302 303
	mutex_lock(&afu->contexts_lock);
	idr_for_each_entry(&afu->contexts_idr, ctx, tmp) {
304 305 306 307
		/*
		 * Anything done in here needs to be setup before the IDR is
		 * created and torn down after the IDR removed
		 */
308
		cxl_context_detach(ctx);
309 310 311 312 313 314 315 316 317 318 319

		/*
		 * We are force detaching - remove any active PSA mappings so
		 * userspace cannot interfere with the card if it comes back.
		 * Easiest way to exercise this is to unbind and rebind the
		 * driver via sysfs while it is in use.
		 */
		mutex_lock(&ctx->mapping_lock);
		if (ctx->mapping)
			unmap_mapping_range(ctx->mapping, 0, 0, 1);
		mutex_unlock(&ctx->mapping_lock);
320 321
	}
	mutex_unlock(&afu->contexts_lock);
322 323
}

324
static void reclaim_ctx(struct rcu_head *rcu)
325
{
326
	struct cxl_context *ctx = container_of(rcu, struct cxl_context, rcu);
327

328
	if (cxl_is_power8())
329
		free_page((u64)ctx->sstp);
330 331
	if (ctx->ff_page)
		__free_page(ctx->ff_page);
332 333
	ctx->sstp = NULL;

334
	kfree(ctx->irq_bitmap);
335

336 337 338
	/* Drop ref to the afu device taken during cxl_context_init */
	cxl_afu_put(ctx->afu);

339 340
	kfree(ctx);
}
341 342 343

void cxl_context_free(struct cxl_context *ctx)
{
344 345
	if (ctx->kernelapi && ctx->mapping)
		cxl_release_mapping(ctx);
346 347 348 349 350
	mutex_lock(&ctx->afu->contexts_lock);
	idr_remove(&ctx->afu->contexts_idr, ctx->pe);
	mutex_unlock(&ctx->afu->contexts_lock);
	call_rcu(&ctx->rcu, reclaim_ctx);
}
351 352 353 354

void cxl_context_mm_count_get(struct cxl_context *ctx)
{
	if (ctx->mm)
J
Julia Lawall 已提交
355
		mmgrab(ctx->mm);
356 357 358 359 360 361 362
}

void cxl_context_mm_count_put(struct cxl_context *ctx)
{
	if (ctx->mm)
		mmdrop(ctx->mm);
}