kfd_device_queue_manager.h 8.4 KB
Newer Older
B
Ben Goz 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * Copyright 2014 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#ifndef KFD_DEVICE_QUEUE_MANAGER_H_
#define KFD_DEVICE_QUEUE_MANAGER_H_

#include <linux/rwsem.h>
#include <linux/list.h>
29 30
#include <linux/mutex.h>
#include <linux/sched/mm.h>
B
Ben Goz 已提交
31 32 33
#include "kfd_priv.h"
#include "kfd_mqd_manager.h"

34 35
#define KFD_UNMAP_LATENCY_MS			(4000)
#define QUEUE_PREEMPT_DEFAULT_TIMEOUT_MS (2 * KFD_UNMAP_LATENCY_MS + 1000)
B
Ben Goz 已提交
36 37 38 39 40 41

struct device_process_node {
	struct qcm_process_device *qpd;
	struct list_head list;
};

42
/**
43
 * struct device_queue_manager_ops
44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77
 *
 * @create_queue: Queue creation routine.
 *
 * @destroy_queue: Queue destruction routine.
 *
 * @update_queue: Queue update routine.
 *
 * @get_mqd_manager: Returns the mqd manager according to the mqd type.
 *
 * @exeute_queues: Dispatches the queues list to the H/W.
 *
 * @register_process: This routine associates a specific process with device.
 *
 * @unregister_process: destroys the associations between process to device.
 *
 * @initialize: Initializes the pipelines and memory module for that device.
 *
 * @start: Initializes the resources/modules the the device needs for queues
 * execution. This function is called on device initialization and after the
 * system woke up after suspension.
 *
 * @stop: This routine stops execution of all the active queue running on the
 * H/W and basically this function called on system suspend.
 *
 * @uninitialize: Destroys all the device queue manager resources allocated in
 * initialize routine.
 *
 * @create_kernel_queue: Creates kernel queue. Used for debug queue.
 *
 * @destroy_kernel_queue: Destroys kernel queue. Used for debug queue.
 *
 * @set_cache_memory_policy: Sets memory policy (cached/ non cached) for the
 * memory apertures.
 *
78 79
 * @process_termination: Clears all process queues belongs to that device.
 *
80 81 82 83
 * @evict_process_queues: Evict all active queues of a process
 *
 * @restore_process_queues: Restore all evicted queues queues of a process
 *
84 85
 * @get_wave_state: Retrieves context save state and optionally copies the
 * control stack, if kept in the MQD, to the given userspace address.
86 87
 */

88
struct device_queue_manager_ops {
B
Ben Goz 已提交
89 90
	int	(*create_queue)(struct device_queue_manager *dqm,
				struct queue *q,
91
				struct qcm_process_device *qpd);
92

B
Ben Goz 已提交
93 94 95
	int	(*destroy_queue)(struct device_queue_manager *dqm,
				struct qcm_process_device *qpd,
				struct queue *q);
96

B
Ben Goz 已提交
97 98
	int	(*update_queue)(struct device_queue_manager *dqm,
				struct queue *q);
99 100 101

	struct mqd_manager * (*get_mqd_manager)
					(struct device_queue_manager *dqm,
B
Ben Goz 已提交
102 103 104 105
					enum KFD_MQD_TYPE type);

	int	(*register_process)(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
106

B
Ben Goz 已提交
107 108
	int	(*unregister_process)(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
109

B
Ben Goz 已提交
110 111 112 113 114 115 116
	int	(*initialize)(struct device_queue_manager *dqm);
	int	(*start)(struct device_queue_manager *dqm);
	int	(*stop)(struct device_queue_manager *dqm);
	void	(*uninitialize)(struct device_queue_manager *dqm);
	int	(*create_kernel_queue)(struct device_queue_manager *dqm,
					struct kernel_queue *kq,
					struct qcm_process_device *qpd);
117

B
Ben Goz 已提交
118 119 120
	void	(*destroy_kernel_queue)(struct device_queue_manager *dqm,
					struct kernel_queue *kq,
					struct qcm_process_device *qpd);
121

B
Ben Goz 已提交
122 123 124 125 126 127
	bool	(*set_cache_memory_policy)(struct device_queue_manager *dqm,
					   struct qcm_process_device *qpd,
					   enum cache_policy default_policy,
					   enum cache_policy alternate_policy,
					   void __user *alternate_aperture_base,
					   uint64_t alternate_aperture_size);
128

129 130 131 132 133
	int	(*set_trap_handler)(struct device_queue_manager *dqm,
				    struct qcm_process_device *qpd,
				    uint64_t tba_addr,
				    uint64_t tma_addr);

134 135
	int (*process_termination)(struct device_queue_manager *dqm,
			struct qcm_process_device *qpd);
136 137 138 139 140

	int (*evict_process_queues)(struct device_queue_manager *dqm,
				    struct qcm_process_device *qpd);
	int (*restore_process_queues)(struct device_queue_manager *dqm,
				      struct qcm_process_device *qpd);
141 142 143 144 145 146

	int	(*get_wave_state)(struct device_queue_manager *dqm,
				  struct queue *q,
				  void __user *ctl_stack,
				  u32 *ctl_stack_used_size,
				  u32 *save_area_used_size);
147 148
};

149
struct device_queue_manager_asic_ops {
150
	int	(*update_qpd)(struct device_queue_manager *dqm,
151 152 153 154 155 156 157
					struct qcm_process_device *qpd);
	bool	(*set_cache_memory_policy)(struct device_queue_manager *dqm,
					   struct qcm_process_device *qpd,
					   enum cache_policy default_policy,
					   enum cache_policy alternate_policy,
					   void __user *alternate_aperture_base,
					   uint64_t alternate_aperture_size);
158 159 160
	void	(*init_sdma_vm)(struct device_queue_manager *dqm,
				struct queue *q,
				struct qcm_process_device *qpd);
161 162
};

163 164 165 166 167 168 169 170 171 172 173
/**
 * struct device_queue_manager
 *
 * This struct is a base class for the kfd queues scheduler in the
 * device level. The device base class should expose the basic operations
 * for queue creation and queue destruction. This base class hides the
 * scheduling mode of the driver and the specific implementation of the
 * concrete device. This class is the only class in the queues scheduler
 * that configures the H/W.
 *
 */
B
Ben Goz 已提交
174

175 176
struct device_queue_manager {
	struct device_queue_manager_ops ops;
177
	struct device_queue_manager_asic_ops asic_ops;
B
Ben Goz 已提交
178

179
	struct mqd_manager	*mqd_mgrs[KFD_MQD_TYPE_MAX];
B
Ben Goz 已提交
180 181
	struct packet_manager	packets;
	struct kfd_dev		*dev;
182
	struct mutex		lock_hidden; /* use dqm_lock/unlock(dqm) */
B
Ben Goz 已提交
183
	struct list_head	queues;
184
	unsigned int		saved_flags;
B
Ben Goz 已提交
185 186
	unsigned int		processes_count;
	unsigned int		queue_count;
187
	unsigned int		sdma_queue_count;
188
	unsigned int		total_queue_count;
B
Ben Goz 已提交
189 190
	unsigned int		next_pipe_to_allocate;
	unsigned int		*allocated_queues;
191
	unsigned int		sdma_bitmap;
B
Ben Goz 已提交
192 193 194 195 196 197 198
	unsigned int		vmid_bitmap;
	uint64_t		pipelines_addr;
	struct kfd_mem_obj	*pipeline_mem;
	uint64_t		fence_gpu_addr;
	unsigned int		*fence_addr;
	struct kfd_mem_obj	*fence_mem;
	bool			active_runlist;
199
	int			sched_policy;
200 201 202 203

	/* hw exception  */
	bool			is_hws_hang;
	struct work_struct	hw_exception_work;
B
Ben Goz 已提交
204 205
};

206 207
void device_queue_manager_init_cik(
		struct device_queue_manager_asic_ops *asic_ops);
208 209
void device_queue_manager_init_cik_hawaii(
		struct device_queue_manager_asic_ops *asic_ops);
210 211
void device_queue_manager_init_vi(
		struct device_queue_manager_asic_ops *asic_ops);
212 213
void device_queue_manager_init_vi_tonga(
		struct device_queue_manager_asic_ops *asic_ops);
214 215
void device_queue_manager_init_v9(
		struct device_queue_manager_asic_ops *asic_ops);
216 217
void program_sh_mem_settings(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
218 219 220
unsigned int get_queues_num(struct device_queue_manager *dqm);
unsigned int get_queues_per_pipe(struct device_queue_manager *dqm);
unsigned int get_pipes_per_mec(struct device_queue_manager *dqm);
221
unsigned int get_num_sdma_queues(struct device_queue_manager *dqm);
O
Oded Gabbay 已提交
222

223
static inline unsigned int get_sh_mem_bases_32(struct kfd_process_device *pdd)
O
Oded Gabbay 已提交
224 225 226 227
{
	return (pdd->lds_base >> 16) & 0xFF;
}

228
static inline unsigned int
O
Oded Gabbay 已提交
229 230 231 232 233
get_sh_mem_bases_nybble_64(struct kfd_process_device *pdd)
{
	return (pdd->lds_base >> 60) & 0x0E;
}

234 235 236 237 238 239 240 241 242 243 244 245 246 247 248
/* The DQM lock can be taken in MMU notifiers. Make sure no reclaim-FS
 * happens while holding this lock anywhere to prevent deadlocks when
 * an MMU notifier runs in reclaim-FS context.
 */
static inline void dqm_lock(struct device_queue_manager *dqm)
{
	mutex_lock(&dqm->lock_hidden);
	dqm->saved_flags = memalloc_nofs_save();
}
static inline void dqm_unlock(struct device_queue_manager *dqm)
{
	memalloc_nofs_restore(dqm->saved_flags);
	mutex_unlock(&dqm->lock_hidden);
}

B
Ben Goz 已提交
249
#endif /* KFD_DEVICE_QUEUE_MANAGER_H_ */