kfd_device_queue_manager.h 8.5 KB
Newer Older
B
Ben Goz 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * Copyright 2014 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#ifndef KFD_DEVICE_QUEUE_MANAGER_H_
#define KFD_DEVICE_QUEUE_MANAGER_H_

#include <linux/rwsem.h>
#include <linux/list.h>
29 30
#include <linux/mutex.h>
#include <linux/sched/mm.h>
B
Ben Goz 已提交
31 32 33 34 35 36 37 38 39
#include "kfd_priv.h"
#include "kfd_mqd_manager.h"


struct device_process_node {
	struct qcm_process_device *qpd;
	struct list_head list;
};

40
/**
41
 * struct device_queue_manager_ops
42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73
 *
 * @create_queue: Queue creation routine.
 *
 * @destroy_queue: Queue destruction routine.
 *
 * @update_queue: Queue update routine.
 *
 * @exeute_queues: Dispatches the queues list to the H/W.
 *
 * @register_process: This routine associates a specific process with device.
 *
 * @unregister_process: destroys the associations between process to device.
 *
 * @initialize: Initializes the pipelines and memory module for that device.
 *
 * @start: Initializes the resources/modules the the device needs for queues
 * execution. This function is called on device initialization and after the
 * system woke up after suspension.
 *
 * @stop: This routine stops execution of all the active queue running on the
 * H/W and basically this function called on system suspend.
 *
 * @uninitialize: Destroys all the device queue manager resources allocated in
 * initialize routine.
 *
 * @create_kernel_queue: Creates kernel queue. Used for debug queue.
 *
 * @destroy_kernel_queue: Destroys kernel queue. Used for debug queue.
 *
 * @set_cache_memory_policy: Sets memory policy (cached/ non cached) for the
 * memory apertures.
 *
74 75
 * @process_termination: Clears all process queues belongs to that device.
 *
76 77 78 79
 * @evict_process_queues: Evict all active queues of a process
 *
 * @restore_process_queues: Restore all evicted queues queues of a process
 *
80 81
 * @get_wave_state: Retrieves context save state and optionally copies the
 * control stack, if kept in the MQD, to the given userspace address.
82 83
 */

84
struct device_queue_manager_ops {
B
Ben Goz 已提交
85 86
	int	(*create_queue)(struct device_queue_manager *dqm,
				struct queue *q,
87
				struct qcm_process_device *qpd);
88

B
Ben Goz 已提交
89 90 91
	int	(*destroy_queue)(struct device_queue_manager *dqm,
				struct qcm_process_device *qpd,
				struct queue *q);
92

B
Ben Goz 已提交
93 94
	int	(*update_queue)(struct device_queue_manager *dqm,
				struct queue *q);
95

B
Ben Goz 已提交
96 97
	int	(*register_process)(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
98

B
Ben Goz 已提交
99 100
	int	(*unregister_process)(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
101

B
Ben Goz 已提交
102 103 104 105 106 107 108
	int	(*initialize)(struct device_queue_manager *dqm);
	int	(*start)(struct device_queue_manager *dqm);
	int	(*stop)(struct device_queue_manager *dqm);
	void	(*uninitialize)(struct device_queue_manager *dqm);
	int	(*create_kernel_queue)(struct device_queue_manager *dqm,
					struct kernel_queue *kq,
					struct qcm_process_device *qpd);
109

B
Ben Goz 已提交
110 111 112
	void	(*destroy_kernel_queue)(struct device_queue_manager *dqm,
					struct kernel_queue *kq,
					struct qcm_process_device *qpd);
113

B
Ben Goz 已提交
114 115 116 117 118 119
	bool	(*set_cache_memory_policy)(struct device_queue_manager *dqm,
					   struct qcm_process_device *qpd,
					   enum cache_policy default_policy,
					   enum cache_policy alternate_policy,
					   void __user *alternate_aperture_base,
					   uint64_t alternate_aperture_size);
120

121 122 123 124 125
	int	(*set_trap_handler)(struct device_queue_manager *dqm,
				    struct qcm_process_device *qpd,
				    uint64_t tba_addr,
				    uint64_t tma_addr);

126 127
	int (*process_termination)(struct device_queue_manager *dqm,
			struct qcm_process_device *qpd);
128 129 130 131 132

	int (*evict_process_queues)(struct device_queue_manager *dqm,
				    struct qcm_process_device *qpd);
	int (*restore_process_queues)(struct device_queue_manager *dqm,
				      struct qcm_process_device *qpd);
133 134 135 136 137 138

	int	(*get_wave_state)(struct device_queue_manager *dqm,
				  struct queue *q,
				  void __user *ctl_stack,
				  u32 *ctl_stack_used_size,
				  u32 *save_area_used_size);
139 140
};

141
struct device_queue_manager_asic_ops {
142
	int	(*update_qpd)(struct device_queue_manager *dqm,
143 144 145 146 147 148 149
					struct qcm_process_device *qpd);
	bool	(*set_cache_memory_policy)(struct device_queue_manager *dqm,
					   struct qcm_process_device *qpd,
					   enum cache_policy default_policy,
					   enum cache_policy alternate_policy,
					   void __user *alternate_aperture_base,
					   uint64_t alternate_aperture_size);
150 151 152
	void	(*init_sdma_vm)(struct device_queue_manager *dqm,
				struct queue *q,
				struct qcm_process_device *qpd);
153 154
	struct mqd_manager *	(*mqd_manager_init)(enum KFD_MQD_TYPE type,
				 struct kfd_dev *dev);
155 156
};

157 158 159 160 161 162 163 164 165 166 167
/**
 * struct device_queue_manager
 *
 * This struct is a base class for the kfd queues scheduler in the
 * device level. The device base class should expose the basic operations
 * for queue creation and queue destruction. This base class hides the
 * scheduling mode of the driver and the specific implementation of the
 * concrete device. This class is the only class in the queues scheduler
 * that configures the H/W.
 *
 */
B
Ben Goz 已提交
168

169 170
struct device_queue_manager {
	struct device_queue_manager_ops ops;
171
	struct device_queue_manager_asic_ops asic_ops;
B
Ben Goz 已提交
172

173
	struct mqd_manager	*mqd_mgrs[KFD_MQD_TYPE_MAX];
B
Ben Goz 已提交
174 175
	struct packet_manager	packets;
	struct kfd_dev		*dev;
176
	struct mutex		lock_hidden; /* use dqm_lock/unlock(dqm) */
B
Ben Goz 已提交
177
	struct list_head	queues;
178
	unsigned int		saved_flags;
B
Ben Goz 已提交
179 180
	unsigned int		processes_count;
	unsigned int		queue_count;
181
	unsigned int		sdma_queue_count;
182
	unsigned int		xgmi_sdma_queue_count;
183
	unsigned int		total_queue_count;
B
Ben Goz 已提交
184 185
	unsigned int		next_pipe_to_allocate;
	unsigned int		*allocated_queues;
O
Oak Zeng 已提交
186
	uint64_t		sdma_bitmap;
187
	uint64_t		xgmi_sdma_bitmap;
B
Ben Goz 已提交
188 189 190 191 192 193 194
	unsigned int		vmid_bitmap;
	uint64_t		pipelines_addr;
	struct kfd_mem_obj	*pipeline_mem;
	uint64_t		fence_gpu_addr;
	unsigned int		*fence_addr;
	struct kfd_mem_obj	*fence_mem;
	bool			active_runlist;
195
	int			sched_policy;
196 197 198 199

	/* hw exception  */
	bool			is_hws_hang;
	struct work_struct	hw_exception_work;
200
	struct kfd_mem_obj	hiq_sdma_mqd;
B
Ben Goz 已提交
201 202
};

203 204
void device_queue_manager_init_cik(
		struct device_queue_manager_asic_ops *asic_ops);
205 206
void device_queue_manager_init_cik_hawaii(
		struct device_queue_manager_asic_ops *asic_ops);
207 208
void device_queue_manager_init_vi(
		struct device_queue_manager_asic_ops *asic_ops);
209 210
void device_queue_manager_init_vi_tonga(
		struct device_queue_manager_asic_ops *asic_ops);
211 212
void device_queue_manager_init_v9(
		struct device_queue_manager_asic_ops *asic_ops);
213 214
void device_queue_manager_init_v10_navi10(
		struct device_queue_manager_asic_ops *asic_ops);
215 216
void program_sh_mem_settings(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
217 218 219
unsigned int get_queues_num(struct device_queue_manager *dqm);
unsigned int get_queues_per_pipe(struct device_queue_manager *dqm);
unsigned int get_pipes_per_mec(struct device_queue_manager *dqm);
220
unsigned int get_num_sdma_queues(struct device_queue_manager *dqm);
221
unsigned int get_num_xgmi_sdma_queues(struct device_queue_manager *dqm);
O
Oded Gabbay 已提交
222

223
static inline unsigned int get_sh_mem_bases_32(struct kfd_process_device *pdd)
O
Oded Gabbay 已提交
224 225 226 227
{
	return (pdd->lds_base >> 16) & 0xFF;
}

228
static inline unsigned int
O
Oded Gabbay 已提交
229 230 231 232 233
get_sh_mem_bases_nybble_64(struct kfd_process_device *pdd)
{
	return (pdd->lds_base >> 60) & 0x0E;
}

234 235 236 237 238 239 240 241 242 243 244 245 246 247 248
/* The DQM lock can be taken in MMU notifiers. Make sure no reclaim-FS
 * happens while holding this lock anywhere to prevent deadlocks when
 * an MMU notifier runs in reclaim-FS context.
 */
static inline void dqm_lock(struct device_queue_manager *dqm)
{
	mutex_lock(&dqm->lock_hidden);
	dqm->saved_flags = memalloc_nofs_save();
}
static inline void dqm_unlock(struct device_queue_manager *dqm)
{
	memalloc_nofs_restore(dqm->saved_flags);
	mutex_unlock(&dqm->lock_hidden);
}

B
Ben Goz 已提交
249
#endif /* KFD_DEVICE_QUEUE_MANAGER_H_ */