kfd_device_queue_manager.h 8.3 KB
Newer Older
B
Ben Goz 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * Copyright 2014 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#ifndef KFD_DEVICE_QUEUE_MANAGER_H_
#define KFD_DEVICE_QUEUE_MANAGER_H_

#include <linux/rwsem.h>
#include <linux/list.h>
29 30
#include <linux/mutex.h>
#include <linux/sched/mm.h>
B
Ben Goz 已提交
31 32 33
#include "kfd_priv.h"
#include "kfd_mqd_manager.h"

34 35
/* Unmap latency; the _MS suffix indicates the value is in milliseconds. */
#define KFD_UNMAP_LATENCY_MS (4000)

/* Default queue preemption timeout: twice the unmap latency plus 1000. */
#define QUEUE_PREEMPT_DEFAULT_TIMEOUT_MS \
	((KFD_UNMAP_LATENCY_MS * 2) + 1000)
B
Ben Goz 已提交
36 37 38 39 40 41

/*
 * List node that carries one qcm_process_device pointer.
 * NOTE(review): presumably one node per process registered with a device
 * queue manager - confirm against the code that allocates these nodes.
 */
struct device_process_node {
	/* The qcm_process_device this node refers to. */
	struct qcm_process_device *qpd;
	/* Linkage into the list that holds this node. */
	struct list_head list;
};

42
/**
43
 * struct device_queue_manager_ops
44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75
 *
 * @create_queue: Queue creation routine.
 *
 * @destroy_queue: Queue destruction routine.
 *
 * @update_queue: Queue update routine.
 *
 * @exeute_queues: Dispatches the queues list to the H/W.
 *
 * @register_process: This routine associates a specific process with device.
 *
 * @unregister_process: destroys the associations between process to device.
 *
 * @initialize: Initializes the pipelines and memory module for that device.
 *
 * @start: Initializes the resources/modules the the device needs for queues
 * execution. This function is called on device initialization and after the
 * system woke up after suspension.
 *
 * @stop: This routine stops execution of all the active queue running on the
 * H/W and basically this function called on system suspend.
 *
 * @uninitialize: Destroys all the device queue manager resources allocated in
 * initialize routine.
 *
 * @create_kernel_queue: Creates kernel queue. Used for debug queue.
 *
 * @destroy_kernel_queue: Destroys kernel queue. Used for debug queue.
 *
 * @set_cache_memory_policy: Sets memory policy (cached/ non cached) for the
 * memory apertures.
 *
76 77
 * @process_termination: Clears all process queues belongs to that device.
 *
78 79 80 81
 * @evict_process_queues: Evict all active queues of a process
 *
 * @restore_process_queues: Restore all evicted queues queues of a process
 *
82 83
 * @get_wave_state: Retrieves context save state and optionally copies the
 * control stack, if kept in the MQD, to the given userspace address.
84 85
 */

86
struct device_queue_manager_ops {
B
Ben Goz 已提交
87 88
	int	(*create_queue)(struct device_queue_manager *dqm,
				struct queue *q,
89
				struct qcm_process_device *qpd);
90

B
Ben Goz 已提交
91 92 93
	int	(*destroy_queue)(struct device_queue_manager *dqm,
				struct qcm_process_device *qpd,
				struct queue *q);
94

B
Ben Goz 已提交
95 96
	int	(*update_queue)(struct device_queue_manager *dqm,
				struct queue *q);
97

B
Ben Goz 已提交
98 99
	int	(*register_process)(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
100

B
Ben Goz 已提交
101 102
	int	(*unregister_process)(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
103

B
Ben Goz 已提交
104 105 106 107 108 109 110
	int	(*initialize)(struct device_queue_manager *dqm);
	int	(*start)(struct device_queue_manager *dqm);
	int	(*stop)(struct device_queue_manager *dqm);
	void	(*uninitialize)(struct device_queue_manager *dqm);
	int	(*create_kernel_queue)(struct device_queue_manager *dqm,
					struct kernel_queue *kq,
					struct qcm_process_device *qpd);
111

B
Ben Goz 已提交
112 113 114
	void	(*destroy_kernel_queue)(struct device_queue_manager *dqm,
					struct kernel_queue *kq,
					struct qcm_process_device *qpd);
115

B
Ben Goz 已提交
116 117 118 119 120 121
	bool	(*set_cache_memory_policy)(struct device_queue_manager *dqm,
					   struct qcm_process_device *qpd,
					   enum cache_policy default_policy,
					   enum cache_policy alternate_policy,
					   void __user *alternate_aperture_base,
					   uint64_t alternate_aperture_size);
122

123 124 125 126 127
	int	(*set_trap_handler)(struct device_queue_manager *dqm,
				    struct qcm_process_device *qpd,
				    uint64_t tba_addr,
				    uint64_t tma_addr);

128 129
	int (*process_termination)(struct device_queue_manager *dqm,
			struct qcm_process_device *qpd);
130 131 132 133 134

	int (*evict_process_queues)(struct device_queue_manager *dqm,
				    struct qcm_process_device *qpd);
	int (*restore_process_queues)(struct device_queue_manager *dqm,
				      struct qcm_process_device *qpd);
135 136 137 138 139 140

	int	(*get_wave_state)(struct device_queue_manager *dqm,
				  struct queue *q,
				  void __user *ctl_stack,
				  u32 *ctl_stack_used_size,
				  u32 *save_area_used_size);
141 142
};

143
struct device_queue_manager_asic_ops {
144
	int	(*update_qpd)(struct device_queue_manager *dqm,
145 146 147 148 149 150 151
					struct qcm_process_device *qpd);
	bool	(*set_cache_memory_policy)(struct device_queue_manager *dqm,
					   struct qcm_process_device *qpd,
					   enum cache_policy default_policy,
					   enum cache_policy alternate_policy,
					   void __user *alternate_aperture_base,
					   uint64_t alternate_aperture_size);
152 153 154
	void	(*init_sdma_vm)(struct device_queue_manager *dqm,
				struct queue *q,
				struct qcm_process_device *qpd);
155 156
	struct mqd_manager *	(*mqd_manager_init)(enum KFD_MQD_TYPE type,
				 struct kfd_dev *dev);
157 158
};

159 160 161 162 163 164 165 166 167 168 169
/**
 * struct device_queue_manager
 *
 * This struct is a base class for the kfd queues scheduler in the
 * device level. The device base class should expose the basic operations
 * for queue creation and queue destruction. This base class hides the
 * scheduling mode of the driver and the specific implementation of the
 * concrete device. This class is the only class in the queues scheduler
 * that configures the H/W.
 *
 */
B
Ben Goz 已提交
170

171 172
struct device_queue_manager {
	struct device_queue_manager_ops ops;
173
	struct device_queue_manager_asic_ops asic_ops;
B
Ben Goz 已提交
174

175
	struct mqd_manager	*mqd_mgrs[KFD_MQD_TYPE_MAX];
B
Ben Goz 已提交
176 177
	struct packet_manager	packets;
	struct kfd_dev		*dev;
178
	struct mutex		lock_hidden; /* use dqm_lock/unlock(dqm) */
B
Ben Goz 已提交
179
	struct list_head	queues;
180
	unsigned int		saved_flags;
B
Ben Goz 已提交
181 182
	unsigned int		processes_count;
	unsigned int		queue_count;
183
	unsigned int		sdma_queue_count;
184
	unsigned int		total_queue_count;
B
Ben Goz 已提交
185 186
	unsigned int		next_pipe_to_allocate;
	unsigned int		*allocated_queues;
O
Oak Zeng 已提交
187
	uint64_t		sdma_bitmap;
B
Ben Goz 已提交
188 189 190 191 192 193 194
	unsigned int		vmid_bitmap;
	uint64_t		pipelines_addr;
	struct kfd_mem_obj	*pipeline_mem;
	uint64_t		fence_gpu_addr;
	unsigned int		*fence_addr;
	struct kfd_mem_obj	*fence_mem;
	bool			active_runlist;
195
	int			sched_policy;
196 197 198 199

	/* hw exception  */
	bool			is_hws_hang;
	struct work_struct	hw_exception_work;
B
Ben Goz 已提交
200 201
};

202 203
/*
 * Each init function receives a device_queue_manager_asic_ops table.
 * NOTE(review): the hardware variant each one targets is inferred from its
 * name suffix; the implementations are not part of this header.
 */
void device_queue_manager_init_cik(
		struct device_queue_manager_asic_ops *asic_ops);
void device_queue_manager_init_cik_hawaii(
		struct device_queue_manager_asic_ops *asic_ops);
void device_queue_manager_init_vi(
		struct device_queue_manager_asic_ops *asic_ops);
void device_queue_manager_init_vi_tonga(
		struct device_queue_manager_asic_ops *asic_ops);
void device_queue_manager_init_v9(
		struct device_queue_manager_asic_ops *asic_ops);

/* Helpers operating on a device queue manager; defined outside this header. */
void program_sh_mem_settings(struct device_queue_manager *dqm,
					struct qcm_process_device *qpd);
unsigned int get_queues_num(struct device_queue_manager *dqm);
unsigned int get_queues_per_pipe(struct device_queue_manager *dqm);
unsigned int get_pipes_per_mec(struct device_queue_manager *dqm);
unsigned int get_num_sdma_queues(struct device_queue_manager *dqm);
O
Oded Gabbay 已提交
218

219
static inline unsigned int get_sh_mem_bases_32(struct kfd_process_device *pdd)
O
Oded Gabbay 已提交
220 221 222 223
{
	return (pdd->lds_base >> 16) & 0xFF;
}

224
static inline unsigned int
O
Oded Gabbay 已提交
225 226 227 228 229
get_sh_mem_bases_nybble_64(struct kfd_process_device *pdd)
{
	return (pdd->lds_base >> 60) & 0x0E;
}

230 231 232 233 234 235 236 237 238 239 240 241 242 243 244
/* The DQM lock can be taken in MMU notifiers. Make sure no reclaim-FS
 * happens while holding this lock anywhere to prevent deadlocks when
 * an MMU notifier runs in reclaim-FS context.
 *
 * dqm_lock() takes dqm->lock_hidden and then calls memalloc_nofs_save(),
 * keeping the returned flags in dqm->saved_flags for the matching
 * dqm_unlock().
 */
static inline void dqm_lock(struct device_queue_manager *dqm)
{
	mutex_lock(&dqm->lock_hidden);
	/* Written only once the mutex is held. */
	dqm->saved_flags = memalloc_nofs_save();
}
/* Undo dqm_lock(): hand dqm->saved_flags to memalloc_nofs_restore() while
 * the mutex is still held, then release dqm->lock_hidden.
 */
static inline void dqm_unlock(struct device_queue_manager *dqm)
{
	/* Read saved_flags before dropping the mutex. */
	memalloc_nofs_restore(dqm->saved_flags);
	mutex_unlock(&dqm->lock_hidden);
}

B
Ben Goz 已提交
245
#endif /* KFD_DEVICE_QUEUE_MANAGER_H_ */