/*
 * Copyright (C) 2001  Dave Engebretsen & Todd Inglett IBM Corporation.
 * Copyright 2001-2012 IBM Corporation.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 */

20 21
#ifndef _POWERPC_EEH_H
#define _POWERPC_EEH_H
22
#ifdef __KERNEL__
L
Linus Torvalds 已提交
23 24 25 26 27 28

#include <linux/init.h>
#include <linux/list.h>
#include <linux/string.h>

struct pci_dev;
29
struct pci_bus;
L
Linus Torvalds 已提交
30 31 32 33
struct device_node;

#ifdef CONFIG_EEH

34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
/*
 * The struct is used to trace PE related EEH functionality.
 * In theory, one instance of the struct is created for each
 * particular PE. By nature, PEs correlate to each other, so the
 * struct has to reflect that hierarchy in order to easily pick
 * up the affected PEs when one particular PE has EEH errors.
 *
 * Also, one particular PE might be composed of a PCI device, or a
 * PCI bus and its subordinate components. The struct also needs to
 * carry that information. Furthermore, one particular PE is only
 * meaningful in the corresponding PHB. Therefore, the root PEs should
 * be created against existing PHBs in one-to-one fashion.
 */
#define EEH_PE_PHB	1	/* PHB PE    */
#define EEH_PE_DEVICE 	2	/* Device PE */
#define EEH_PE_BUS	3	/* Bus PE    */

#define EEH_PE_ISOLATED		(1 << 0)	/* Isolated PE		*/
#define EEH_PE_RECOVERING	(1 << 1)	/* Recovering PE	*/

/*
 * Per-PE record: PE type and state, its addresses, the owning PHB,
 * error counters, and the list linkage to the parent PE, the child
 * PEs and the EEH devices that belong to the PE.
 *
 * NOTE(review): the comments on @child_list and @child read as if
 * they were swapped (one of them should be the list head owned by
 * this PE, the other the node linking this PE into its parent's
 * list) -- confirm against the code that calls list_add on them.
 */
struct eeh_pe {
	int type;			/* PE type: EEH_PE_PHB/BUS/DEVICE */
	int state;			/* PE EEH dependent mode; presumably EEH_PE_* flag bits -- confirm */
	int config_addr;		/* Traditional PCI address	*/
	int addr;			/* PE configuration address	*/
	struct pci_controller *phb;	/* Associated PHB		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	struct eeh_pe *parent;		/* Parent PE			*/
	struct list_head child_list;	/* Link PE to the child list	*/
	struct list_head edevs;		/* Head of eeh_dev entries, linked via eeh_dev.list */
	struct list_head child;		/* Child PEs			*/
};

70 71 72
/*
 * Iterate over every EEH device attached to a PE.
 *
 * @pe:   pointer to the struct eeh_pe whose ->edevs list is walked
 * @edev: struct eeh_dev * used as the loop cursor
 *
 * @pe is parenthesized so that any pointer expression (e.g. "pes + 1")
 * can be passed, not just a plain identifier.
 */
#define eeh_pe_for_each_dev(pe, edev) \
		list_for_each_entry(edev, &(pe)->edevs, list)

G
Gavin Shan 已提交
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94
/*
 * The struct is used to trace EEH state for the associated
 * PCI device node or PCI device. In future, it might
 * represent the PE as well, so that the EEH devices form
 * another tree besides the currently existing tree of PCI
 * buses and PCI devices.
 */
#define EEH_MODE_SUPPORTED	(1<<0)	/* EEH supported on the device	*/
#define EEH_MODE_NOCHECK	(1<<1)	/* EEH check should be skipped	*/
#define EEH_MODE_ISOLATED	(1<<2)	/* The device has been isolated	*/
#define EEH_MODE_RECOVERING	(1<<3)	/* Recovering the device	*/
#define EEH_MODE_IRQ_DISABLED	(1<<4)	/* Interrupt disabled		*/

struct eeh_dev {
	int mode;			/* EEH mode			*/
	int class_code;			/* Class code of the device	*/
	int config_addr;		/* Config address		*/
	int pe_config_addr;		/* PE config address		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	u32 config_space[16];		/* Saved PCI config space	*/
95 96
	struct eeh_pe *pe;		/* Associated PE		*/
	struct list_head list;		/* Form link list in the PE	*/
G
Gavin Shan 已提交
97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
	struct pci_controller *phb;	/* Associated PHB		*/
	struct device_node *dn;		/* Associated device node	*/
	struct pci_dev *pdev;		/* Associated PCI device	*/
};

/* Return the device node stored in @edev (its ->dn member). */
static inline struct device_node *eeh_dev_to_of_node(struct eeh_dev *edev)
{
	struct device_node *node = edev->dn;

	return node;
}

/* Return the PCI device stored in @edev (its ->pdev member). */
static inline struct pci_dev *eeh_dev_to_pci_dev(struct eeh_dev *edev)
{
	struct pci_dev *dev = edev->pdev;

	return dev;
}

112 113 114 115 116 117 118
/*
 * The struct is used to trace the registered EEH operation
 * callback functions. Actually, those operation callback
 * functions are heavily platform dependent. That means the
 * platform should register its own EEH operation callback
 * functions before any EEH further operations.
 */
119 120 121 122
/* EEH_OPT_*: option codes */
#define EEH_OPT_DISABLE		0	/* EEH disable	*/
#define EEH_OPT_ENABLE		1	/* EEH enable	*/
#define EEH_OPT_THAW_MMIO	2	/* MMIO enable	*/
#define EEH_OPT_THAW_DMA	3	/* DMA enable	*/

/* EEH_STATE_*: state flag bits */
#define EEH_STATE_UNAVAILABLE	(1 << 0)	/* State unavailable	*/
#define EEH_STATE_NOT_SUPPORT	(1 << 1)	/* EEH not supported	*/
#define EEH_STATE_RESET_ACTIVE	(1 << 2)	/* Active reset		*/
#define EEH_STATE_MMIO_ACTIVE	(1 << 3)	/* Active MMIO		*/
#define EEH_STATE_DMA_ACTIVE	(1 << 4)	/* Active DMA		*/
#define EEH_STATE_MMIO_ENABLED	(1 << 5)	/* MMIO enabled		*/
#define EEH_STATE_DMA_ENABLED	(1 << 6)	/* DMA enabled		*/

/* EEH_RESET_*: reset codes (note: value 2 is not defined here) */
#define EEH_RESET_DEACTIVATE	0	/* Deactivate the PE reset	*/
#define EEH_RESET_HOT		1	/* Hot reset			*/
#define EEH_RESET_FUNDAMENTAL	3	/* Fundamental reset		*/

/* EEH_LOG_*: error log kinds */
#define EEH_LOG_TEMP		1	/* EEH temporary error log	*/
#define EEH_LOG_PERM		2	/* EEH permanent error log	*/
135

136 137 138
struct eeh_ops {
	char *name;
	int (*init)(void);
139 140 141 142 143 144 145
	int (*set_option)(struct eeh_pe *pe, int option);
	int (*get_pe_addr)(struct eeh_pe *pe);
	int (*get_state)(struct eeh_pe *pe, int *state);
	int (*reset)(struct eeh_pe *pe, int option);
	int (*wait_state)(struct eeh_pe *pe, int max_wait);
	int (*get_log)(struct eeh_pe *pe, int severity, char *drv_log, unsigned long len);
	int (*configure_bridge)(struct eeh_pe *pe);
146 147
	int (*read_config)(struct device_node *dn, int where, int size, u32 *val);
	int (*write_config)(struct device_node *dn, int where, int size, u32 val);
148 149 150
};

extern struct eeh_ops *eeh_ops;
151
extern int eeh_subsystem_enabled;
G
Gavin Shan 已提交
152 153 154 155 156 157 158 159 160 161 162
extern struct mutex eeh_mutex;

/* Take the global eeh_mutex. */
static inline void eeh_lock(void)
{
	struct mutex *lock = &eeh_mutex;

	mutex_lock(lock);
}

/* Release the global eeh_mutex. */
static inline void eeh_unlock(void)
{
	struct mutex *lock = &eeh_mutex;

	mutex_unlock(lock);
}
163

164 165 166 167
/*
 * Max number of EEH freezes allowed before we consider the device
 * to be permanently disabled.
 */
168 169
#define EEH_MAX_ALLOWED_FREEZES 5

170
typedef void *(*eeh_traverse_func)(void *data, void *flag);
G
Gavin Shan 已提交
171
int __devinit eeh_phb_pe_create(struct pci_controller *phb);
172
int eeh_add_to_parent_pe(struct eeh_dev *edev);
173
int eeh_rmv_from_parent_pe(struct eeh_dev *edev);
174 175 176
void *eeh_pe_dev_traverse(struct eeh_pe *root,
		eeh_traverse_func fn, void *flag);
void eeh_pe_restore_bars(struct eeh_pe *pe);
G
Gavin Shan 已提交
177

G
Gavin Shan 已提交
178 179
void * __devinit eeh_dev_init(struct device_node *dn, void *data);
void __devinit eeh_dev_phb_init_dynamic(struct pci_controller *phb);
180 181
int __init eeh_ops_register(struct eeh_ops *ops);
int __exit eeh_ops_unregister(const char *name);
L
Linus Torvalds 已提交
182 183 184 185
unsigned long eeh_check_failure(const volatile void __iomem *token,
				unsigned long val);
int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev);
void __init pci_addr_cache_build(void);
186
void eeh_add_device_tree_early(struct device_node *);
187
void eeh_add_device_tree_late(struct pci_bus *);
188 189
void eeh_remove_bus_device(struct pci_dev *);

L
Linus Torvalds 已提交
190 191 192 193 194 195
/**
 * EEH_POSSIBLE_ERROR() -- test for possible MMIO failure.
 *
 * If this macro yields TRUE, the caller relays to eeh_check_failure()
 * which does further tests out of line.
 */
196
#define EEH_POSSIBLE_ERROR(val, type)	((val) == (type)~0 && eeh_subsystem_enabled)
L
Linus Torvalds 已提交
197 198 199 200 201 202 203 204 205

/*
 * Reads from a device which has been isolated by EEH will return
 * all 1s.  This macro gives an all-1s value of the given size (in
 * bytes: 1, 2, or 4) for comparing with the result of a read.
 */
#define EEH_IO_ERROR_VALUE(size)	(~0U >> ((4 - (size)) * 8))

#else /* !CONFIG_EEH */
G
Gavin Shan 已提交
206 207 208 209 210 211 212 213

static inline void *eeh_dev_init(struct device_node *dn, void *data)
{
	return NULL;
}

static inline void eeh_dev_phb_init_dynamic(struct pci_controller *phb) { }

L
Linus Torvalds 已提交
214 215 216 217 218 219 220 221 222 223 224 225
static inline unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned long val)
{
	return val;
}

static inline int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev)
{
	return 0;
}

static inline void pci_addr_cache_build(void) { }

226 227
static inline void eeh_add_device_tree_early(struct device_node *dn) { }

228 229
static inline void eeh_add_device_tree_late(struct pci_bus *bus) { }

230
static inline void eeh_remove_bus_device(struct pci_dev *dev) { }
G
Gavin Shan 已提交
231 232 233 234

static inline void eeh_lock(void) { }
static inline void eeh_unlock(void) { }

L
Linus Torvalds 已提交
235 236 237 238
#define EEH_POSSIBLE_ERROR(val, type) (0)
#define EEH_IO_ERROR_VALUE(size) (-1UL)
#endif /* CONFIG_EEH */

239
#ifdef CONFIG_PPC64
240
/*
L
Linus Torvalds 已提交
241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265
 * MMIO read/write operations with EEH support.
 */
/*
 * Read one byte with in_8(). An all-ones result (with EEH enabled)
 * is handed to eeh_check_failure() and its return value is returned
 * instead.
 */
static inline u8 eeh_readb(const volatile void __iomem *addr)
{
	u8 data = in_8(addr);

	if (!EEH_POSSIBLE_ERROR(data, u8))
		return data;

	return eeh_check_failure(addr, data);
}

/*
 * Read a 16-bit value with in_le16(). An all-ones result (with EEH
 * enabled) is handed to eeh_check_failure() and its return value is
 * returned instead.
 */
static inline u16 eeh_readw(const volatile void __iomem *addr)
{
	u16 data = in_le16(addr);

	if (!EEH_POSSIBLE_ERROR(data, u16))
		return data;

	return eeh_check_failure(addr, data);
}

/*
 * Read a 32-bit value with in_le32(). An all-ones result (with EEH
 * enabled) is handed to eeh_check_failure() and its return value is
 * returned instead.
 */
static inline u32 eeh_readl(const volatile void __iomem *addr)
{
	u32 data = in_le32(addr);

	if (!EEH_POSSIBLE_ERROR(data, u32))
		return data;

	return eeh_check_failure(addr, data);
}
266 267

/*
 * Read a 64-bit value with in_le64(). An all-ones result (with EEH
 * enabled) is handed to eeh_check_failure() and its return value is
 * returned instead.
 */
static inline u64 eeh_readq(const volatile void __iomem *addr)
{
	u64 val = in_le64(addr);
	if (EEH_POSSIBLE_ERROR(val, u64))
		return eeh_check_failure(addr, val);
	return val;
}

275
/*
 * Read a 16-bit value with in_be16(). An all-ones result (with EEH
 * enabled) is handed to eeh_check_failure() and its return value is
 * returned instead.
 */
static inline u16 eeh_readw_be(const volatile void __iomem *addr)
{
	u16 val = in_be16(addr);
	if (EEH_POSSIBLE_ERROR(val, u16))
		return eeh_check_failure(addr, val);
	return val;
}
282 283

/*
 * Read a 32-bit value with in_be32(). An all-ones result (with EEH
 * enabled) is handed to eeh_check_failure() and its return value is
 * returned instead.
 */
static inline u32 eeh_readl_be(const volatile void __iomem *addr)
{
	u32 val = in_be32(addr);
	if (EEH_POSSIBLE_ERROR(val, u32))
		return eeh_check_failure(addr, val);
	return val;
}
290 291

/*
 * Read a 64-bit value with in_be64(). An all-ones result (with EEH
 * enabled) is handed to eeh_check_failure() and its return value is
 * returned instead.
 */
static inline u64 eeh_readq_be(const volatile void __iomem *addr)
{
	u64 val = in_be64(addr);
	if (EEH_POSSIBLE_ERROR(val, u64))
		return eeh_check_failure(addr, val);
	return val;
}

299 300
/*
 * Copy @n bytes from I/O memory at @src to @dest with _memcpy_fromio(),
 * then probe the result for a possible EEH failure.
 */
static inline void eeh_memcpy_fromio(void *dest, const
				     volatile void __iomem *src,
				     unsigned long n)
{
	_memcpy_fromio(dest, src, n);

	/*
	 * Look for ffff's in the last four bytes copied to dest
	 * (dest[n-4] .. dest[n-1]). Copies shorter than four bytes
	 * are not checked at all.
	 */
	if (n >= 4 && EEH_POSSIBLE_ERROR(*((u32 *)(dest + n - 4)), u32))
		eeh_check_failure(src, *((u32 *)(dest + n - 4)));
}

/* in-string eeh macros */
313 314
/*
 * Read @ns bytes from @addr into @buf with _insb(), then probe for a
 * possible EEH failure: if the last byte read is all ones (and EEH is
 * enabled), eeh_check_failure() is called.
 *
 * The probe is skipped when @ns <= 0, because there is no last
 * element to inspect and buf[ns - 1] would lie before the buffer.
 */
static inline void eeh_readsb(const volatile void __iomem *addr, void * buf,
			      int ns)
{
	_insb(addr, buf, ns);
	if (ns > 0 && EEH_POSSIBLE_ERROR((*(((u8*)buf)+ns-1)), u8))
		eeh_check_failure(addr, *(u8*)buf);
}

321 322
/*
 * Read @ns 16-bit values from @addr into @buf with _insw(), then probe
 * for a possible EEH failure: if the last value read is all ones (and
 * EEH is enabled), eeh_check_failure() is called.
 *
 * The probe is skipped when @ns <= 0, because there is no last
 * element to inspect and buf[ns - 1] would lie before the buffer.
 */
static inline void eeh_readsw(const volatile void __iomem *addr, void * buf,
			      int ns)
{
	_insw(addr, buf, ns);
	if (ns > 0 && EEH_POSSIBLE_ERROR((*(((u16*)buf)+ns-1)), u16))
		eeh_check_failure(addr, *(u16*)buf);
}

329 330
/*
 * Read @nl 32-bit values from @addr into @buf with _insl(), then probe
 * for a possible EEH failure: if the last value read is all ones (and
 * EEH is enabled), eeh_check_failure() is called.
 *
 * The probe is skipped when @nl <= 0, because there is no last
 * element to inspect and buf[nl - 1] would lie before the buffer.
 */
static inline void eeh_readsl(const volatile void __iomem *addr, void * buf,
			      int nl)
{
	_insl(addr, buf, nl);
	if (nl > 0 && EEH_POSSIBLE_ERROR((*(((u32*)buf)+nl-1)), u32))
		eeh_check_failure(addr, *(u32*)buf);
}

337
#endif /* CONFIG_PPC64 */
338
#endif /* __KERNEL__ */
339
#endif /* _POWERPC_EEH_H */