eeh.h 10.5 KB
Newer Older
1
/*
L
Linus Torvalds 已提交
2
 * Copyright (C) 2001  Dave Engebretsen & Todd Inglett IBM Corporation.
3
 * Copyright 2001-2012 IBM Corporation.
L
Linus Torvalds 已提交
4 5 6 7 8
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
9
 *
L
Linus Torvalds 已提交
10 11 12 13
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
14
 *
L
Linus Torvalds 已提交
15 16 17 18 19
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 */

20 21
#ifndef _POWERPC_EEH_H
#define _POWERPC_EEH_H
22
#ifdef __KERNEL__
L
Linus Torvalds 已提交
23 24 25 26 27 28

#include <linux/init.h>
#include <linux/list.h>
#include <linux/string.h>

struct pci_dev;
29
struct pci_bus;
L
Linus Torvalds 已提交
30 31 32 33
struct device_node;

#ifdef CONFIG_EEH

34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
/*
 * The struct is used to trace PE related EEH functionality.
 * In theory, there will have one instance of the struct to
 * be created against particular PE. In nature, PEs corelate
 * to each other. the struct has to reflect that hierarchy in
 * order to easily pick up those affected PEs when one particular
 * PE has EEH errors.
 *
 * Also, one particular PE might be composed of PCI device, PCI
 * bus and its subordinate components. The struct also need ship
 * the information. Further more, one particular PE is only meaingful
 * in the corresponding PHB. Therefore, the root PEs should be created
 * against existing PHBs in on-to-one fashion.
 */
#define EEH_PE_PHB	1	/* PHB PE    */
#define EEH_PE_DEVICE 	2	/* Device PE */
#define EEH_PE_BUS	3	/* Bus PE    */

#define EEH_PE_ISOLATED		(1 << 0)	/* Isolated PE		*/
#define EEH_PE_RECOVERING	(1 << 1)	/* Recovering PE	*/

struct eeh_pe {
	int type;			/* PE type: PHB/Bus/Device	*/
	int state;			/* PE EEH dependent mode	*/
	int config_addr;		/* Traditional PCI address	*/
	int addr;			/* PE configuration address	*/
	struct pci_controller *phb;	/* Associated PHB		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	struct eeh_pe *parent;		/* Parent PE			*/
	struct list_head child_list;	/* Link PE to the child list	*/
	struct list_head edevs;		/* Link list of EEH devices	*/
	struct list_head child;		/* Child PEs			*/
};

G
Gavin Shan 已提交
70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91
/*
 * The struct is used to trace EEH state for the associated
 * PCI device node or PCI device. In future, it might
 * represent PE as well so that the EEH device to form
 * another tree except the currently existing tree of PCI
 * buses and PCI devices
 */
#define EEH_MODE_SUPPORTED	(1<<0)	/* EEH supported on the device	*/
#define EEH_MODE_NOCHECK	(1<<1)	/* EEH check should be skipped	*/
#define EEH_MODE_ISOLATED	(1<<2)	/* The device has been isolated	*/
#define EEH_MODE_RECOVERING	(1<<3)	/* Recovering the device	*/
#define EEH_MODE_IRQ_DISABLED	(1<<4)	/* Interrupt disabled		*/

struct eeh_dev {
	int mode;			/* EEH mode			*/
	int class_code;			/* Class code of the device	*/
	int config_addr;		/* Config address		*/
	int pe_config_addr;		/* PE config address		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	u32 config_space[16];		/* Saved PCI config space	*/
92 93
	struct eeh_pe *pe;		/* Associated PE		*/
	struct list_head list;		/* Form link list in the PE	*/
G
Gavin Shan 已提交
94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
	struct pci_controller *phb;	/* Associated PHB		*/
	struct device_node *dn;		/* Associated device node	*/
	struct pci_dev *pdev;		/* Associated PCI device	*/
};

static inline struct device_node *eeh_dev_to_of_node(struct eeh_dev *edev)
{
	return edev->dn;
}

static inline struct pci_dev *eeh_dev_to_pci_dev(struct eeh_dev *edev)
{
	return edev->pdev;
}

109 110 111 112 113 114 115
/*
 * The struct is used to trace the registered EEH operation
 * callback functions. Actually, those operation callback
 * functions are heavily platform dependent. That means the
 * platform should register its own EEH operation callback
 * functions before any EEH further operations.
 */
116 117 118 119
#define EEH_OPT_DISABLE		0	/* EEH disable	*/
#define EEH_OPT_ENABLE		1	/* EEH enable	*/
#define EEH_OPT_THAW_MMIO	2	/* MMIO enable	*/
#define EEH_OPT_THAW_DMA	3	/* DMA enable	*/
120 121 122 123 124 125 126
#define EEH_STATE_UNAVAILABLE	(1 << 0)	/* State unavailable	*/
#define EEH_STATE_NOT_SUPPORT	(1 << 1)	/* EEH not supported	*/
#define EEH_STATE_RESET_ACTIVE	(1 << 2)	/* Active reset		*/
#define EEH_STATE_MMIO_ACTIVE	(1 << 3)	/* Active MMIO		*/
#define EEH_STATE_DMA_ACTIVE	(1 << 4)	/* Active DMA		*/
#define EEH_STATE_MMIO_ENABLED	(1 << 5)	/* MMIO enabled		*/
#define EEH_STATE_DMA_ENABLED	(1 << 6)	/* DMA enabled		*/
127 128 129
#define EEH_RESET_DEACTIVATE	0	/* Deactivate the PE reset	*/
#define EEH_RESET_HOT		1	/* Hot reset			*/
#define EEH_RESET_FUNDAMENTAL	3	/* Fundamental reset		*/
130 131
#define EEH_LOG_TEMP		1	/* EEH temporary error log	*/
#define EEH_LOG_PERM		2	/* EEH permanent error log	*/
132

133 134 135 136 137 138 139 140 141 142
struct eeh_ops {
	char *name;
	int (*init)(void);
	int (*set_option)(struct device_node *dn, int option);
	int (*get_pe_addr)(struct device_node *dn);
	int (*get_state)(struct device_node *dn, int *state);
	int (*reset)(struct device_node *dn, int option);
	int (*wait_state)(struct device_node *dn, int max_wait);
	int (*get_log)(struct device_node *dn, int severity, char *drv_log, unsigned long len);
	int (*configure_bridge)(struct device_node *dn);
143 144
	int (*read_config)(struct device_node *dn, int where, int size, u32 *val);
	int (*write_config)(struct device_node *dn, int where, int size, u32 val);
145 146 147
};

extern struct eeh_ops *eeh_ops;
148
extern int eeh_subsystem_enabled;
G
Gavin Shan 已提交
149 150 151 152 153 154 155 156 157 158 159
extern struct mutex eeh_mutex;

static inline void eeh_lock(void)
{
	mutex_lock(&eeh_mutex);
}

static inline void eeh_unlock(void)
{
	mutex_unlock(&eeh_mutex);
}
160

161 162 163 164
/*
 * Max number of EEH freezes allowed before we consider the device
 * to be permanently disabled.
 */
165 166
#define EEH_MAX_ALLOWED_FREEZES 5

167
typedef void *(*eeh_traverse_func)(void *data, void *flag);
G
Gavin Shan 已提交
168
int __devinit eeh_phb_pe_create(struct pci_controller *phb);
169
int eeh_add_to_parent_pe(struct eeh_dev *edev);
170
int eeh_rmv_from_parent_pe(struct eeh_dev *edev);
G
Gavin Shan 已提交
171

G
Gavin Shan 已提交
172 173
void * __devinit eeh_dev_init(struct device_node *dn, void *data);
void __devinit eeh_dev_phb_init_dynamic(struct pci_controller *phb);
174 175
int __init eeh_ops_register(struct eeh_ops *ops);
int __exit eeh_ops_unregister(const char *name);
L
Linus Torvalds 已提交
176 177 178 179
unsigned long eeh_check_failure(const volatile void __iomem *token,
				unsigned long val);
int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev);
void __init pci_addr_cache_build(void);
180
void eeh_add_device_tree_early(struct device_node *);
181
void eeh_add_device_tree_late(struct pci_bus *);
182 183
void eeh_remove_bus_device(struct pci_dev *);

L
Linus Torvalds 已提交
184 185 186 187 188 189
/**
 * EEH_POSSIBLE_ERROR() -- test for possible MMIO failure.
 *
 * If this macro yields TRUE, the caller relays to eeh_check_failure()
 * which does further tests out of line.
 */
190
#define EEH_POSSIBLE_ERROR(val, type)	((val) == (type)~0 && eeh_subsystem_enabled)
L
Linus Torvalds 已提交
191 192 193 194 195 196 197 198 199

/*
 * Reads from a device which has been isolated by EEH will return
 * all 1s.  This macro gives an all-1s value of the given size (in
 * bytes: 1, 2, or 4) for comparing with the result of a read.
 */
#define EEH_IO_ERROR_VALUE(size)	(~0U >> ((4 - (size)) * 8))

#else /* !CONFIG_EEH */
G
Gavin Shan 已提交
200 201 202 203 204 205 206 207

static inline void *eeh_dev_init(struct device_node *dn, void *data)
{
	return NULL;
}

static inline void eeh_dev_phb_init_dynamic(struct pci_controller *phb) { }

L
Linus Torvalds 已提交
208 209 210 211 212 213 214 215 216 217 218 219
static inline unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned long val)
{
	return val;
}

static inline int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev)
{
	return 0;
}

static inline void pci_addr_cache_build(void) { }

220 221
static inline void eeh_add_device_tree_early(struct device_node *dn) { }

222 223
static inline void eeh_add_device_tree_late(struct pci_bus *bus) { }

224
static inline void eeh_remove_bus_device(struct pci_dev *dev) { }
G
Gavin Shan 已提交
225 226 227 228

static inline void eeh_lock(void) { }
static inline void eeh_unlock(void) { }

L
Linus Torvalds 已提交
229 230 231 232
#define EEH_POSSIBLE_ERROR(val, type) (0)
#define EEH_IO_ERROR_VALUE(size) (-1UL)
#endif /* CONFIG_EEH */

233
#ifdef CONFIG_PPC64
234
/*
L
Linus Torvalds 已提交
235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259
 * MMIO read/write operations with EEH support.
 */
static inline u8 eeh_readb(const volatile void __iomem *addr)
{
	u8 val = in_8(addr);
	if (EEH_POSSIBLE_ERROR(val, u8))
		return eeh_check_failure(addr, val);
	return val;
}

static inline u16 eeh_readw(const volatile void __iomem *addr)
{
	u16 val = in_le16(addr);
	if (EEH_POSSIBLE_ERROR(val, u16))
		return eeh_check_failure(addr, val);
	return val;
}

static inline u32 eeh_readl(const volatile void __iomem *addr)
{
	u32 val = in_le32(addr);
	if (EEH_POSSIBLE_ERROR(val, u32))
		return eeh_check_failure(addr, val);
	return val;
}
260 261

static inline u64 eeh_readq(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
262
{
263 264
	u64 val = in_le64(addr);
	if (EEH_POSSIBLE_ERROR(val, u64))
L
Linus Torvalds 已提交
265 266 267 268
		return eeh_check_failure(addr, val);
	return val;
}

269
static inline u16 eeh_readw_be(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
270
{
271 272
	u16 val = in_be16(addr);
	if (EEH_POSSIBLE_ERROR(val, u16))
L
Linus Torvalds 已提交
273 274 275
		return eeh_check_failure(addr, val);
	return val;
}
276 277

static inline u32 eeh_readl_be(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
278
{
279 280 281 282
	u32 val = in_be32(addr);
	if (EEH_POSSIBLE_ERROR(val, u32))
		return eeh_check_failure(addr, val);
	return val;
L
Linus Torvalds 已提交
283
}
284 285

static inline u64 eeh_readq_be(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
286 287 288 289 290 291 292
{
	u64 val = in_be64(addr);
	if (EEH_POSSIBLE_ERROR(val, u64))
		return eeh_check_failure(addr, val);
	return val;
}

293 294
static inline void eeh_memcpy_fromio(void *dest, const
				     volatile void __iomem *src,
L
Linus Torvalds 已提交
295 296
				     unsigned long n)
{
297
	_memcpy_fromio(dest, src, n);
L
Linus Torvalds 已提交
298 299 300 301

	/* Look for ffff's here at dest[n].  Assume that at least 4 bytes
	 * were copied. Check all four bytes.
	 */
302 303
	if (n >= 4 && EEH_POSSIBLE_ERROR(*((u32 *)(dest + n - 4)), u32))
		eeh_check_failure(src, *((u32 *)(dest + n - 4)));
L
Linus Torvalds 已提交
304 305 306
}

/* in-string eeh macros */
307 308
static inline void eeh_readsb(const volatile void __iomem *addr, void * buf,
			      int ns)
L
Linus Torvalds 已提交
309
{
310
	_insb(addr, buf, ns);
L
Linus Torvalds 已提交
311
	if (EEH_POSSIBLE_ERROR((*(((u8*)buf)+ns-1)), u8))
312
		eeh_check_failure(addr, *(u8*)buf);
L
Linus Torvalds 已提交
313 314
}

315 316
static inline void eeh_readsw(const volatile void __iomem *addr, void * buf,
			      int ns)
L
Linus Torvalds 已提交
317
{
318
	_insw(addr, buf, ns);
L
Linus Torvalds 已提交
319
	if (EEH_POSSIBLE_ERROR((*(((u16*)buf)+ns-1)), u16))
320
		eeh_check_failure(addr, *(u16*)buf);
L
Linus Torvalds 已提交
321 322
}

323 324
static inline void eeh_readsl(const volatile void __iomem *addr, void * buf,
			      int nl)
L
Linus Torvalds 已提交
325
{
326
	_insl(addr, buf, nl);
L
Linus Torvalds 已提交
327
	if (EEH_POSSIBLE_ERROR((*(((u32*)buf)+nl-1)), u32))
328
		eeh_check_failure(addr, *(u32*)buf);
L
Linus Torvalds 已提交
329 330
}

331
#endif /* CONFIG_PPC64 */
332
#endif /* __KERNEL__ */
333
#endif /* _POWERPC_EEH_H */