/*
 * Copyright (C) 2001  Dave Engebretsen & Todd Inglett IBM Corporation.
 * Copyright 2001-2012 IBM Corporation.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 */

20 21
#ifndef _POWERPC_EEH_H
#define _POWERPC_EEH_H
22
#ifdef __KERNEL__
L
Linus Torvalds 已提交
23 24 25 26 27 28

#include <linux/init.h>
#include <linux/list.h>
#include <linux/string.h>

struct pci_dev;
29
struct pci_bus;
L
Linus Torvalds 已提交
30 31 32 33
struct device_node;

#ifdef CONFIG_EEH

34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
/*
 * The struct is used to track PE-related EEH functionality.
 * In theory, one instance of the struct is created for each
 * particular PE. By nature, PEs correlate with each other, so
 * the struct has to reflect that hierarchy in order to easily
 * pick up the affected PEs when one particular PE has EEH errors.
 *
 * Also, one particular PE might be composed of a PCI device, or a
 * PCI bus and its subordinate components. The struct also needs to
 * carry that information. Furthermore, one particular PE is only
 * meaningful in the corresponding PHB. Therefore, the root PEs should
 * be created against the existing PHBs in a one-to-one fashion.
 */
/* PE types; these match the PHB/Bus/Device kinds listed for eeh_pe.type. */
#define EEH_PE_PHB	1	/* PHB PE    */
#define EEH_PE_DEVICE 	2	/* Device PE */
#define EEH_PE_BUS	3	/* Bus PE    */

/*
 * PE state bits.
 * NOTE(review): presumably OR-ed into eeh_pe.state; confirm against
 * the code that sets and tests them.
 */
#define EEH_PE_ISOLATED		(1 << 0)	/* Isolated PE		*/
#define EEH_PE_RECOVERING	(1 << 1)	/* Recovering PE	*/

/*
 * struct eeh_pe - bookkeeping for one PE.
 *
 * A PE points at its parent PE and at the PHB it belongs to, and
 * carries three list_head members used to build the PE hierarchy and
 * to collect its EEH devices.  The edevs list is the one walked by
 * eeh_pe_for_each_dev(), with each struct eeh_dev linked in through
 * its "list" member.
 *
 * NOTE(review): the one-line comments on child_list and child read as
 * if they could be swapped (list head vs. list node); confirm against
 * the code that builds the PE tree before relying on them.
 */
struct eeh_pe {
	int type;			/* PE type: PHB/Bus/Device	*/
	int state;			/* PE EEH dependent mode	*/
	int config_addr;		/* Traditional PCI address	*/
	int addr;			/* PE configuration address	*/
	struct pci_controller *phb;	/* Associated PHB		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	struct eeh_pe *parent;		/* Parent PE			*/
	struct list_head child_list;	/* Link PE to the child list	*/
	struct list_head edevs;		/* Link list of EEH devices	*/
	struct list_head child;		/* Child PEs			*/
};

70 71 72
/*
 * eeh_pe_for_each_dev - iterate over the EEH devices attached to a PE
 * @pe:   expression yielding a pointer to the PE whose edevs list is walked
 * @edev: cursor variable; receives each entry linked in via its "list" member
 *
 * Thin wrapper around list_for_each_entry().  @pe is parenthesized so
 * that an arbitrary pointer expression (e.g. "base + 1" or "cond ? a : b")
 * binds correctly to the "->" operator instead of being split by
 * operator precedence.
 */
#define eeh_pe_for_each_dev(pe, edev) \
		list_for_each_entry(edev, &(pe)->edevs, list)

G
Gavin Shan 已提交
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94
/*
 * The struct is used to track EEH state for the associated
 * PCI device node or PCI device. In the future, it might
 * represent a PE as well, so that the EEH devices form
 * another tree in addition to the currently existing tree
 * of PCI buses and PCI devices.
 */
/*
 * EEH mode bits, one bit per flag.
 * NOTE(review): presumably OR-ed into eeh_dev.mode; confirm against users.
 */
#define EEH_MODE_SUPPORTED	(1<<0)	/* EEH supported on the device	*/
#define EEH_MODE_NOCHECK	(1<<1)	/* EEH check should be skipped	*/
#define EEH_MODE_ISOLATED	(1<<2)	/* The device has been isolated	*/
#define EEH_MODE_RECOVERING	(1<<3)	/* Recovering the device	*/
#define EEH_MODE_IRQ_DISABLED	(1<<4)	/* Interrupt disabled		*/

struct eeh_dev {
	int mode;			/* EEH mode			*/
	int class_code;			/* Class code of the device	*/
	int config_addr;		/* Config address		*/
	int pe_config_addr;		/* PE config address		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	u32 config_space[16];		/* Saved PCI config space	*/
95 96
	struct eeh_pe *pe;		/* Associated PE		*/
	struct list_head list;		/* Form link list in the PE	*/
G
Gavin Shan 已提交
97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
	struct pci_controller *phb;	/* Associated PHB		*/
	struct device_node *dn;		/* Associated device node	*/
	struct pci_dev *pdev;		/* Associated PCI device	*/
};

/*
 * Return the device-tree node recorded in @edev.
 * @edev is dereferenced unconditionally and must not be NULL.
 */
static inline struct device_node *eeh_dev_to_of_node(struct eeh_dev *edev)
{
	struct device_node *node = edev->dn;

	return node;
}

/*
 * Return the PCI device recorded in @edev.
 * @edev is dereferenced unconditionally and must not be NULL.
 */
static inline struct pci_dev *eeh_dev_to_pci_dev(struct eeh_dev *edev)
{
	struct pci_dev *dev = edev->pdev;

	return dev;
}

112 113 114 115 116 117 118
/*
 * The struct is used to trace the registered EEH operation
 * callback functions. Actually, those operation callback
 * functions are heavily platform dependent. That means the
 * platform should register its own EEH operation callback
 * functions before any EEH further operations.
 */
119 120 121 122
/*
 * Option codes.
 * NOTE(review): presumably the "option" argument of
 * eeh_ops->set_option(); confirm against the platform backends.
 */
#define EEH_OPT_DISABLE		0	/* EEH disable	*/
#define EEH_OPT_ENABLE		1	/* EEH enable	*/
#define EEH_OPT_THAW_MMIO	2	/* MMIO enable	*/
#define EEH_OPT_THAW_DMA	3	/* DMA enable	*/

/*
 * State bits; each flag occupies its own bit so several can be
 * combined in one value.
 * NOTE(review): presumably what eeh_ops->get_state() reports; confirm.
 */
#define EEH_STATE_UNAVAILABLE	(1 << 0)	/* State unavailable	*/
#define EEH_STATE_NOT_SUPPORT	(1 << 1)	/* EEH not supported	*/
#define EEH_STATE_RESET_ACTIVE	(1 << 2)	/* Active reset		*/
#define EEH_STATE_MMIO_ACTIVE	(1 << 3)	/* Active MMIO		*/
#define EEH_STATE_DMA_ACTIVE	(1 << 4)	/* Active DMA		*/
#define EEH_STATE_MMIO_ENABLED	(1 << 5)	/* MMIO enabled		*/
#define EEH_STATE_DMA_ENABLED	(1 << 6)	/* DMA enabled		*/

/*
 * Reset kinds.  Note that the values are 0, 1 and 3; 2 is not defined
 * here.
 * NOTE(review): presumably the "option" argument of eeh_ops->reset().
 */
#define EEH_RESET_DEACTIVATE	0	/* Deactivate the PE reset	*/
#define EEH_RESET_HOT		1	/* Hot reset			*/
#define EEH_RESET_FUNDAMENTAL	3	/* Fundamental reset		*/

/*
 * Error log kinds.
 * NOTE(review): presumably the "severity" argument of eeh_ops->get_log().
 */
#define EEH_LOG_TEMP		1	/* EEH temporary error log	*/
#define EEH_LOG_PERM		2	/* EEH permanent error log	*/
135

136 137 138 139 140 141 142 143 144 145
struct eeh_ops {
	char *name;
	int (*init)(void);
	int (*set_option)(struct device_node *dn, int option);
	int (*get_pe_addr)(struct device_node *dn);
	int (*get_state)(struct device_node *dn, int *state);
	int (*reset)(struct device_node *dn, int option);
	int (*wait_state)(struct device_node *dn, int max_wait);
	int (*get_log)(struct device_node *dn, int severity, char *drv_log, unsigned long len);
	int (*configure_bridge)(struct device_node *dn);
146 147
	int (*read_config)(struct device_node *dn, int where, int size, u32 *val);
	int (*write_config)(struct device_node *dn, int where, int size, u32 val);
148 149 150
};

/* EEH globals; declared here, defined elsewhere. */
extern struct eeh_ops *eeh_ops;		/* Callback table pointer	*/
extern int eeh_subsystem_enabled;	/* Tested by EEH_POSSIBLE_ERROR() */
extern struct mutex eeh_mutex;		/* Taken by eeh_lock()/eeh_unlock() */

/*
 * Acquire the global eeh_mutex via mutex_lock().  Pair every call
 * with eeh_unlock().
 *
 * NOTE(review): this header's own include list does not name
 * <linux/mutex.h>; presumably it is pulled in indirectly or by the
 * includer -- confirm.
 */
static inline void eeh_lock(void)
{
	mutex_lock(&eeh_mutex);
}

/* Release the global eeh_mutex taken by eeh_lock(), via mutex_unlock(). */
static inline void eeh_unlock(void)
{
	mutex_unlock(&eeh_mutex);
}
163

164 165 166 167
/*
 * Max number of EEH freezes allowed before we consider the device
 * to be permanently disabled.
 */
#define EEH_MAX_ALLOWED_FREEZES 5

170
/*
 * Callback type: takes two opaque pointers (@data, @flag) and returns
 * an opaque pointer.
 * NOTE(review): the traversal routines that accept this callback are
 * not declared in this header, so the meaning of the arguments and of
 * the return value has to be checked at the call sites.
 */
typedef void *(*eeh_traverse_func)(void *data, void *flag);
G
Gavin Shan 已提交
171
int __devinit eeh_phb_pe_create(struct pci_controller *phb);
172
int eeh_add_to_parent_pe(struct eeh_dev *edev);
173
int eeh_rmv_from_parent_pe(struct eeh_dev *edev);
G
Gavin Shan 已提交
174

G
Gavin Shan 已提交
175 176
void * __devinit eeh_dev_init(struct device_node *dn, void *data);
void __devinit eeh_dev_phb_init_dynamic(struct pci_controller *phb);
177 178
int __init eeh_ops_register(struct eeh_ops *ops);
int __exit eeh_ops_unregister(const char *name);
L
Linus Torvalds 已提交
179 180 181 182
unsigned long eeh_check_failure(const volatile void __iomem *token,
				unsigned long val);
int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev);
void __init pci_addr_cache_build(void);
183
void eeh_add_device_tree_early(struct device_node *);
184
void eeh_add_device_tree_late(struct pci_bus *);
185 186
void eeh_remove_bus_device(struct pci_dev *);

L
Linus Torvalds 已提交
187 188 189 190 191 192
/**
 * EEH_POSSIBLE_ERROR() -- test for possible MMIO failure.
 * @val:  value that was just read
 * @type: integer type of the access (e.g. u8, u16, u32, u64)
 *
 * True when @val equals the all-ones pattern of @type and
 * eeh_subsystem_enabled is non-zero.  @val is evaluated exactly once.
 *
 * If this macro yields TRUE, the caller relays to eeh_check_failure()
 * which does further tests out of line.
 */
#define EEH_POSSIBLE_ERROR(val, type)	((val) == (type)~0 && eeh_subsystem_enabled)
L
Linus Torvalds 已提交
194 195 196 197 198 199 200 201 202

/*
 * Reads from a device which has been isolated by EEH will return
 * all 1s.  This macro gives an all-1s value of the given size (in
 * bytes: 1, 2, or 4) for comparing with the result of a read.
 *
 * The result has type unsigned int.  Only sizes 1, 2 and 4 are
 * meaningful: the shift count is (4 - size) * 8, so size 0 or a size
 * above 4 produces a shift count that is out of range for a 32-bit
 * unsigned int.
 */
#define EEH_IO_ERROR_VALUE(size)	(~0U >> ((4 - (size)) * 8))

#else /* !CONFIG_EEH */
G
Gavin Shan 已提交
203 204 205 206 207 208 209 210

/* !CONFIG_EEH stub: ignores both arguments and always returns NULL. */
static inline void *eeh_dev_init(struct device_node *dn, void *data)
{
	return NULL;
}

/* !CONFIG_EEH stub: does nothing. */
static inline void eeh_dev_phb_init_dynamic(struct pci_controller *phb) { }

L
Linus Torvalds 已提交
211 212 213 214 215 216 217 218 219 220 221 222
/*
 * !CONFIG_EEH stub: no check is performed; @val is returned unchanged
 * and @token is ignored.
 */
static inline unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned long val)
{
	return val;
}

/* !CONFIG_EEH stub: ignores both arguments and always returns 0. */
static inline int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev)
{
	return 0;
}

/* !CONFIG_EEH stub: does nothing. */
static inline void pci_addr_cache_build(void) { }

223 224
/* !CONFIG_EEH stub: does nothing. */
static inline void eeh_add_device_tree_early(struct device_node *dn) { }

225 226
/* !CONFIG_EEH stub: does nothing. */
static inline void eeh_add_device_tree_late(struct pci_bus *bus) { }

227
/* !CONFIG_EEH stub: does nothing. */
static inline void eeh_remove_bus_device(struct pci_dev *dev) { }
G
Gavin Shan 已提交
228 229 230 231

/* !CONFIG_EEH stubs: there is no eeh_mutex to take, so both are no-ops. */
static inline void eeh_lock(void) { }
static inline void eeh_unlock(void) { }

L
Linus Torvalds 已提交
232 233 234 235
/*
 * !CONFIG_EEH variants.  EEH_POSSIBLE_ERROR() is the constant 0 and
 * does not evaluate its arguments, so the error branch in the
 * accessors below is never taken.  EEH_IO_ERROR_VALUE() ignores @size
 * and yields -1UL (all ones, unsigned long), unlike the CONFIG_EEH
 * version which narrows the pattern to @size bytes.
 */
#define EEH_POSSIBLE_ERROR(val, type) (0)
#define EEH_IO_ERROR_VALUE(size) (-1UL)
#endif /* CONFIG_EEH */

236
#ifdef CONFIG_PPC64
237
/*
L
Linus Torvalds 已提交
238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262
 * MMIO read/write operations with EEH support.
 */
/*
 * Read one byte from @addr with in_8().  A value that is not flagged
 * by EEH_POSSIBLE_ERROR() is returned as is; otherwise the value is
 * passed to eeh_check_failure() and that function's result (narrowed
 * to u8) is returned instead.
 */
static inline u8 eeh_readb(const volatile void __iomem *addr)
{
	u8 raw = in_8(addr);

	if (!EEH_POSSIBLE_ERROR(raw, u8))
		return raw;

	return eeh_check_failure(addr, raw);
}

/*
 * Read a 16-bit value from @addr with in_le16().  A value that is not
 * flagged by EEH_POSSIBLE_ERROR() is returned as is; otherwise the
 * value is passed to eeh_check_failure() and that function's result
 * (narrowed to u16) is returned instead.
 */
static inline u16 eeh_readw(const volatile void __iomem *addr)
{
	u16 raw = in_le16(addr);

	if (!EEH_POSSIBLE_ERROR(raw, u16))
		return raw;

	return eeh_check_failure(addr, raw);
}

/*
 * Read a 32-bit value from @addr with in_le32().  A value that is not
 * flagged by EEH_POSSIBLE_ERROR() is returned as is; otherwise the
 * value is passed to eeh_check_failure() and that function's result
 * (narrowed to u32) is returned instead.
 */
static inline u32 eeh_readl(const volatile void __iomem *addr)
{
	u32 raw = in_le32(addr);

	if (!EEH_POSSIBLE_ERROR(raw, u32))
		return raw;

	return eeh_check_failure(addr, raw);
}
263 264

/*
 * Read a 64-bit value from @addr with in_le64().  A value that is not
 * flagged by EEH_POSSIBLE_ERROR() is returned as is; otherwise the
 * value is passed to eeh_check_failure() and that function's result
 * is returned instead.
 */
static inline u64 eeh_readq(const volatile void __iomem *addr)
{
	u64 raw = in_le64(addr);

	if (!EEH_POSSIBLE_ERROR(raw, u64))
		return raw;

	return eeh_check_failure(addr, raw);
}

272
/*
 * Read a 16-bit value from @addr with in_be16().  A value that is not
 * flagged by EEH_POSSIBLE_ERROR() is returned as is; otherwise the
 * value is passed to eeh_check_failure() and that function's result
 * (narrowed to u16) is returned instead.
 */
static inline u16 eeh_readw_be(const volatile void __iomem *addr)
{
	u16 raw = in_be16(addr);

	if (!EEH_POSSIBLE_ERROR(raw, u16))
		return raw;

	return eeh_check_failure(addr, raw);
}
279 280

/*
 * Read a 32-bit value from @addr with in_be32().  A value that is not
 * flagged by EEH_POSSIBLE_ERROR() is returned as is; otherwise the
 * value is passed to eeh_check_failure() and that function's result
 * (narrowed to u32) is returned instead.
 */
static inline u32 eeh_readl_be(const volatile void __iomem *addr)
{
	u32 raw = in_be32(addr);

	if (!EEH_POSSIBLE_ERROR(raw, u32))
		return raw;

	return eeh_check_failure(addr, raw);
}
287 288

/*
 * Read a 64-bit value from @addr with in_be64().  A value that is not
 * flagged by EEH_POSSIBLE_ERROR() is returned as is; otherwise the
 * value is passed to eeh_check_failure() and that function's result
 * is returned instead.
 */
static inline u64 eeh_readq_be(const volatile void __iomem *addr)
{
	u64 raw = in_be64(addr);

	if (!EEH_POSSIBLE_ERROR(raw, u64))
		return raw;

	return eeh_check_failure(addr, raw);
}

296 297
/*
 * Copy @n bytes from MMIO space at @src to @dest with
 * _memcpy_fromio(), then look at the copied data for the all-ones
 * pattern.
 *
 * Only the last four bytes of the destination are inspected, and only
 * when at least four bytes were copied; shorter copies are not checked
 * at all.  When the tail is flagged by EEH_POSSIBLE_ERROR(),
 * eeh_check_failure() is called for @src; its return value is
 * ignored, so @dest is left as copied.
 */
static inline void eeh_memcpy_fromio(void *dest, const
				     volatile void __iomem *src,
				     unsigned long n)
{
	_memcpy_fromio(dest, src, n);

	/* Look for ffff's in the last four bytes, dest[n - 4 .. n - 1]. */
	if (n >= 4 && EEH_POSSIBLE_ERROR(*((u32 *)(dest + n - 4)), u32))
		eeh_check_failure(src, *((u32 *)(dest + n - 4)));
}

/* in-string eeh macros */
310 311
/*
 * Read @ns bytes from @addr into @buf with _insb(), then test the
 * last byte stored for the all-ones pattern.  When it is flagged by
 * EEH_POSSIBLE_ERROR(), eeh_check_failure() is called for @addr (with
 * the first byte of @buf as the value); its return value is ignored.
 *
 * The check is skipped when @ns is not positive: nothing is assumed to
 * have been stored in that case, and indexing buf[ns - 1] would read
 * outside the buffer.
 */
static inline void eeh_readsb(const volatile void __iomem *addr, void * buf,
			      int ns)
{
	_insb(addr, buf, ns);
	if (ns > 0 && EEH_POSSIBLE_ERROR((*(((u8*)buf)+ns-1)), u8))
		eeh_check_failure(addr, *(u8*)buf);
}

318 319
/*
 * Read @ns 16-bit items from @addr into @buf with _insw(), then test
 * the last item stored for the all-ones pattern.  When it is flagged
 * by EEH_POSSIBLE_ERROR(), eeh_check_failure() is called for @addr
 * (with the first item of @buf as the value); its return value is
 * ignored.
 *
 * The check is skipped when @ns is not positive: nothing is assumed to
 * have been stored in that case, and indexing buf[ns - 1] would read
 * outside the buffer.
 */
static inline void eeh_readsw(const volatile void __iomem *addr, void * buf,
			      int ns)
{
	_insw(addr, buf, ns);
	if (ns > 0 && EEH_POSSIBLE_ERROR((*(((u16*)buf)+ns-1)), u16))
		eeh_check_failure(addr, *(u16*)buf);
}

326 327
/*
 * Read @nl 32-bit items from @addr into @buf with _insl(), then test
 * the last item stored for the all-ones pattern.  When it is flagged
 * by EEH_POSSIBLE_ERROR(), eeh_check_failure() is called for @addr
 * (with the first item of @buf as the value); its return value is
 * ignored.
 *
 * The check is skipped when @nl is not positive: nothing is assumed to
 * have been stored in that case, and indexing buf[nl - 1] would read
 * outside the buffer.
 */
static inline void eeh_readsl(const volatile void __iomem *addr, void * buf,
			      int nl)
{
	_insl(addr, buf, nl);
	if (nl > 0 && EEH_POSSIBLE_ERROR((*(((u32*)buf)+nl-1)), u32))
		eeh_check_failure(addr, *(u32*)buf);
}

334
#endif /* CONFIG_PPC64 */
335
#endif /* __KERNEL__ */
336
#endif /* _POWERPC_EEH_H */