eeh.h 10.7 KB
Newer Older
1
/*
L
Linus Torvalds 已提交
2
 * Copyright (C) 2001  Dave Engebretsen & Todd Inglett IBM Corporation.
3
 * Copyright 2001-2012 IBM Corporation.
L
Linus Torvalds 已提交
4 5 6 7 8
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
9
 *
L
Linus Torvalds 已提交
10 11 12 13
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
14
 *
L
Linus Torvalds 已提交
15 16 17 18 19
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 */

20 21
#ifndef _POWERPC_EEH_H
#define _POWERPC_EEH_H
22
#ifdef __KERNEL__
L
Linus Torvalds 已提交
23 24 25 26 27 28

#include <linux/init.h>
#include <linux/list.h>
#include <linux/string.h>

struct pci_dev;
29
struct pci_bus;
L
Linus Torvalds 已提交
30 31 32 33
struct device_node;

#ifdef CONFIG_EEH

34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
/*
 * The struct is used to trace PE related EEH functionality.
 * In theory, there will have one instance of the struct to
 * be created against particular PE. In nature, PEs corelate
 * to each other. the struct has to reflect that hierarchy in
 * order to easily pick up those affected PEs when one particular
 * PE has EEH errors.
 *
 * Also, one particular PE might be composed of PCI device, PCI
 * bus and its subordinate components. The struct also need ship
 * the information. Further more, one particular PE is only meaingful
 * in the corresponding PHB. Therefore, the root PEs should be created
 * against existing PHBs in on-to-one fashion.
 */
#define EEH_PE_PHB	1	/* PHB PE    */
#define EEH_PE_DEVICE 	2	/* Device PE */
#define EEH_PE_BUS	3	/* Bus PE    */

#define EEH_PE_ISOLATED		(1 << 0)	/* Isolated PE		*/
#define EEH_PE_RECOVERING	(1 << 1)	/* Recovering PE	*/

struct eeh_pe {
	int type;			/* PE type: PHB/Bus/Device	*/
	int state;			/* PE EEH dependent mode	*/
	int config_addr;		/* Traditional PCI address	*/
	int addr;			/* PE configuration address	*/
	struct pci_controller *phb;	/* Associated PHB		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	struct eeh_pe *parent;		/* Parent PE			*/
	struct list_head child_list;	/* Link PE to the child list	*/
	struct list_head edevs;		/* Link list of EEH devices	*/
	struct list_head child;		/* Child PEs			*/
};

70 71 72
#define eeh_pe_for_each_dev(pe, edev) \
		list_for_each_entry(edev, &pe->edevs, list)

G
Gavin Shan 已提交
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94
/*
 * The struct is used to trace EEH state for the associated
 * PCI device node or PCI device. In future, it might
 * represent PE as well so that the EEH device to form
 * another tree except the currently existing tree of PCI
 * buses and PCI devices
 */
#define EEH_MODE_SUPPORTED	(1<<0)	/* EEH supported on the device	*/
#define EEH_MODE_NOCHECK	(1<<1)	/* EEH check should be skipped	*/
#define EEH_MODE_ISOLATED	(1<<2)	/* The device has been isolated	*/
#define EEH_MODE_RECOVERING	(1<<3)	/* Recovering the device	*/
#define EEH_MODE_IRQ_DISABLED	(1<<4)	/* Interrupt disabled		*/

struct eeh_dev {
	int mode;			/* EEH mode			*/
	int class_code;			/* Class code of the device	*/
	int config_addr;		/* Config address		*/
	int pe_config_addr;		/* PE config address		*/
	int check_count;		/* Times of ignored error	*/
	int freeze_count;		/* Times of froze up		*/
	int false_positives;		/* Times of reported #ff's	*/
	u32 config_space[16];		/* Saved PCI config space	*/
95 96
	struct eeh_pe *pe;		/* Associated PE		*/
	struct list_head list;		/* Form link list in the PE	*/
G
Gavin Shan 已提交
97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
	struct pci_controller *phb;	/* Associated PHB		*/
	struct device_node *dn;		/* Associated device node	*/
	struct pci_dev *pdev;		/* Associated PCI device	*/
};

static inline struct device_node *eeh_dev_to_of_node(struct eeh_dev *edev)
{
	return edev->dn;
}

static inline struct pci_dev *eeh_dev_to_pci_dev(struct eeh_dev *edev)
{
	return edev->pdev;
}

112 113 114 115 116 117 118
/*
 * The struct is used to trace the registered EEH operation
 * callback functions. Actually, those operation callback
 * functions are heavily platform dependent. That means the
 * platform should register its own EEH operation callback
 * functions before any EEH further operations.
 */
119 120 121 122
#define EEH_OPT_DISABLE		0	/* EEH disable	*/
#define EEH_OPT_ENABLE		1	/* EEH enable	*/
#define EEH_OPT_THAW_MMIO	2	/* MMIO enable	*/
#define EEH_OPT_THAW_DMA	3	/* DMA enable	*/
123 124 125 126 127 128 129
#define EEH_STATE_UNAVAILABLE	(1 << 0)	/* State unavailable	*/
#define EEH_STATE_NOT_SUPPORT	(1 << 1)	/* EEH not supported	*/
#define EEH_STATE_RESET_ACTIVE	(1 << 2)	/* Active reset		*/
#define EEH_STATE_MMIO_ACTIVE	(1 << 3)	/* Active MMIO		*/
#define EEH_STATE_DMA_ACTIVE	(1 << 4)	/* Active DMA		*/
#define EEH_STATE_MMIO_ENABLED	(1 << 5)	/* MMIO enabled		*/
#define EEH_STATE_DMA_ENABLED	(1 << 6)	/* DMA enabled		*/
130 131 132
#define EEH_RESET_DEACTIVATE	0	/* Deactivate the PE reset	*/
#define EEH_RESET_HOT		1	/* Hot reset			*/
#define EEH_RESET_FUNDAMENTAL	3	/* Fundamental reset		*/
133 134
#define EEH_LOG_TEMP		1	/* EEH temporary error log	*/
#define EEH_LOG_PERM		2	/* EEH permanent error log	*/
135

136 137 138
struct eeh_ops {
	char *name;
	int (*init)(void);
139 140 141 142 143 144 145
	int (*set_option)(struct eeh_pe *pe, int option);
	int (*get_pe_addr)(struct eeh_pe *pe);
	int (*get_state)(struct eeh_pe *pe, int *state);
	int (*reset)(struct eeh_pe *pe, int option);
	int (*wait_state)(struct eeh_pe *pe, int max_wait);
	int (*get_log)(struct eeh_pe *pe, int severity, char *drv_log, unsigned long len);
	int (*configure_bridge)(struct eeh_pe *pe);
146 147
	int (*read_config)(struct device_node *dn, int where, int size, u32 *val);
	int (*write_config)(struct device_node *dn, int where, int size, u32 val);
148 149 150
};

extern struct eeh_ops *eeh_ops;
151
extern int eeh_subsystem_enabled;
G
Gavin Shan 已提交
152 153 154 155 156 157 158 159 160 161 162
extern struct mutex eeh_mutex;

static inline void eeh_lock(void)
{
	mutex_lock(&eeh_mutex);
}

static inline void eeh_unlock(void)
{
	mutex_unlock(&eeh_mutex);
}
163

164 165 166 167
/*
 * Max number of EEH freezes allowed before we consider the device
 * to be permanently disabled.
 */
168 169
#define EEH_MAX_ALLOWED_FREEZES 5

170
typedef void *(*eeh_traverse_func)(void *data, void *flag);
G
Gavin Shan 已提交
171
int __devinit eeh_phb_pe_create(struct pci_controller *phb);
172
int eeh_add_to_parent_pe(struct eeh_dev *edev);
173
int eeh_rmv_from_parent_pe(struct eeh_dev *edev);
174 175 176
void *eeh_pe_dev_traverse(struct eeh_pe *root,
		eeh_traverse_func fn, void *flag);
void eeh_pe_restore_bars(struct eeh_pe *pe);
177
struct pci_bus *eeh_pe_bus_get(struct eeh_pe *pe);
G
Gavin Shan 已提交
178

G
Gavin Shan 已提交
179 180
void * __devinit eeh_dev_init(struct device_node *dn, void *data);
void __devinit eeh_dev_phb_init_dynamic(struct pci_controller *phb);
181 182
int __init eeh_ops_register(struct eeh_ops *ops);
int __exit eeh_ops_unregister(const char *name);
L
Linus Torvalds 已提交
183 184 185 186
unsigned long eeh_check_failure(const volatile void __iomem *token,
				unsigned long val);
int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev);
void __init pci_addr_cache_build(void);
187
void eeh_add_device_tree_early(struct device_node *);
188
void eeh_add_device_tree_late(struct pci_bus *);
189 190
void eeh_remove_bus_device(struct pci_dev *);

L
Linus Torvalds 已提交
191 192 193 194 195 196
/**
 * EEH_POSSIBLE_ERROR() -- test for possible MMIO failure.
 *
 * If this macro yields TRUE, the caller relays to eeh_check_failure()
 * which does further tests out of line.
 */
197
#define EEH_POSSIBLE_ERROR(val, type)	((val) == (type)~0 && eeh_subsystem_enabled)
L
Linus Torvalds 已提交
198 199 200 201 202 203 204 205 206

/*
 * Reads from a device which has been isolated by EEH will return
 * all 1s.  This macro gives an all-1s value of the given size (in
 * bytes: 1, 2, or 4) for comparing with the result of a read.
 */
#define EEH_IO_ERROR_VALUE(size)	(~0U >> ((4 - (size)) * 8))

#else /* !CONFIG_EEH */
G
Gavin Shan 已提交
207 208 209 210 211 212 213 214

static inline void *eeh_dev_init(struct device_node *dn, void *data)
{
	return NULL;
}

static inline void eeh_dev_phb_init_dynamic(struct pci_controller *phb) { }

L
Linus Torvalds 已提交
215 216 217 218 219 220 221 222 223 224 225 226
static inline unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned long val)
{
	return val;
}

static inline int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev)
{
	return 0;
}

static inline void pci_addr_cache_build(void) { }

227 228
static inline void eeh_add_device_tree_early(struct device_node *dn) { }

229 230
static inline void eeh_add_device_tree_late(struct pci_bus *bus) { }

231
static inline void eeh_remove_bus_device(struct pci_dev *dev) { }
G
Gavin Shan 已提交
232 233 234 235

static inline void eeh_lock(void) { }
static inline void eeh_unlock(void) { }

L
Linus Torvalds 已提交
236 237 238 239
#define EEH_POSSIBLE_ERROR(val, type) (0)
#define EEH_IO_ERROR_VALUE(size) (-1UL)
#endif /* CONFIG_EEH */

240
#ifdef CONFIG_PPC64
241
/*
L
Linus Torvalds 已提交
242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266
 * MMIO read/write operations with EEH support.
 */
static inline u8 eeh_readb(const volatile void __iomem *addr)
{
	u8 val = in_8(addr);
	if (EEH_POSSIBLE_ERROR(val, u8))
		return eeh_check_failure(addr, val);
	return val;
}

static inline u16 eeh_readw(const volatile void __iomem *addr)
{
	u16 val = in_le16(addr);
	if (EEH_POSSIBLE_ERROR(val, u16))
		return eeh_check_failure(addr, val);
	return val;
}

static inline u32 eeh_readl(const volatile void __iomem *addr)
{
	u32 val = in_le32(addr);
	if (EEH_POSSIBLE_ERROR(val, u32))
		return eeh_check_failure(addr, val);
	return val;
}
267 268

static inline u64 eeh_readq(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
269
{
270 271
	u64 val = in_le64(addr);
	if (EEH_POSSIBLE_ERROR(val, u64))
L
Linus Torvalds 已提交
272 273 274 275
		return eeh_check_failure(addr, val);
	return val;
}

276
static inline u16 eeh_readw_be(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
277
{
278 279
	u16 val = in_be16(addr);
	if (EEH_POSSIBLE_ERROR(val, u16))
L
Linus Torvalds 已提交
280 281 282
		return eeh_check_failure(addr, val);
	return val;
}
283 284

static inline u32 eeh_readl_be(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
285
{
286 287 288 289
	u32 val = in_be32(addr);
	if (EEH_POSSIBLE_ERROR(val, u32))
		return eeh_check_failure(addr, val);
	return val;
L
Linus Torvalds 已提交
290
}
291 292

static inline u64 eeh_readq_be(const volatile void __iomem *addr)
L
Linus Torvalds 已提交
293 294 295 296 297 298 299
{
	u64 val = in_be64(addr);
	if (EEH_POSSIBLE_ERROR(val, u64))
		return eeh_check_failure(addr, val);
	return val;
}

300 301
static inline void eeh_memcpy_fromio(void *dest, const
				     volatile void __iomem *src,
L
Linus Torvalds 已提交
302 303
				     unsigned long n)
{
304
	_memcpy_fromio(dest, src, n);
L
Linus Torvalds 已提交
305 306 307 308

	/* Look for ffff's here at dest[n].  Assume that at least 4 bytes
	 * were copied. Check all four bytes.
	 */
309 310
	if (n >= 4 && EEH_POSSIBLE_ERROR(*((u32 *)(dest + n - 4)), u32))
		eeh_check_failure(src, *((u32 *)(dest + n - 4)));
L
Linus Torvalds 已提交
311 312 313
}

/* in-string eeh macros */
314 315
static inline void eeh_readsb(const volatile void __iomem *addr, void * buf,
			      int ns)
L
Linus Torvalds 已提交
316
{
317
	_insb(addr, buf, ns);
L
Linus Torvalds 已提交
318
	if (EEH_POSSIBLE_ERROR((*(((u8*)buf)+ns-1)), u8))
319
		eeh_check_failure(addr, *(u8*)buf);
L
Linus Torvalds 已提交
320 321
}

322 323
static inline void eeh_readsw(const volatile void __iomem *addr, void * buf,
			      int ns)
L
Linus Torvalds 已提交
324
{
325
	_insw(addr, buf, ns);
L
Linus Torvalds 已提交
326
	if (EEH_POSSIBLE_ERROR((*(((u16*)buf)+ns-1)), u16))
327
		eeh_check_failure(addr, *(u16*)buf);
L
Linus Torvalds 已提交
328 329
}

330 331
static inline void eeh_readsl(const volatile void __iomem *addr, void * buf,
			      int nl)
L
Linus Torvalds 已提交
332
{
333
	_insl(addr, buf, nl);
L
Linus Torvalds 已提交
334
	if (EEH_POSSIBLE_ERROR((*(((u32*)buf)+nl-1)), u32))
335
		eeh_check_failure(addr, *(u32*)buf);
L
Linus Torvalds 已提交
336 337
}

338
#endif /* CONFIG_PPC64 */
339
#endif /* __KERNEL__ */
340
#endif /* _POWERPC_EEH_H */