blob: 09a8743143f37a046e8d57e3d65f58f9a1bd3cb4 [file] [log] [blame]
Linas Vepstas172ca922005-11-03 18:50:04 -06001/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * Copyright (C) 2001 Dave Engebretsen & Todd Inglett IBM Corporation.
Gavin Shancb3bc9d2012-02-27 20:03:51 +00003 * Copyright 2001-2012 IBM Corporation.
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
Linas Vepstas172ca922005-11-03 18:50:04 -06009 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070010 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
Linas Vepstas172ca922005-11-03 18:50:04 -060014 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070015 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
18 */
19
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +000020#ifndef _POWERPC_EEH_H
21#define _POWERPC_EEH_H
Arnd Bergmann88ced032005-12-16 22:43:46 +010022#ifdef __KERNEL__
Linus Torvalds1da177e2005-04-16 15:20:36 -070023
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include <linux/init.h>
25#include <linux/list.h>
26#include <linux/string.h>
Gavin Shan5a719782013-06-20 13:21:01 +080027#include <linux/time.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29struct pci_dev;
John Rose827c1a62006-02-24 11:34:23 -060030struct pci_bus;
Linus Torvalds1da177e2005-04-16 15:20:36 -070031struct device_node;
Linus Torvalds1da177e2005-04-16 15:20:36 -070032
33#ifdef CONFIG_EEH
34
/*
 * The struct is used to trace PE related EEH functionality.
 * In theory, there will be one instance of the struct
 * created for each particular PE. By nature, PEs correlate
 * to each other. The struct has to reflect that hierarchy in
 * order to easily pick up the affected PEs when one particular
 * PE has EEH errors.
 *
 * Also, one particular PE might be composed of a PCI device, or a
 * PCI bus and its subordinate components. The struct also needs to
 * carry that information. Furthermore, one particular PE is only
 * meaningful in the corresponding PHB. Therefore, the root PEs should
 * be created against existing PHBs in one-to-one fashion.
 */
/* PE type flags (see the 'type' member of struct eeh_pe). */
#define EEH_PE_INVALID	(1 << 0)	/* Invalid		*/
#define EEH_PE_PHB	(1 << 1)	/* PHB PE		*/
#define EEH_PE_DEVICE	(1 << 2)	/* Device PE		*/
#define EEH_PE_BUS	(1 << 3)	/* Bus PE		*/

/*
 * PE state flags.
 * NOTE(review): presumably kept in the 'state' member of struct eeh_pe;
 * they reuse the same bit positions as the type flags above, so the two
 * sets must never be mixed in one field -- confirm against the users.
 */
#define EEH_PE_ISOLATED		(1 << 0)	/* Isolated PE		*/
#define EEH_PE_RECOVERING	(1 << 1)	/* Recovering PE	*/
#define EEH_PE_PHB_DEAD		(1 << 2)	/* Dead PHB		*/
Gavin Shan968f9682012-09-07 22:44:05 +000057
58struct eeh_pe {
59 int type; /* PE type: PHB/Bus/Device */
60 int state; /* PE EEH dependent mode */
61 int config_addr; /* Traditional PCI address */
62 int addr; /* PE configuration address */
63 struct pci_controller *phb; /* Associated PHB */
Gavin Shan8cdb2832013-06-20 13:20:55 +080064 struct pci_bus *bus; /* Top PCI bus for bus PE */
Gavin Shan968f9682012-09-07 22:44:05 +000065 int check_count; /* Times of ignored error */
66 int freeze_count; /* Times of froze up */
Gavin Shan5a719782013-06-20 13:21:01 +080067 struct timeval tstamp; /* Time on first-time freeze */
Gavin Shan968f9682012-09-07 22:44:05 +000068 int false_positives; /* Times of reported #ff's */
69 struct eeh_pe *parent; /* Parent PE */
70 struct list_head child_list; /* Link PE to the child list */
71 struct list_head edevs; /* Link list of EEH devices */
72 struct list_head child; /* Child PEs */
73};
74
/*
 * Walk every EEH device attached to a PE.
 *
 * @pe:   pointer to the struct eeh_pe whose 'edevs' list is traversed
 * @edev: struct eeh_dev * used as the loop cursor; entries are linked
 *        through their 'list' member
 *
 * @pe is parenthesized in the expansion so that any pointer-valued
 * expression (e.g. "pes + 1") can be passed, not just a plain identifier.
 */
#define eeh_pe_for_each_dev(pe, edev) \
	list_for_each_entry(edev, &(pe)->edevs, list)
77
/*
 * The struct is used to trace EEH state for the associated
 * PCI device node or PCI device. In future, it might
 * represent a PE as well, so that the EEH devices form
 * another tree besides the currently existing tree of PCI
 * buses and PCI devices.
 */
Gavin Shandbbceee2012-09-07 22:44:20 +000085#define EEH_DEV_IRQ_DISABLED (1<<0) /* Interrupt disabled */
Gavin Shaneb740b52012-02-27 20:04:04 +000086
87struct eeh_dev {
88 int mode; /* EEH mode */
89 int class_code; /* Class code of the device */
90 int config_addr; /* Config address */
91 int pe_config_addr; /* PE config address */
Gavin Shaneb740b52012-02-27 20:04:04 +000092 u32 config_space[16]; /* Saved PCI config space */
Gavin Shan968f9682012-09-07 22:44:05 +000093 struct eeh_pe *pe; /* Associated PE */
94 struct list_head list; /* Form link list in the PE */
Gavin Shaneb740b52012-02-27 20:04:04 +000095 struct pci_controller *phb; /* Associated PHB */
96 struct device_node *dn; /* Associated device node */
97 struct pci_dev *pdev; /* Associated PCI device */
98};
99
100static inline struct device_node *eeh_dev_to_of_node(struct eeh_dev *edev)
101{
Gavin Shan2d5c1212013-06-05 15:34:03 +0800102 return edev ? edev->dn : NULL;
Gavin Shaneb740b52012-02-27 20:04:04 +0000103}
104
105static inline struct pci_dev *eeh_dev_to_pci_dev(struct eeh_dev *edev)
106{
Gavin Shan2d5c1212013-06-05 15:34:03 +0800107 return edev ? edev->pdev : NULL;
Gavin Shaneb740b52012-02-27 20:04:04 +0000108}
109
/*
 * The struct is used to trace the registered EEH operation
 * callback functions. Those callbacks are heavily platform
 * dependent, which means the platform should register its
 * own EEH operation callback functions before any further
 * EEH operations.
 */
/* Options -- presumably the 'option' argument of eeh_ops->set_option(). */
#define EEH_OPT_DISABLE		0	/* EEH disable	*/
#define EEH_OPT_ENABLE		1	/* EEH enable	*/
#define EEH_OPT_THAW_MMIO	2	/* MMIO enable	*/
#define EEH_OPT_THAW_DMA	3	/* DMA enable	*/

/* PE state bits; these are flags and may be OR-ed together. */
#define EEH_STATE_UNAVAILABLE	(1 << 0)	/* State unavailable	*/
#define EEH_STATE_NOT_SUPPORT	(1 << 1)	/* EEH not supported	*/
#define EEH_STATE_RESET_ACTIVE	(1 << 2)	/* Active reset		*/
#define EEH_STATE_MMIO_ACTIVE	(1 << 3)	/* Active MMIO		*/
#define EEH_STATE_DMA_ACTIVE	(1 << 4)	/* Active DMA		*/
#define EEH_STATE_MMIO_ENABLED	(1 << 5)	/* MMIO enabled		*/
#define EEH_STATE_DMA_ENABLED	(1 << 6)	/* DMA enabled		*/

/* Reset kinds -- note the values are not consecutive (0, 1, 3). */
#define EEH_RESET_DEACTIVATE	0	/* Deactivate the PE reset	*/
#define EEH_RESET_HOT		1	/* Hot reset			*/
#define EEH_RESET_FUNDAMENTAL	3	/* Fundamental reset		*/

/* Log severities -- presumably the 'severity' argument of get_log(). */
#define EEH_LOG_TEMP		1	/* EEH temporary error log	*/
#define EEH_LOG_PERM		2	/* EEH permanent error log	*/
Gavin Shaneb594a42012-02-27 20:03:57 +0000133
Gavin Shanaa1e6372012-02-27 20:03:53 +0000134struct eeh_ops {
135 char *name;
136 int (*init)(void);
Gavin Shan21fd21f2013-06-20 13:20:57 +0800137 int (*post_init)(void);
Gavin Shand7bb8862012-09-07 22:44:21 +0000138 void* (*of_probe)(struct device_node *dn, void *flag);
Gavin Shan51fb5f52013-06-20 13:20:56 +0800139 int (*dev_probe)(struct pci_dev *dev, void *flag);
Gavin Shan371a3952012-09-07 22:44:14 +0000140 int (*set_option)(struct eeh_pe *pe, int option);
141 int (*get_pe_addr)(struct eeh_pe *pe);
142 int (*get_state)(struct eeh_pe *pe, int *state);
143 int (*reset)(struct eeh_pe *pe, int option);
144 int (*wait_state)(struct eeh_pe *pe, int max_wait);
145 int (*get_log)(struct eeh_pe *pe, int severity, char *drv_log, unsigned long len);
146 int (*configure_bridge)(struct eeh_pe *pe);
Gavin Shan37804442012-02-27 20:04:11 +0000147 int (*read_config)(struct device_node *dn, int where, int size, u32 *val);
148 int (*write_config)(struct device_node *dn, int where, int size, u32 val);
Gavin Shan8a6b1bc2013-06-20 13:21:04 +0800149 int (*next_error)(struct eeh_pe **pe);
Gavin Shanaa1e6372012-02-27 20:03:53 +0000150};
151
152extern struct eeh_ops *eeh_ops;
David Woodhouse1e28a7d2005-11-17 00:44:03 +0000153extern int eeh_subsystem_enabled;
Gavin Shan49075812013-06-20 13:21:03 +0800154extern raw_spinlock_t confirm_error_lock;
Gavin Shand7bb8862012-09-07 22:44:21 +0000155extern int eeh_probe_mode;
156
157#define EEH_PROBE_MODE_DEV (1<<0) /* From PCI device */
158#define EEH_PROBE_MODE_DEVTREE (1<<1) /* From device tree */
159
160static inline void eeh_probe_mode_set(int flag)
161{
162 eeh_probe_mode = flag;
163}
164
165static inline int eeh_probe_mode_devtree(void)
166{
167 return (eeh_probe_mode == EEH_PROBE_MODE_DEVTREE);
168}
169
170static inline int eeh_probe_mode_dev(void)
171{
172 return (eeh_probe_mode == EEH_PROBE_MODE_DEV);
173}
Gavin Shan646a8492012-09-07 22:44:06 +0000174
Gavin Shan49075812013-06-20 13:21:03 +0800175static inline void eeh_serialize_lock(unsigned long *flags)
176{
177 raw_spin_lock_irqsave(&confirm_error_lock, *flags);
178}
179
180static inline void eeh_serialize_unlock(unsigned long flags)
181{
182 raw_spin_unlock_irqrestore(&confirm_error_lock, flags);
183}
184
/*
 * Max number of EEH freezes allowed before we consider the device
 * to be permanently disabled.
 */
#define EEH_MAX_ALLOWED_FREEZES 5
190
Gavin Shan22f4ab12012-09-07 22:44:08 +0000191typedef void *(*eeh_traverse_func)(void *data, void *flag);
Greg Kroah-Hartmancad5cef2012-12-21 14:04:10 -0800192int eeh_phb_pe_create(struct pci_controller *phb);
Gavin Shan9ff67432013-06-20 13:20:53 +0800193struct eeh_pe *eeh_phb_pe_get(struct pci_controller *phb);
Gavin Shan01566802013-06-20 13:20:54 +0800194struct eeh_pe *eeh_pe_get(struct eeh_dev *edev);
Gavin Shan9b843482012-09-07 22:44:09 +0000195int eeh_add_to_parent_pe(struct eeh_dev *edev);
Gavin Shan20ee6a92012-09-11 19:16:17 +0000196int eeh_rmv_from_parent_pe(struct eeh_dev *edev, int purge_pe);
Gavin Shan5a719782013-06-20 13:21:01 +0800197void eeh_pe_update_time_stamp(struct eeh_pe *pe);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000198void *eeh_pe_dev_traverse(struct eeh_pe *root,
199 eeh_traverse_func fn, void *flag);
200void eeh_pe_restore_bars(struct eeh_pe *pe);
Gavin Shan9b3c76f2012-09-07 22:44:19 +0000201struct pci_bus *eeh_pe_bus_get(struct eeh_pe *pe);
Gavin Shan55037d12012-09-07 22:44:07 +0000202
Greg Kroah-Hartmancad5cef2012-12-21 14:04:10 -0800203void *eeh_dev_init(struct device_node *dn, void *data);
204void eeh_dev_phb_init_dynamic(struct pci_controller *phb);
Gavin Shaneeb63612013-06-27 13:46:47 +0800205int eeh_init(void);
Gavin Shanaa1e6372012-02-27 20:03:53 +0000206int __init eeh_ops_register(struct eeh_ops *ops);
207int __exit eeh_ops_unregister(const char *name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208unsigned long eeh_check_failure(const volatile void __iomem *token,
209 unsigned long val);
Gavin Shanf8f7d632012-09-07 22:44:22 +0000210int eeh_dev_check_failure(struct eeh_dev *edev);
Gavin Shaneeb63612013-06-27 13:46:47 +0800211void eeh_addr_cache_build(void);
Linas Vepstase2a296e2005-11-03 18:51:31 -0600212void eeh_add_device_tree_early(struct device_node *);
John Rose827c1a62006-02-24 11:34:23 -0600213void eeh_add_device_tree_late(struct pci_bus *);
Thadeu Lima de Souza Cascardo6a040ce2012-12-28 09:13:19 +0000214void eeh_add_sysfs_files(struct pci_bus *);
Gavin Shan20ee6a92012-09-11 19:16:17 +0000215void eeh_remove_bus_device(struct pci_dev *, int);
Linas Vepstase2a296e2005-11-03 18:51:31 -0600216
/**
 * EEH_POSSIBLE_ERROR() -- test for possible MMIO failure.
 * @val:  value that was just read
 * @type: integer type of the access (e.g. u8, u16, u32, u64)
 *
 * Yields TRUE when @val is all ones for @type and the EEH subsystem is
 * enabled. In that case the caller relays to eeh_check_failure(),
 * which does further tests out of line.
 */
#define EEH_POSSIBLE_ERROR(val, type)	((val) == (type)~0 && eeh_subsystem_enabled)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224
/*
 * Reads from a device which has been isolated by EEH will return
 * all 1s. This macro gives an all-1s value of the given size (in
 * bytes: 1, 2, or 4) for comparing with the result of a read.
 *
 * @size must be between 1 and 4: a size of 0 would shift a 32-bit
 * value by 32 bits, which is undefined.
 */
#define EEH_IO_ERROR_VALUE(size)	(~0U >> ((4 - (size)) * 8))
231
232#else /* !CONFIG_EEH */
Gavin Shaneb740b52012-02-27 20:04:04 +0000233
/* !CONFIG_EEH stub: nothing to initialise, always reports success (0). */
static inline int eeh_init(void)
{
	return 0;
}
238
/* !CONFIG_EEH stub: ignores both arguments and always returns NULL. */
static inline void *eeh_dev_init(struct device_node *dn, void *data)
{
	return NULL;
}
243
/* !CONFIG_EEH stub: does nothing. */
static inline void eeh_dev_phb_init_dynamic(struct pci_controller *phb) { }
245
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246static inline unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned long val)
247{
248 return val;
249}
250
/* !CONFIG_EEH stub: always 0; the argument is not evaluated. */
#define eeh_dev_check_failure(x) (0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252
/* !CONFIG_EEH stubs: each of the following does nothing. */
static inline void eeh_addr_cache_build(void) { }

static inline void eeh_add_device_tree_early(struct device_node *dn) { }

static inline void eeh_add_device_tree_late(struct pci_bus *bus) { }

static inline void eeh_add_sysfs_files(struct pci_bus *bus) { }

static inline void eeh_remove_bus_device(struct pci_dev *dev, int purge_pe) { }
Gavin Shan646a8492012-09-07 22:44:06 +0000262
/*
 * !CONFIG_EEH variants: an error is never suspected, and the error
 * value is all ones in an unsigned long regardless of @size.
 */
#define EEH_POSSIBLE_ERROR(val, type)	(0)
#define EEH_IO_ERROR_VALUE(size)	(-1UL)
265#endif /* CONFIG_EEH */
266
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +0000267#ifdef CONFIG_PPC64
Linas Vepstas172ca922005-11-03 18:50:04 -0600268/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269 * MMIO read/write operations with EEH support.
270 */
271static inline u8 eeh_readb(const volatile void __iomem *addr)
272{
273 u8 val = in_8(addr);
274 if (EEH_POSSIBLE_ERROR(val, u8))
275 return eeh_check_failure(addr, val);
276 return val;
277}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278
279static inline u16 eeh_readw(const volatile void __iomem *addr)
280{
281 u16 val = in_le16(addr);
282 if (EEH_POSSIBLE_ERROR(val, u16))
283 return eeh_check_failure(addr, val);
284 return val;
285}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286
287static inline u32 eeh_readl(const volatile void __iomem *addr)
288{
289 u32 val = in_le32(addr);
290 if (EEH_POSSIBLE_ERROR(val, u32))
291 return eeh_check_failure(addr, val);
292 return val;
293}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294
295static inline u64 eeh_readq(const volatile void __iomem *addr)
296{
297 u64 val = in_le64(addr);
298 if (EEH_POSSIBLE_ERROR(val, u64))
299 return eeh_check_failure(addr, val);
300 return val;
301}
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100302
303static inline u16 eeh_readw_be(const volatile void __iomem *addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700304{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100305 u16 val = in_be16(addr);
306 if (EEH_POSSIBLE_ERROR(val, u16))
307 return eeh_check_failure(addr, val);
308 return val;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309}
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100310
311static inline u32 eeh_readl_be(const volatile void __iomem *addr)
312{
313 u32 val = in_be32(addr);
314 if (EEH_POSSIBLE_ERROR(val, u32))
315 return eeh_check_failure(addr, val);
316 return val;
317}
318
319static inline u64 eeh_readq_be(const volatile void __iomem *addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320{
321 u64 val = in_be64(addr);
322 if (EEH_POSSIBLE_ERROR(val, u64))
323 return eeh_check_failure(addr, val);
324 return val;
325}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326
Benjamin Herrenschmidt68a64352006-11-13 09:27:39 +1100327static inline void eeh_memcpy_fromio(void *dest, const
328 volatile void __iomem *src,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329 unsigned long n)
330{
Benjamin Herrenschmidt68a64352006-11-13 09:27:39 +1100331 _memcpy_fromio(dest, src, n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332
333 /* Look for ffff's here at dest[n]. Assume that at least 4 bytes
334 * were copied. Check all four bytes.
335 */
Benjamin Herrenschmidt68a64352006-11-13 09:27:39 +1100336 if (n >= 4 && EEH_POSSIBLE_ERROR(*((u32 *)(dest + n - 4)), u32))
337 eeh_check_failure(src, *((u32 *)(dest + n - 4)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338}
339
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340/* in-string eeh macros */
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100341static inline void eeh_readsb(const volatile void __iomem *addr, void * buf,
342 int ns)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100344 _insb(addr, buf, ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345 if (EEH_POSSIBLE_ERROR((*(((u8*)buf)+ns-1)), u8))
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100346 eeh_check_failure(addr, *(u8*)buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347}
348
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100349static inline void eeh_readsw(const volatile void __iomem *addr, void * buf,
350 int ns)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100352 _insw(addr, buf, ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353 if (EEH_POSSIBLE_ERROR((*(((u16*)buf)+ns-1)), u16))
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100354 eeh_check_failure(addr, *(u16*)buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355}
356
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100357static inline void eeh_readsl(const volatile void __iomem *addr, void * buf,
358 int nl)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100360 _insl(addr, buf, nl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361 if (EEH_POSSIBLE_ERROR((*(((u32*)buf)+nl-1)), u32))
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100362 eeh_check_failure(addr, *(u32*)buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363}
364
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +0000365#endif /* CONFIG_PPC64 */
Arnd Bergmann88ced032005-12-16 22:43:46 +0100366#endif /* __KERNEL__ */
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +0000367#endif /* _POWERPC_EEH_H */