blob: 0c0ac93f422ff78903b9a0b7c6626a3b68453580 [file] [log] [blame]
Linas Vepstas172ca922005-11-03 18:50:04 -06001/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * Copyright (C) 2001 Dave Engebretsen & Todd Inglett IBM Corporation.
Gavin Shancb3bc9d2012-02-27 20:03:51 +00003 * Copyright 2001-2012 IBM Corporation.
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
Linas Vepstas172ca922005-11-03 18:50:04 -06009 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070010 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
Linas Vepstas172ca922005-11-03 18:50:04 -060014 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070015 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
18 */
19
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +000020#ifndef _POWERPC_EEH_H
21#define _POWERPC_EEH_H
Arnd Bergmann88ced032005-12-16 22:43:46 +010022#ifdef __KERNEL__
Linus Torvalds1da177e2005-04-16 15:20:36 -070023
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include <linux/init.h>
25#include <linux/list.h>
26#include <linux/string.h>
Gavin Shan5a719782013-06-20 13:21:01 +080027#include <linux/time.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29struct pci_dev;
John Rose827c1a62006-02-24 11:34:23 -060030struct pci_bus;
Linus Torvalds1da177e2005-04-16 15:20:36 -070031struct device_node;
Linus Torvalds1da177e2005-04-16 15:20:36 -070032
33#ifdef CONFIG_EEH
34
/*
 * The struct is used to trace PE related EEH functionality.
 * In theory, one instance of the struct is created for each
 * particular PE. By nature, PEs correlate with each other, so
 * the struct has to reflect that hierarchy in order to easily
 * pick up the affected PEs when one particular PE has EEH errors.
 *
 * Also, one particular PE might be composed of a PCI device, a PCI
 * bus and its subordinate components. The struct also needs to carry
 * that information. Furthermore, one particular PE is only meaningful
 * in the corresponding PHB. Therefore, the root PEs should be created
 * against existing PHBs in one-to-one fashion.
 */
/* PE type flags (struct eeh_pe documents its 'type' as PHB/Bus/Device). */
#define EEH_PE_INVALID		(1 << 0)	/* Invalid		*/
#define EEH_PE_PHB		(1 << 1)	/* PHB PE		*/
#define EEH_PE_DEVICE		(1 << 2)	/* Device PE		*/
#define EEH_PE_BUS		(1 << 3)	/* Bus PE		*/

/* PE condition flags -- presumably kept in eeh_pe.state; confirm at users. */
#define EEH_PE_ISOLATED		(1 << 0)	/* Isolated PE		*/
#define EEH_PE_RECOVERING	(1 << 1)	/* Recovering PE	*/
56
57struct eeh_pe {
58 int type; /* PE type: PHB/Bus/Device */
59 int state; /* PE EEH dependent mode */
60 int config_addr; /* Traditional PCI address */
61 int addr; /* PE configuration address */
62 struct pci_controller *phb; /* Associated PHB */
Gavin Shan8cdb2832013-06-20 13:20:55 +080063 struct pci_bus *bus; /* Top PCI bus for bus PE */
Gavin Shan968f9682012-09-07 22:44:05 +000064 int check_count; /* Times of ignored error */
65 int freeze_count; /* Times of froze up */
Gavin Shan5a719782013-06-20 13:21:01 +080066 struct timeval tstamp; /* Time on first-time freeze */
Gavin Shan968f9682012-09-07 22:44:05 +000067 int false_positives; /* Times of reported #ff's */
68 struct eeh_pe *parent; /* Parent PE */
69 struct list_head child_list; /* Link PE to the child list */
70 struct list_head edevs; /* Link list of EEH devices */
71 struct list_head child; /* Child PEs */
72};
73
/*
 * eeh_pe_for_each_dev - walk the EEH devices attached to a PE
 * @pe:   pointer expression yielding the struct eeh_pe whose 'edevs'
 *        list is traversed
 * @edev: struct eeh_dev * cursor; entries are linked via their 'list'
 *        member
 *
 * @pe is parenthesized in the expansion so that callers may pass any
 * pointer expression (e.g. a conditional or a cast), not only a plain
 * identifier.
 */
#define eeh_pe_for_each_dev(pe, edev) \
		list_for_each_entry(edev, &(pe)->edevs, list)
76
/*
 * The struct is used to trace EEH state for the associated
 * PCI device node or PCI device. In the future, it might
 * represent a PE as well, so that EEH devices form another
 * tree besides the currently existing tree of PCI buses and
 * PCI devices.
 */
Gavin Shandbbceee2012-09-07 22:44:20 +000084#define EEH_DEV_IRQ_DISABLED (1<<0) /* Interrupt disabled */
Gavin Shaneb740b52012-02-27 20:04:04 +000085
86struct eeh_dev {
87 int mode; /* EEH mode */
88 int class_code; /* Class code of the device */
89 int config_addr; /* Config address */
90 int pe_config_addr; /* PE config address */
Gavin Shaneb740b52012-02-27 20:04:04 +000091 u32 config_space[16]; /* Saved PCI config space */
Gavin Shan968f9682012-09-07 22:44:05 +000092 struct eeh_pe *pe; /* Associated PE */
93 struct list_head list; /* Form link list in the PE */
Gavin Shaneb740b52012-02-27 20:04:04 +000094 struct pci_controller *phb; /* Associated PHB */
95 struct device_node *dn; /* Associated device node */
96 struct pci_dev *pdev; /* Associated PCI device */
97};
98
99static inline struct device_node *eeh_dev_to_of_node(struct eeh_dev *edev)
100{
Gavin Shan2d5c1212013-06-05 15:34:03 +0800101 return edev ? edev->dn : NULL;
Gavin Shaneb740b52012-02-27 20:04:04 +0000102}
103
104static inline struct pci_dev *eeh_dev_to_pci_dev(struct eeh_dev *edev)
105{
Gavin Shan2d5c1212013-06-05 15:34:03 +0800106 return edev ? edev->pdev : NULL;
Gavin Shaneb740b52012-02-27 20:04:04 +0000107}
108
/*
 * The struct is used to trace the registered EEH operation
 * callback functions. Those operation callback functions are
 * heavily platform dependent, which means the platform should
 * register its own EEH operation callback functions before
 * any further EEH operations.
 */
/* EEH_OPT_*: option codes */
#define EEH_OPT_DISABLE		0	/* EEH disable	*/
#define EEH_OPT_ENABLE		1	/* EEH enable	*/
#define EEH_OPT_THAW_MMIO	2	/* MMIO enable	*/
#define EEH_OPT_THAW_DMA	3	/* DMA enable	*/

/* EEH_STATE_*: state bit flags */
#define EEH_STATE_UNAVAILABLE	(1 << 0)	/* State unavailable	*/
#define EEH_STATE_NOT_SUPPORT	(1 << 1)	/* EEH not supported	*/
#define EEH_STATE_RESET_ACTIVE	(1 << 2)	/* Active reset		*/
#define EEH_STATE_MMIO_ACTIVE	(1 << 3)	/* Active MMIO		*/
#define EEH_STATE_DMA_ACTIVE	(1 << 4)	/* Active DMA		*/
#define EEH_STATE_MMIO_ENABLED	(1 << 5)	/* MMIO enabled		*/
#define EEH_STATE_DMA_ENABLED	(1 << 6)	/* DMA enabled		*/

/* EEH_RESET_*: reset kinds (note: the value 2 is not defined here) */
#define EEH_RESET_DEACTIVATE	0	/* Deactivate the PE reset	*/
#define EEH_RESET_HOT		1	/* Hot reset			*/
#define EEH_RESET_FUNDAMENTAL	3	/* Fundamental reset		*/

/* EEH_LOG_*: error log severities */
#define EEH_LOG_TEMP		1	/* EEH temporary error log	*/
#define EEH_LOG_PERM		2	/* EEH permanent error log	*/
Gavin Shaneb594a42012-02-27 20:03:57 +0000132
Gavin Shanaa1e6372012-02-27 20:03:53 +0000133struct eeh_ops {
134 char *name;
135 int (*init)(void);
Gavin Shan21fd21f2013-06-20 13:20:57 +0800136 int (*post_init)(void);
Gavin Shand7bb8862012-09-07 22:44:21 +0000137 void* (*of_probe)(struct device_node *dn, void *flag);
Gavin Shan51fb5f52013-06-20 13:20:56 +0800138 int (*dev_probe)(struct pci_dev *dev, void *flag);
Gavin Shan371a3952012-09-07 22:44:14 +0000139 int (*set_option)(struct eeh_pe *pe, int option);
140 int (*get_pe_addr)(struct eeh_pe *pe);
141 int (*get_state)(struct eeh_pe *pe, int *state);
142 int (*reset)(struct eeh_pe *pe, int option);
143 int (*wait_state)(struct eeh_pe *pe, int max_wait);
144 int (*get_log)(struct eeh_pe *pe, int severity, char *drv_log, unsigned long len);
145 int (*configure_bridge)(struct eeh_pe *pe);
Gavin Shan37804442012-02-27 20:04:11 +0000146 int (*read_config)(struct device_node *dn, int where, int size, u32 *val);
147 int (*write_config)(struct device_node *dn, int where, int size, u32 val);
Gavin Shanaa1e6372012-02-27 20:03:53 +0000148};
149
150extern struct eeh_ops *eeh_ops;
David Woodhouse1e28a7d2005-11-17 00:44:03 +0000151extern int eeh_subsystem_enabled;
Gavin Shan646a8492012-09-07 22:44:06 +0000152extern struct mutex eeh_mutex;
Gavin Shan49075812013-06-20 13:21:03 +0800153extern raw_spinlock_t confirm_error_lock;
Gavin Shand7bb8862012-09-07 22:44:21 +0000154extern int eeh_probe_mode;
155
156#define EEH_PROBE_MODE_DEV (1<<0) /* From PCI device */
157#define EEH_PROBE_MODE_DEVTREE (1<<1) /* From device tree */
158
159static inline void eeh_probe_mode_set(int flag)
160{
161 eeh_probe_mode = flag;
162}
163
164static inline int eeh_probe_mode_devtree(void)
165{
166 return (eeh_probe_mode == EEH_PROBE_MODE_DEVTREE);
167}
168
169static inline int eeh_probe_mode_dev(void)
170{
171 return (eeh_probe_mode == EEH_PROBE_MODE_DEV);
172}
Gavin Shan646a8492012-09-07 22:44:06 +0000173
174static inline void eeh_lock(void)
175{
176 mutex_lock(&eeh_mutex);
177}
178
179static inline void eeh_unlock(void)
180{
181 mutex_unlock(&eeh_mutex);
182}
David Woodhouse1e28a7d2005-11-17 00:44:03 +0000183
Gavin Shan49075812013-06-20 13:21:03 +0800184static inline void eeh_serialize_lock(unsigned long *flags)
185{
186 raw_spin_lock_irqsave(&confirm_error_lock, *flags);
187}
188
189static inline void eeh_serialize_unlock(unsigned long flags)
190{
191 raw_spin_unlock_irqrestore(&confirm_error_lock, flags);
192}
193
/*
 * Upper bound on EEH freezes: once a device has frozen this many
 * times it is considered permanently disabled.
 */
#define EEH_MAX_ALLOWED_FREEZES	5
199
Gavin Shan22f4ab12012-09-07 22:44:08 +0000200typedef void *(*eeh_traverse_func)(void *data, void *flag);
Greg Kroah-Hartmancad5cef2012-12-21 14:04:10 -0800201int eeh_phb_pe_create(struct pci_controller *phb);
Gavin Shan9ff67432013-06-20 13:20:53 +0800202struct eeh_pe *eeh_phb_pe_get(struct pci_controller *phb);
Gavin Shan01566802013-06-20 13:20:54 +0800203struct eeh_pe *eeh_pe_get(struct eeh_dev *edev);
Gavin Shan9b843482012-09-07 22:44:09 +0000204int eeh_add_to_parent_pe(struct eeh_dev *edev);
Gavin Shan20ee6a92012-09-11 19:16:17 +0000205int eeh_rmv_from_parent_pe(struct eeh_dev *edev, int purge_pe);
Gavin Shan5a719782013-06-20 13:21:01 +0800206void eeh_pe_update_time_stamp(struct eeh_pe *pe);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000207void *eeh_pe_dev_traverse(struct eeh_pe *root,
208 eeh_traverse_func fn, void *flag);
209void eeh_pe_restore_bars(struct eeh_pe *pe);
Gavin Shan9b3c76f2012-09-07 22:44:19 +0000210struct pci_bus *eeh_pe_bus_get(struct eeh_pe *pe);
Gavin Shan55037d12012-09-07 22:44:07 +0000211
Greg Kroah-Hartmancad5cef2012-12-21 14:04:10 -0800212void *eeh_dev_init(struct device_node *dn, void *data);
213void eeh_dev_phb_init_dynamic(struct pci_controller *phb);
Gavin Shan51fb5f52013-06-20 13:20:56 +0800214int __init eeh_init(void);
Gavin Shanaa1e6372012-02-27 20:03:53 +0000215int __init eeh_ops_register(struct eeh_ops *ops);
216int __exit eeh_ops_unregister(const char *name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217unsigned long eeh_check_failure(const volatile void __iomem *token,
218 unsigned long val);
Gavin Shanf8f7d632012-09-07 22:44:22 +0000219int eeh_dev_check_failure(struct eeh_dev *edev);
Gavin Shan3ab96a02012-09-07 22:44:23 +0000220void __init eeh_addr_cache_build(void);
Linas Vepstase2a296e2005-11-03 18:51:31 -0600221void eeh_add_device_tree_early(struct device_node *);
John Rose827c1a62006-02-24 11:34:23 -0600222void eeh_add_device_tree_late(struct pci_bus *);
Thadeu Lima de Souza Cascardo6a040ce2012-12-28 09:13:19 +0000223void eeh_add_sysfs_files(struct pci_bus *);
Gavin Shan20ee6a92012-09-11 19:16:17 +0000224void eeh_remove_bus_device(struct pci_dev *, int);
Linas Vepstase2a296e2005-11-03 18:51:31 -0600225
/**
 * EEH_POSSIBLE_ERROR() -- cheap inline test for a possible MMIO failure.
 * @val:  value that was read
 * @type: integer type of @val; selects the width of the all-ones pattern
 *
 * True when @val is all ones for @type and eeh_subsystem_enabled is
 * non-zero. On TRUE the caller relays to eeh_check_failure(), which
 * does further tests out of line.
 */
#define EEH_POSSIBLE_ERROR(val, type)	\
		((val) == (type)~0 && eeh_subsystem_enabled)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233
/*
 * A read from a device that EEH has isolated returns all 1s.
 * EEH_IO_ERROR_VALUE(size) yields that all-1s pattern for an access
 * of @size bytes (1, 2, or 4), for comparison with a read result.
 */
#define EEH_IO_ERROR_VALUE(size)	(~0U >> (8 * (4 - (size))))
240
241#else /* !CONFIG_EEH */
Gavin Shaneb740b52012-02-27 20:04:04 +0000242
/* !CONFIG_EEH stub: nothing to initialise, always reports 0. */
static inline int eeh_init(void)
{
	return 0;
}
247
/* !CONFIG_EEH stub: ignores both arguments and always returns NULL. */
static inline void *eeh_dev_init(struct device_node *dn, void *data)
{
	return NULL;
}
252
/* !CONFIG_EEH stub: does nothing. */
static inline void eeh_dev_phb_init_dynamic(struct pci_controller *phb)
{
}
254
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255static inline unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned long val)
256{
257 return val;
258}
259
/* !CONFIG_EEH: remaining entry points collapse to constants or no-ops. */

/* Always 0; the argument is not evaluated. */
#define eeh_dev_check_failure(x) (0)

static inline void eeh_addr_cache_build(void)
{
}

static inline void eeh_add_device_tree_early(struct device_node *dn)
{
}

static inline void eeh_add_device_tree_late(struct pci_bus *bus)
{
}

static inline void eeh_add_sysfs_files(struct pci_bus *bus)
{
}

static inline void eeh_remove_bus_device(struct pci_dev *dev, int purge_pe)
{
}

static inline void eeh_lock(void)
{
}

static inline void eeh_unlock(void)
{
}

/* Never reports a possible error; arguments are not evaluated. */
#define EEH_POSSIBLE_ERROR(val, type) (0)
/* Constant all-ones unsigned long, independent of @size. */
#define EEH_IO_ERROR_VALUE(size) (-1UL)
277#endif /* CONFIG_EEH */
278
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +0000279#ifdef CONFIG_PPC64
Linas Vepstas172ca922005-11-03 18:50:04 -0600280/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281 * MMIO read/write operations with EEH support.
282 */
283static inline u8 eeh_readb(const volatile void __iomem *addr)
284{
285 u8 val = in_8(addr);
286 if (EEH_POSSIBLE_ERROR(val, u8))
287 return eeh_check_failure(addr, val);
288 return val;
289}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290
291static inline u16 eeh_readw(const volatile void __iomem *addr)
292{
293 u16 val = in_le16(addr);
294 if (EEH_POSSIBLE_ERROR(val, u16))
295 return eeh_check_failure(addr, val);
296 return val;
297}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298
299static inline u32 eeh_readl(const volatile void __iomem *addr)
300{
301 u32 val = in_le32(addr);
302 if (EEH_POSSIBLE_ERROR(val, u32))
303 return eeh_check_failure(addr, val);
304 return val;
305}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306
307static inline u64 eeh_readq(const volatile void __iomem *addr)
308{
309 u64 val = in_le64(addr);
310 if (EEH_POSSIBLE_ERROR(val, u64))
311 return eeh_check_failure(addr, val);
312 return val;
313}
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100314
315static inline u16 eeh_readw_be(const volatile void __iomem *addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700316{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100317 u16 val = in_be16(addr);
318 if (EEH_POSSIBLE_ERROR(val, u16))
319 return eeh_check_failure(addr, val);
320 return val;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321}
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100322
323static inline u32 eeh_readl_be(const volatile void __iomem *addr)
324{
325 u32 val = in_be32(addr);
326 if (EEH_POSSIBLE_ERROR(val, u32))
327 return eeh_check_failure(addr, val);
328 return val;
329}
330
331static inline u64 eeh_readq_be(const volatile void __iomem *addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332{
333 u64 val = in_be64(addr);
334 if (EEH_POSSIBLE_ERROR(val, u64))
335 return eeh_check_failure(addr, val);
336 return val;
337}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338
Benjamin Herrenschmidt68a64352006-11-13 09:27:39 +1100339static inline void eeh_memcpy_fromio(void *dest, const
340 volatile void __iomem *src,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 unsigned long n)
342{
Benjamin Herrenschmidt68a64352006-11-13 09:27:39 +1100343 _memcpy_fromio(dest, src, n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
345 /* Look for ffff's here at dest[n]. Assume that at least 4 bytes
346 * were copied. Check all four bytes.
347 */
Benjamin Herrenschmidt68a64352006-11-13 09:27:39 +1100348 if (n >= 4 && EEH_POSSIBLE_ERROR(*((u32 *)(dest + n - 4)), u32))
349 eeh_check_failure(src, *((u32 *)(dest + n - 4)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350}
351
/* in-string (repeated read) EEH helpers */
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100353static inline void eeh_readsb(const volatile void __iomem *addr, void * buf,
354 int ns)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100356 _insb(addr, buf, ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 if (EEH_POSSIBLE_ERROR((*(((u8*)buf)+ns-1)), u8))
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100358 eeh_check_failure(addr, *(u8*)buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359}
360
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100361static inline void eeh_readsw(const volatile void __iomem *addr, void * buf,
362 int ns)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100364 _insw(addr, buf, ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365 if (EEH_POSSIBLE_ERROR((*(((u16*)buf)+ns-1)), u16))
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100366 eeh_check_failure(addr, *(u16*)buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367}
368
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100369static inline void eeh_readsl(const volatile void __iomem *addr, void * buf,
370 int nl)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700371{
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100372 _insl(addr, buf, nl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700373 if (EEH_POSSIBLE_ERROR((*(((u32*)buf)+nl-1)), u32))
Benjamin Herrenschmidt4cb3cee2006-11-11 17:25:10 +1100374 eeh_check_failure(addr, *(u32*)buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375}
376
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +0000377#endif /* CONFIG_PPC64 */
Arnd Bergmann88ced032005-12-16 22:43:46 +0100378#endif /* __KERNEL__ */
Benjamin Herrenschmidt8b8da352008-10-27 19:48:37 +0000379#endif /* _POWERPC_EEH_H */