blob: 845e024321d4718b48293a9aff2025bc3cf541c1 [file] [log] [blame]
Thomas Gleixner1a59d1b82019-05-27 08:55:05 +02001// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * This file implements PE handling based on the information provided by
 * the platforms. Basically, there are 3 types of PEs: PHB/Bus/Device.
 * All the PEs are organized as a hierarchy tree. The first level of the
 * tree is associated with the existing PHBs, since a particular PE is
 * only meaningful within one PHB domain.
 *
 * Copyright Benjamin Herrenschmidt & Gavin Shan, IBM Corporation 2012.
 */
11
Gavin Shan652defe2013-06-27 13:46:43 +080012#include <linux/delay.h>
Gavin Shan55037d12012-09-07 22:44:07 +000013#include <linux/export.h>
14#include <linux/gfp.h>
Gavin Shan55037d12012-09-07 22:44:07 +000015#include <linux/kernel.h>
16#include <linux/pci.h>
17#include <linux/string.h>
18
19#include <asm/pci-bridge.h>
20#include <asm/ppc-pci.h>
21
/* Bytes of auxiliary data appended to every allocated PE (0: none) */
static int eeh_pe_aux_size;
/* List of PHB PEs, linked through eeh_pe::child */
static LIST_HEAD(eeh_phb_pe);
24
25/**
Gavin Shanbb593c02014-07-17 14:41:43 +100026 * eeh_set_pe_aux_size - Set PE auxillary data size
27 * @size: PE auxillary data size
28 *
29 * Set PE auxillary data size
30 */
31void eeh_set_pe_aux_size(int size)
32{
33 if (size < 0)
34 return;
35
36 eeh_pe_aux_size = size;
37}
38
39/**
Gavin Shan55037d12012-09-07 22:44:07 +000040 * eeh_pe_alloc - Allocate PE
41 * @phb: PCI controller
42 * @type: PE type
43 *
44 * Allocate PE instance dynamically.
45 */
46static struct eeh_pe *eeh_pe_alloc(struct pci_controller *phb, int type)
47{
48 struct eeh_pe *pe;
Gavin Shanbb593c02014-07-17 14:41:43 +100049 size_t alloc_size;
50
51 alloc_size = sizeof(struct eeh_pe);
52 if (eeh_pe_aux_size) {
53 alloc_size = ALIGN(alloc_size, cache_line_size());
54 alloc_size += eeh_pe_aux_size;
55 }
Gavin Shan55037d12012-09-07 22:44:07 +000056
57 /* Allocate PHB PE */
Gavin Shanbb593c02014-07-17 14:41:43 +100058 pe = kzalloc(alloc_size, GFP_KERNEL);
Gavin Shan55037d12012-09-07 22:44:07 +000059 if (!pe) return NULL;
60
61 /* Initialize PHB PE */
62 pe->type = type;
63 pe->phb = phb;
64 INIT_LIST_HEAD(&pe->child_list);
Gavin Shan55037d12012-09-07 22:44:07 +000065 INIT_LIST_HEAD(&pe->edevs);
66
Gavin Shanbb593c02014-07-17 14:41:43 +100067 pe->data = (void *)pe + ALIGN(sizeof(struct eeh_pe),
68 cache_line_size());
Gavin Shan55037d12012-09-07 22:44:07 +000069 return pe;
70}
71
72/**
73 * eeh_phb_pe_create - Create PHB PE
74 * @phb: PCI controller
75 *
76 * The function should be called while the PHB is detected during
77 * system boot or PCI hotplug in order to create PHB PE.
78 */
Greg Kroah-Hartmancad5cef2012-12-21 14:04:10 -080079int eeh_phb_pe_create(struct pci_controller *phb)
Gavin Shan55037d12012-09-07 22:44:07 +000080{
81 struct eeh_pe *pe;
82
83 /* Allocate PHB PE */
84 pe = eeh_pe_alloc(phb, EEH_PE_PHB);
85 if (!pe) {
86 pr_err("%s: out of memory!\n", __func__);
87 return -ENOMEM;
88 }
89
90 /* Put it into the list */
Gavin Shan55037d12012-09-07 22:44:07 +000091 list_add_tail(&pe->child, &eeh_phb_pe);
Gavin Shan55037d12012-09-07 22:44:07 +000092
Russell Currey1f52f172016-11-16 14:02:15 +110093 pr_debug("EEH: Add PE for PHB#%x\n", phb->global_number);
Gavin Shan55037d12012-09-07 22:44:07 +000094
95 return 0;
96}
97
98/**
Sam Bobrofffef7f902018-09-12 11:23:32 +100099 * eeh_wait_state - Wait for PE state
100 * @pe: EEH PE
101 * @max_wait: maximal period in millisecond
102 *
103 * Wait for the state of associated PE. It might take some time
104 * to retrieve the PE's state.
105 */
106int eeh_wait_state(struct eeh_pe *pe, int max_wait)
107{
108 int ret;
109 int mwait;
110
111 /*
112 * According to PAPR, the state of PE might be temporarily
113 * unavailable. Under the circumstance, we have to wait
114 * for indicated time determined by firmware. The maximal
115 * wait time is 5 minutes, which is acquired from the original
116 * EEH implementation. Also, the original implementation
117 * also defined the minimal wait time as 1 second.
118 */
119#define EEH_STATE_MIN_WAIT_TIME (1000)
120#define EEH_STATE_MAX_WAIT_TIME (300 * 1000)
121
122 while (1) {
123 ret = eeh_ops->get_state(pe, &mwait);
124
125 if (ret != EEH_STATE_UNAVAILABLE)
126 return ret;
127
128 if (max_wait <= 0) {
129 pr_warn("%s: Timeout when getting PE's state (%d)\n",
130 __func__, max_wait);
131 return EEH_STATE_NOT_SUPPORT;
132 }
133
134 if (mwait < EEH_STATE_MIN_WAIT_TIME) {
135 pr_warn("%s: Firmware returned bad wait value %d\n",
136 __func__, mwait);
137 mwait = EEH_STATE_MIN_WAIT_TIME;
138 } else if (mwait > EEH_STATE_MAX_WAIT_TIME) {
139 pr_warn("%s: Firmware returned too long wait value %d\n",
140 __func__, mwait);
141 mwait = EEH_STATE_MAX_WAIT_TIME;
142 }
143
144 msleep(min(mwait, max_wait));
145 max_wait -= mwait;
146 }
147}
148
149/**
Gavin Shan55037d12012-09-07 22:44:07 +0000150 * eeh_phb_pe_get - Retrieve PHB PE based on the given PHB
151 * @phb: PCI controller
152 *
153 * The overall PEs form hierarchy tree. The first layer of the
154 * hierarchy tree is composed of PHB PEs. The function is used
155 * to retrieve the corresponding PHB PE according to the given PHB.
156 */
Gavin Shan9ff67432013-06-20 13:20:53 +0800157struct eeh_pe *eeh_phb_pe_get(struct pci_controller *phb)
Gavin Shan55037d12012-09-07 22:44:07 +0000158{
159 struct eeh_pe *pe;
160
Gavin Shan55037d12012-09-07 22:44:07 +0000161 list_for_each_entry(pe, &eeh_phb_pe, child) {
162 /*
163 * Actually, we needn't check the type since
164 * the PE for PHB has been determined when that
165 * was created.
166 */
Aneesh Kumar K.V78446632012-09-20 23:29:46 +0000167 if ((pe->type & EEH_PE_PHB) && pe->phb == phb)
Gavin Shan55037d12012-09-07 22:44:07 +0000168 return pe;
Gavin Shan55037d12012-09-07 22:44:07 +0000169 }
170
Gavin Shan55037d12012-09-07 22:44:07 +0000171 return NULL;
172}
Gavin Shan22f4ab12012-09-07 22:44:08 +0000173
174/**
175 * eeh_pe_next - Retrieve the next PE in the tree
176 * @pe: current PE
177 * @root: root PE
178 *
179 * The function is used to retrieve the next PE in the
180 * hierarchy PE tree.
181 */
Sam Bobroff309ed3a2018-05-25 13:11:35 +1000182struct eeh_pe *eeh_pe_next(struct eeh_pe *pe, struct eeh_pe *root)
Gavin Shan22f4ab12012-09-07 22:44:08 +0000183{
184 struct list_head *next = pe->child_list.next;
185
186 if (next == &pe->child_list) {
187 while (1) {
188 if (pe == root)
189 return NULL;
190 next = pe->child.next;
191 if (next != &pe->parent->child_list)
192 break;
193 pe = pe->parent;
194 }
195 }
196
197 return list_entry(next, struct eeh_pe, child);
198}
199
200/**
201 * eeh_pe_traverse - Traverse PEs in the specified PHB
202 * @root: root PE
203 * @fn: callback
204 * @flag: extra parameter to callback
205 *
206 * The function is used to traverse the specified PE and its
207 * child PEs. The traversing is to be terminated once the
208 * callback returns something other than NULL, or no more PEs
209 * to be traversed.
210 */
Gavin Shanf5c57712013-07-24 10:24:58 +0800211void *eeh_pe_traverse(struct eeh_pe *root,
Sam Bobroffd6c49322018-05-25 13:11:32 +1000212 eeh_pe_traverse_func fn, void *flag)
Gavin Shan22f4ab12012-09-07 22:44:08 +0000213{
214 struct eeh_pe *pe;
215 void *ret;
216
Sam Bobroff309ed3a2018-05-25 13:11:35 +1000217 eeh_for_each_pe(root, pe) {
Gavin Shan22f4ab12012-09-07 22:44:08 +0000218 ret = fn(pe, flag);
219 if (ret) return ret;
220 }
221
222 return NULL;
223}
224
225/**
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000226 * eeh_pe_dev_traverse - Traverse the devices from the PE
227 * @root: EEH PE
228 * @fn: function callback
229 * @flag: extra parameter to callback
230 *
231 * The function is used to traverse the devices of the specified
232 * PE and its child PEs.
233 */
Sam Bobroffcef50c62019-08-16 14:48:15 +1000234void eeh_pe_dev_traverse(struct eeh_pe *root,
Sam Bobroffd6c49322018-05-25 13:11:32 +1000235 eeh_edev_traverse_func fn, void *flag)
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000236{
237 struct eeh_pe *pe;
Gavin Shan9feed422013-07-24 10:24:56 +0800238 struct eeh_dev *edev, *tmp;
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000239
240 if (!root) {
Gavin Shan0dae2742014-07-17 14:41:41 +1000241 pr_warn("%s: Invalid PE %p\n",
242 __func__, root);
Sam Bobroffcef50c62019-08-16 14:48:15 +1000243 return;
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000244 }
245
246 /* Traverse root PE */
Sam Bobroffcef50c62019-08-16 14:48:15 +1000247 eeh_for_each_pe(root, pe)
248 eeh_pe_for_each_dev(pe, edev, tmp)
249 fn(edev, flag);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000250}
251
252/**
Gavin Shan22f4ab12012-09-07 22:44:08 +0000253 * __eeh_pe_get - Check the PE address
Gavin Shan22f4ab12012-09-07 22:44:08 +0000254 *
255 * For one particular PE, it can be identified by PE address
256 * or tranditional BDF address. BDF address is composed of
257 * Bus/Device/Function number. The extra data referred by flag
258 * indicates which type of address should be used.
259 */
Sam Bobroffd6c49322018-05-25 13:11:32 +1000260static void *__eeh_pe_get(struct eeh_pe *pe, void *flag)
Gavin Shan22f4ab12012-09-07 22:44:08 +0000261{
Oliver O'Halloran35d64732020-09-18 19:30:50 +1000262 int *target_pe = flag;
Gavin Shan22f4ab12012-09-07 22:44:08 +0000263
Oliver O'Halloran35d64732020-09-18 19:30:50 +1000264 /* PHB PEs are special and should be ignored */
Gavin Shan5efc3ad2012-09-11 19:16:16 +0000265 if (pe->type & EEH_PE_PHB)
Gavin Shan22f4ab12012-09-07 22:44:08 +0000266 return NULL;
267
Oliver O'Halloran35d64732020-09-18 19:30:50 +1000268 if (*target_pe == pe->addr)
Gavin Shan22f4ab12012-09-07 22:44:08 +0000269 return pe;
270
271 return NULL;
272}
273
274/**
275 * eeh_pe_get - Search PE based on the given address
Alexey Kardashevskiy8bae6a22017-08-29 17:34:00 +1000276 * @phb: PCI controller
277 * @pe_no: PE number
Gavin Shan22f4ab12012-09-07 22:44:08 +0000278 *
279 * Search the corresponding PE based on the specified address which
280 * is included in the eeh device. The function is used to check if
281 * the associated PE has been created against the PE address. It's
282 * notable that the PE address has 2 format: traditional PE address
283 * which is composed of PCI bus/device/function number, or unified
284 * PE address.
285 */
Oliver O'Halloran35d64732020-09-18 19:30:50 +1000286struct eeh_pe *eeh_pe_get(struct pci_controller *phb, int pe_no)
Gavin Shan22f4ab12012-09-07 22:44:08 +0000287{
Alexey Kardashevskiy8bae6a22017-08-29 17:34:00 +1000288 struct eeh_pe *root = eeh_phb_pe_get(phb);
Gavin Shan22f4ab12012-09-07 22:44:08 +0000289
Oliver O'Halloran35d64732020-09-18 19:30:50 +1000290 return eeh_pe_traverse(root, __eeh_pe_get, &pe_no);
Gavin Shan22f4ab12012-09-07 22:44:08 +0000291}
292
293/**
Oliver O'Hallorand923ab72020-07-25 18:12:29 +1000294 * eeh_pe_tree_insert - Add EEH device to parent PE
Gavin Shan9b843482012-09-07 22:44:09 +0000295 * @edev: EEH device
Oliver O'Hallorana131bfc2020-07-25 18:12:31 +1000296 * @new_pe_parent: PE to create additional PEs under
Gavin Shan9b843482012-09-07 22:44:09 +0000297 *
Oliver O'Hallorana131bfc2020-07-25 18:12:31 +1000298 * Add EEH device to the PE in edev->pe_config_addr. If a PE already
299 * exists with that address then @edev is added to that PE. Otherwise
300 * a new PE is created and inserted into the PE tree as a child of
301 * @new_pe_parent.
302 *
303 * If @new_pe_parent is NULL then the new PE will be inserted under
304 * directly under the the PHB.
Gavin Shan9b843482012-09-07 22:44:09 +0000305 */
Oliver O'Hallorana131bfc2020-07-25 18:12:31 +1000306int eeh_pe_tree_insert(struct eeh_dev *edev, struct eeh_pe *new_pe_parent)
Gavin Shan9b843482012-09-07 22:44:09 +0000307{
Oliver O'Halloran31595ae2020-07-25 18:12:30 +1000308 struct pci_controller *hose = edev->controller;
Gavin Shan9b843482012-09-07 22:44:09 +0000309 struct eeh_pe *pe, *parent;
310
311 /*
312 * Search the PE has been existing or not according
313 * to the PE address. If that has been existing, the
314 * PE should be composed of PCI bus and its subordinate
315 * components.
316 */
Oliver O'Halloran35d64732020-09-18 19:30:50 +1000317 pe = eeh_pe_get(hose, edev->pe_config_addr);
Sam Bobroff27d43962019-08-16 14:48:16 +1000318 if (pe) {
319 if (pe->type & EEH_PE_INVALID) {
320 list_add_tail(&edev->entry, &pe->edevs);
321 edev->pe = pe;
322 /*
323 * We're running to here because of PCI hotplug caused by
324 * EEH recovery. We need clear EEH_PE_INVALID until the top.
325 */
326 parent = pe;
327 while (parent) {
328 if (!(parent->type & EEH_PE_INVALID))
329 break;
330 parent->type &= ~EEH_PE_INVALID;
331 parent = parent->parent;
332 }
Gavin Shan9b843482012-09-07 22:44:09 +0000333
Oliver O'Hallorana131bfc2020-07-25 18:12:31 +1000334 eeh_edev_dbg(edev, "Added to existing PE (parent: PE#%x)\n",
Sam Bobroff27d43962019-08-16 14:48:16 +1000335 pe->parent->addr);
336 } else {
337 /* Mark the PE as type of PCI bus */
338 pe->type = EEH_PE_BUS;
339 edev->pe = pe;
340
341 /* Put the edev to PE */
342 list_add_tail(&edev->entry, &pe->edevs);
343 eeh_edev_dbg(edev, "Added to bus PE\n");
Gavin Shan5efc3ad2012-09-11 19:16:16 +0000344 }
Gavin Shan5efc3ad2012-09-11 19:16:16 +0000345 return 0;
Gavin Shan9b843482012-09-07 22:44:09 +0000346 }
347
348 /* Create a new EEH PE */
Wei Yangc29fa272016-03-04 10:53:08 +1100349 if (edev->physfn)
Oliver O'Halloran31595ae2020-07-25 18:12:30 +1000350 pe = eeh_pe_alloc(hose, EEH_PE_VF);
Wei Yangc29fa272016-03-04 10:53:08 +1100351 else
Oliver O'Halloran31595ae2020-07-25 18:12:30 +1000352 pe = eeh_pe_alloc(hose, EEH_PE_DEVICE);
Gavin Shan9b843482012-09-07 22:44:09 +0000353 if (!pe) {
354 pr_err("%s: out of memory!\n", __func__);
355 return -ENOMEM;
356 }
Oliver O'Halloran269e5832020-10-07 15:09:02 +1100357
358 pe->addr = edev->pe_config_addr;
Gavin Shan9b843482012-09-07 22:44:09 +0000359
360 /*
361 * Put the new EEH PE into hierarchy tree. If the parent
362 * can't be found, the newly created PE will be attached
363 * to PHB directly. Otherwise, we have to associate the
364 * PE with its parent.
365 */
Oliver O'Hallorana131bfc2020-07-25 18:12:31 +1000366 if (!new_pe_parent) {
367 new_pe_parent = eeh_phb_pe_get(hose);
368 if (!new_pe_parent) {
Gavin Shan9b843482012-09-07 22:44:09 +0000369 pr_err("%s: No PHB PE is found (PHB Domain=%d)\n",
Oliver O'Halloran31595ae2020-07-25 18:12:30 +1000370 __func__, hose->global_number);
Gavin Shan9b843482012-09-07 22:44:09 +0000371 edev->pe = NULL;
372 kfree(pe);
373 return -EEXIST;
374 }
375 }
Oliver O'Hallorana131bfc2020-07-25 18:12:31 +1000376
377 /* link new PE into the tree */
378 pe->parent = new_pe_parent;
379 list_add_tail(&pe->child, &new_pe_parent->child_list);
Gavin Shan9b843482012-09-07 22:44:09 +0000380
381 /*
382 * Put the newly created PE into the child list and
383 * link the EEH device accordingly.
384 */
Sam Bobroff80e65b02018-09-12 11:23:26 +1000385 list_add_tail(&edev->entry, &pe->edevs);
Gavin Shan9b843482012-09-07 22:44:09 +0000386 edev->pe = pe;
Oliver O'Hallorana131bfc2020-07-25 18:12:31 +1000387 eeh_edev_dbg(edev, "Added to new (parent: PE#%x)\n",
388 new_pe_parent->addr);
Gavin Shan9b843482012-09-07 22:44:09 +0000389
390 return 0;
391}
Gavin Shan82e88822012-09-07 22:44:10 +0000392
393/**
Oliver O'Hallorand923ab72020-07-25 18:12:29 +1000394 * eeh_pe_tree_remove - Remove one EEH device from the associated PE
Gavin Shan82e88822012-09-07 22:44:10 +0000395 * @edev: EEH device
396 *
397 * The PE hierarchy tree might be changed when doing PCI hotplug.
398 * Also, the PCI devices or buses could be removed from the system
399 * during EEH recovery. So we have to call the function remove the
400 * corresponding PE accordingly if necessary.
401 */
Oliver O'Hallorand923ab72020-07-25 18:12:29 +1000402int eeh_pe_tree_remove(struct eeh_dev *edev)
Gavin Shan82e88822012-09-07 22:44:10 +0000403{
Gavin Shan5efc3ad2012-09-11 19:16:16 +0000404 struct eeh_pe *pe, *parent, *child;
Oliver O'Halloran799abe22019-09-03 20:15:52 +1000405 bool keep, recover;
Gavin Shan5efc3ad2012-09-11 19:16:16 +0000406 int cnt;
Gavin Shan82e88822012-09-07 22:44:10 +0000407
Sam Bobroff9a3eda22018-09-12 11:23:28 +1000408 pe = eeh_dev_to_pe(edev);
409 if (!pe) {
Sam Bobroff1ff8f362019-08-16 14:48:13 +1000410 eeh_edev_dbg(edev, "No PE found for device.\n");
Gavin Shan82e88822012-09-07 22:44:10 +0000411 return -EEXIST;
412 }
413
414 /* Remove the EEH device */
Gavin Shan82e88822012-09-07 22:44:10 +0000415 edev->pe = NULL;
Sam Bobroff80e65b02018-09-12 11:23:26 +1000416 list_del(&edev->entry);
Gavin Shan82e88822012-09-07 22:44:10 +0000417
418 /*
419 * Check if the parent PE includes any EEH devices.
420 * If not, we should delete that. Also, we should
421 * delete the parent PE if it doesn't have associated
422 * child PEs and EEH devices.
423 */
424 while (1) {
425 parent = pe->parent;
Oliver O'Halloran799abe22019-09-03 20:15:52 +1000426
427 /* PHB PEs should never be removed */
Gavin Shan5efc3ad2012-09-11 19:16:16 +0000428 if (pe->type & EEH_PE_PHB)
Gavin Shan82e88822012-09-07 22:44:10 +0000429 break;
430
Oliver O'Halloran799abe22019-09-03 20:15:52 +1000431 /*
432 * XXX: KEEP is set while resetting a PE. I don't think it's
433 * ever set without RECOVERING also being set. I could
434 * be wrong though so catch that with a WARN.
435 */
436 keep = !!(pe->state & EEH_PE_KEEP);
437 recover = !!(pe->state & EEH_PE_RECOVERING);
438 WARN_ON(keep && !recover);
439
440 if (!keep && !recover) {
Gavin Shan20ee6a92012-09-11 19:16:17 +0000441 if (list_empty(&pe->edevs) &&
442 list_empty(&pe->child_list)) {
443 list_del(&pe->child);
444 kfree(pe);
445 } else {
Gavin Shan5efc3ad2012-09-11 19:16:16 +0000446 break;
Gavin Shan20ee6a92012-09-11 19:16:17 +0000447 }
448 } else {
Oliver O'Halloran799abe22019-09-03 20:15:52 +1000449 /*
450 * Mark the PE as invalid. At the end of the recovery
451 * process any invalid PEs will be garbage collected.
452 *
453 * We need to delay the free()ing of them since we can
454 * remove edev's while traversing the PE tree which
455 * might trigger the removal of a PE and we can't
456 * deal with that (yet).
457 */
Gavin Shan20ee6a92012-09-11 19:16:17 +0000458 if (list_empty(&pe->edevs)) {
459 cnt = 0;
460 list_for_each_entry(child, &pe->child_list, child) {
Gavin Shane716e012012-11-22 21:58:26 +0000461 if (!(child->type & EEH_PE_INVALID)) {
Gavin Shan20ee6a92012-09-11 19:16:17 +0000462 cnt++;
463 break;
464 }
465 }
466
467 if (!cnt)
468 pe->type |= EEH_PE_INVALID;
469 else
470 break;
471 }
Gavin Shan82e88822012-09-07 22:44:10 +0000472 }
473
474 pe = parent;
475 }
476
477 return 0;
478}
Gavin Shan5b663522012-09-07 22:44:12 +0000479
480/**
Gavin Shan5a719782013-06-20 13:21:01 +0800481 * eeh_pe_update_time_stamp - Update PE's frozen time stamp
482 * @pe: EEH PE
483 *
484 * We have time stamp for each PE to trace its time of getting
485 * frozen in last hour. The function should be called to update
486 * the time stamp on first error of the specific PE. On the other
487 * handle, we needn't account for errors happened in last hour.
488 */
489void eeh_pe_update_time_stamp(struct eeh_pe *pe)
490{
Arnd Bergmannedfd17f2017-11-04 22:26:52 +0100491 time64_t tstamp;
Gavin Shan5a719782013-06-20 13:21:01 +0800492
493 if (!pe) return;
494
495 if (pe->freeze_count <= 0) {
496 pe->freeze_count = 0;
Arnd Bergmannedfd17f2017-11-04 22:26:52 +0100497 pe->tstamp = ktime_get_seconds();
Gavin Shan5a719782013-06-20 13:21:01 +0800498 } else {
Arnd Bergmannedfd17f2017-11-04 22:26:52 +0100499 tstamp = ktime_get_seconds();
500 if (tstamp - pe->tstamp > 3600) {
Gavin Shan5a719782013-06-20 13:21:01 +0800501 pe->tstamp = tstamp;
502 pe->freeze_count = 0;
503 }
504 }
505}
506
507/**
Gavin Shan5b663522012-09-07 22:44:12 +0000508 * eeh_pe_state_mark - Mark specified state for PE and its associated device
509 * @pe: EEH PE
510 *
511 * EEH error affects the current PE and its child PEs. The function
512 * is used to mark appropriate state for the affected PEs and the
513 * associated devices.
514 */
Sam Bobroffe762bb82018-09-12 11:23:31 +1000515void eeh_pe_state_mark(struct eeh_pe *root, int state)
Gavin Shan5b663522012-09-07 22:44:12 +0000516{
Sam Bobroffe762bb82018-09-12 11:23:31 +1000517 struct eeh_pe *pe;
518
519 eeh_for_each_pe(root, pe)
520 if (!(pe->state & EEH_PE_REMOVED))
521 pe->state |= state;
Gavin Shan5b663522012-09-07 22:44:12 +0000522}
Gavin Shane0056b02016-09-28 14:34:55 +1000523EXPORT_SYMBOL_GPL(eeh_pe_state_mark);
Gavin Shan5b663522012-09-07 22:44:12 +0000524
Sam Bobroffe762bb82018-09-12 11:23:31 +1000525/**
526 * eeh_pe_mark_isolated
527 * @pe: EEH PE
528 *
529 * Record that a PE has been isolated by marking the PE and it's children as
530 * EEH_PE_ISOLATED (and EEH_PE_CFG_BLOCKED, if required) and their PCI devices
531 * as pci_channel_io_frozen.
532 */
533void eeh_pe_mark_isolated(struct eeh_pe *root)
534{
535 struct eeh_pe *pe;
536 struct eeh_dev *edev;
537 struct pci_dev *pdev;
538
539 eeh_pe_state_mark(root, EEH_PE_ISOLATED);
540 eeh_for_each_pe(root, pe) {
541 list_for_each_entry(edev, &pe->edevs, entry) {
542 pdev = eeh_dev_to_pci_dev(edev);
543 if (pdev)
544 pdev->error_state = pci_channel_io_frozen;
545 }
546 /* Block PCI config access if required */
547 if (pe->state & EEH_PE_CFG_RESTRICTED)
548 pe->state |= EEH_PE_CFG_BLOCKED;
549 }
550}
551EXPORT_SYMBOL_GPL(eeh_pe_mark_isolated);
552
Sam Bobroffcef50c62019-08-16 14:48:15 +1000553static void __eeh_pe_dev_mode_mark(struct eeh_dev *edev, void *flag)
Gavin Shand2b0f6f2014-04-24 18:00:19 +1000554{
Gavin Shand2b0f6f2014-04-24 18:00:19 +1000555 int mode = *((int *)flag);
556
557 edev->mode |= mode;
Gavin Shand2b0f6f2014-04-24 18:00:19 +1000558}
559
560/**
561 * eeh_pe_dev_state_mark - Mark state for all device under the PE
562 * @pe: EEH PE
563 *
564 * Mark specific state for all child devices of the PE.
565 */
566void eeh_pe_dev_mode_mark(struct eeh_pe *pe, int mode)
567{
568 eeh_pe_dev_traverse(pe, __eeh_pe_dev_mode_mark, &mode);
569}
570
Gavin Shan5b663522012-09-07 22:44:12 +0000571/**
Sam Bobroff9ed5ca62018-11-29 14:16:39 +1100572 * eeh_pe_state_clear - Clear state for the PE
Gavin Shan5b663522012-09-07 22:44:12 +0000573 * @data: EEH PE
Sam Bobroff9ed5ca62018-11-29 14:16:39 +1100574 * @state: state
575 * @include_passed: include passed-through devices?
Gavin Shan5b663522012-09-07 22:44:12 +0000576 *
577 * The function is used to clear the indicated state from the
578 * given PE. Besides, we also clear the check count of the PE
579 * as well.
580 */
Sam Bobroff9ed5ca62018-11-29 14:16:39 +1100581void eeh_pe_state_clear(struct eeh_pe *root, int state, bool include_passed)
Gavin Shan5b663522012-09-07 22:44:12 +0000582{
Sam Bobroff9ed5ca62018-11-29 14:16:39 +1100583 struct eeh_pe *pe;
Gavin Shan22fca172014-09-30 12:38:59 +1000584 struct eeh_dev *edev, *tmp;
585 struct pci_dev *pdev;
Gavin Shan5b663522012-09-07 22:44:12 +0000586
Sam Bobroff9ed5ca62018-11-29 14:16:39 +1100587 eeh_for_each_pe(root, pe) {
588 /* Keep the state of permanently removed PE intact */
589 if (pe->state & EEH_PE_REMOVED)
Gavin Shan22fca172014-09-30 12:38:59 +1000590 continue;
591
Sam Bobroff9ed5ca62018-11-29 14:16:39 +1100592 if (!include_passed && eeh_pe_passed(pe))
593 continue;
594
595 pe->state &= ~state;
596
597 /*
598 * Special treatment on clearing isolated state. Clear
599 * check count since last isolation and put all affected
600 * devices to normal state.
601 */
602 if (!(state & EEH_PE_ISOLATED))
603 continue;
604
605 pe->check_count = 0;
606 eeh_pe_for_each_dev(pe, edev, tmp) {
607 pdev = eeh_dev_to_pci_dev(edev);
608 if (!pdev)
609 continue;
610
611 pdev->error_state = pci_channel_io_normal;
612 }
613
614 /* Unblock PCI config access if required */
615 if (pe->state & EEH_PE_CFG_RESTRICTED)
616 pe->state &= ~EEH_PE_CFG_BLOCKED;
Gavin Shan22fca172014-09-30 12:38:59 +1000617 }
Gavin Shan5b663522012-09-07 22:44:12 +0000618}
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000619
Gavin Shan652defe2013-06-27 13:46:43 +0800620/*
621 * Some PCI bridges (e.g. PLX bridges) have primary/secondary
622 * buses assigned explicitly by firmware, and we probably have
623 * lost that after reset. So we have to delay the check until
624 * the PCI-CFG registers have been restored for the parent
625 * bridge.
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000626 *
Gavin Shan652defe2013-06-27 13:46:43 +0800627 * Don't use normal PCI-CFG accessors, which probably has been
628 * blocked on normal path during the stage. So we need utilize
629 * eeh operations, which is always permitted.
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000630 */
Gavin Shan0bd78582015-03-17 16:15:07 +1100631static void eeh_bridge_check_link(struct eeh_dev *edev)
Gavin Shan652defe2013-06-27 13:46:43 +0800632{
633 int cap;
634 uint32_t val;
635 int timeout = 0;
636
637 /*
638 * We only check root port and downstream ports of
639 * PCIe switches
640 */
Gavin Shan4b83bd42013-07-24 10:24:59 +0800641 if (!(edev->mode & (EEH_DEV_ROOT_PORT | EEH_DEV_DS_PORT)))
Gavin Shan652defe2013-06-27 13:46:43 +0800642 return;
643
Sam Bobroff1ff8f362019-08-16 14:48:13 +1000644 eeh_edev_dbg(edev, "Checking PCIe link...\n");
Gavin Shan652defe2013-06-27 13:46:43 +0800645
646 /* Check slot status */
Gavin Shan4b83bd42013-07-24 10:24:59 +0800647 cap = edev->pcie_cap;
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000648 eeh_ops->read_config(edev, cap + PCI_EXP_SLTSTA, 2, &val);
Gavin Shan652defe2013-06-27 13:46:43 +0800649 if (!(val & PCI_EXP_SLTSTA_PDS)) {
Sam Bobroff1ff8f362019-08-16 14:48:13 +1000650 eeh_edev_dbg(edev, "No card in the slot (0x%04x) !\n", val);
Gavin Shan652defe2013-06-27 13:46:43 +0800651 return;
652 }
653
654 /* Check power status if we have the capability */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000655 eeh_ops->read_config(edev, cap + PCI_EXP_SLTCAP, 2, &val);
Gavin Shan652defe2013-06-27 13:46:43 +0800656 if (val & PCI_EXP_SLTCAP_PCP) {
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000657 eeh_ops->read_config(edev, cap + PCI_EXP_SLTCTL, 2, &val);
Gavin Shan652defe2013-06-27 13:46:43 +0800658 if (val & PCI_EXP_SLTCTL_PCC) {
Sam Bobroff1ff8f362019-08-16 14:48:13 +1000659 eeh_edev_dbg(edev, "In power-off state, power it on ...\n");
Gavin Shan652defe2013-06-27 13:46:43 +0800660 val &= ~(PCI_EXP_SLTCTL_PCC | PCI_EXP_SLTCTL_PIC);
661 val |= (0x0100 & PCI_EXP_SLTCTL_PIC);
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000662 eeh_ops->write_config(edev, cap + PCI_EXP_SLTCTL, 2, val);
Gavin Shan652defe2013-06-27 13:46:43 +0800663 msleep(2 * 1000);
664 }
665 }
666
667 /* Enable link */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000668 eeh_ops->read_config(edev, cap + PCI_EXP_LNKCTL, 2, &val);
Gavin Shan652defe2013-06-27 13:46:43 +0800669 val &= ~PCI_EXP_LNKCTL_LD;
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000670 eeh_ops->write_config(edev, cap + PCI_EXP_LNKCTL, 2, val);
Gavin Shan652defe2013-06-27 13:46:43 +0800671
672 /* Check link */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000673 eeh_ops->read_config(edev, cap + PCI_EXP_LNKCAP, 4, &val);
Gavin Shan652defe2013-06-27 13:46:43 +0800674 if (!(val & PCI_EXP_LNKCAP_DLLLARC)) {
Sam Bobroff1ff8f362019-08-16 14:48:13 +1000675 eeh_edev_dbg(edev, "No link reporting capability (0x%08x) \n", val);
Gavin Shan652defe2013-06-27 13:46:43 +0800676 msleep(1000);
677 return;
678 }
679
680 /* Wait the link is up until timeout (5s) */
681 timeout = 0;
682 while (timeout < 5000) {
683 msleep(20);
684 timeout += 20;
685
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000686 eeh_ops->read_config(edev, cap + PCI_EXP_LNKSTA, 2, &val);
Gavin Shan652defe2013-06-27 13:46:43 +0800687 if (val & PCI_EXP_LNKSTA_DLLLA)
688 break;
689 }
690
691 if (val & PCI_EXP_LNKSTA_DLLLA)
Sam Bobroff1ff8f362019-08-16 14:48:13 +1000692 eeh_edev_dbg(edev, "Link up (%s)\n",
Gavin Shan652defe2013-06-27 13:46:43 +0800693 (val & PCI_EXP_LNKSTA_CLS_2_5GB) ? "2.5GB" : "5GB");
694 else
Sam Bobroff1ff8f362019-08-16 14:48:13 +1000695 eeh_edev_dbg(edev, "Link not ready (0x%04x)\n", val);
Gavin Shan652defe2013-06-27 13:46:43 +0800696}
697
/*
 * BYTE_SWAP() maps a config space byte offset to the index with the
 * byte position mirrored inside its 4-byte word (0 <-> 3, 1 <-> 2).
 * SAVED_BYTE() uses that index to fetch a single byte from the saved
 * config space of the "edev" variable in the scope it is used in.
 */
#define BYTE_SWAP(OFF)	(((OFF) / 4) * 8 + 3 - (OFF))
#define SAVED_BYTE(OFF)	(((u8 *)(edev->config_space))[BYTE_SWAP(OFF)])
700
Gavin Shan0bd78582015-03-17 16:15:07 +1100701static void eeh_restore_bridge_bars(struct eeh_dev *edev)
Gavin Shan652defe2013-06-27 13:46:43 +0800702{
703 int i;
704
705 /*
706 * Device BARs: 0x10 - 0x18
707 * Bus numbers and windows: 0x18 - 0x30
708 */
709 for (i = 4; i < 13; i++)
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000710 eeh_ops->write_config(edev, i*4, 4, edev->config_space[i]);
Gavin Shan652defe2013-06-27 13:46:43 +0800711 /* Rom: 0x38 */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000712 eeh_ops->write_config(edev, 14*4, 4, edev->config_space[14]);
Gavin Shan652defe2013-06-27 13:46:43 +0800713
714 /* Cache line & Latency timer: 0xC 0xD */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000715 eeh_ops->write_config(edev, PCI_CACHE_LINE_SIZE, 1,
Gavin Shan652defe2013-06-27 13:46:43 +0800716 SAVED_BYTE(PCI_CACHE_LINE_SIZE));
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000717 eeh_ops->write_config(edev, PCI_LATENCY_TIMER, 1,
718 SAVED_BYTE(PCI_LATENCY_TIMER));
Gavin Shan652defe2013-06-27 13:46:43 +0800719 /* Max latency, min grant, interrupt ping and line: 0x3C */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000720 eeh_ops->write_config(edev, 15*4, 4, edev->config_space[15]);
Gavin Shan652defe2013-06-27 13:46:43 +0800721
722 /* PCI Command: 0x4 */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000723 eeh_ops->write_config(edev, PCI_COMMAND, 4, edev->config_space[1] |
Michael Neuling13a83ea2018-04-11 13:37:58 +1000724 PCI_COMMAND_MEMORY | PCI_COMMAND_MASTER);
Gavin Shan652defe2013-06-27 13:46:43 +0800725
726 /* Check the PCIe link is ready */
Gavin Shan0bd78582015-03-17 16:15:07 +1100727 eeh_bridge_check_link(edev);
Gavin Shan652defe2013-06-27 13:46:43 +0800728}
729
Gavin Shan0bd78582015-03-17 16:15:07 +1100730static void eeh_restore_device_bars(struct eeh_dev *edev)
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000731{
732 int i;
733 u32 cmd;
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000734
735 for (i = 4; i < 10; i++)
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000736 eeh_ops->write_config(edev, i*4, 4, edev->config_space[i]);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000737 /* 12 == Expansion ROM Address */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000738 eeh_ops->write_config(edev, 12*4, 4, edev->config_space[12]);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000739
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000740 eeh_ops->write_config(edev, PCI_CACHE_LINE_SIZE, 1,
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000741 SAVED_BYTE(PCI_CACHE_LINE_SIZE));
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000742 eeh_ops->write_config(edev, PCI_LATENCY_TIMER, 1,
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000743 SAVED_BYTE(PCI_LATENCY_TIMER));
744
745 /* max latency, min grant, interrupt pin and line */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000746 eeh_ops->write_config(edev, 15*4, 4, edev->config_space[15]);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000747
748 /*
749 * Restore PERR & SERR bits, some devices require it,
750 * don't touch the other command bits
751 */
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000752 eeh_ops->read_config(edev, PCI_COMMAND, 4, &cmd);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000753 if (edev->config_space[1] & PCI_COMMAND_PARITY)
754 cmd |= PCI_COMMAND_PARITY;
755 else
756 cmd &= ~PCI_COMMAND_PARITY;
757 if (edev->config_space[1] & PCI_COMMAND_SERR)
758 cmd |= PCI_COMMAND_SERR;
759 else
760 cmd &= ~PCI_COMMAND_SERR;
Oliver O'Halloran17d2a482020-07-25 18:12:26 +1000761 eeh_ops->write_config(edev, PCI_COMMAND, 4, cmd);
Gavin Shan652defe2013-06-27 13:46:43 +0800762}
763
764/**
765 * eeh_restore_one_device_bars - Restore the Base Address Registers for one device
766 * @data: EEH device
767 * @flag: Unused
768 *
769 * Loads the PCI configuration space base address registers,
770 * the expansion ROM base address, the latency timer, and etc.
771 * from the saved values in the device node.
772 */
Sam Bobroffcef50c62019-08-16 14:48:15 +1000773static void eeh_restore_one_device_bars(struct eeh_dev *edev, void *flag)
Gavin Shan652defe2013-06-27 13:46:43 +0800774{
Gavin Shanf5c57712013-07-24 10:24:58 +0800775 /* Do special restore for bridges */
Gavin Shan4b83bd42013-07-24 10:24:59 +0800776 if (edev->mode & EEH_DEV_BRIDGE)
Gavin Shan0bd78582015-03-17 16:15:07 +1100777 eeh_restore_bridge_bars(edev);
Gavin Shan652defe2013-06-27 13:46:43 +0800778 else
Gavin Shan0bd78582015-03-17 16:15:07 +1100779 eeh_restore_device_bars(edev);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000780
Oliver O'Halloran0c2c7652020-07-25 18:12:24 +1000781 if (eeh_ops->restore_config)
782 eeh_ops->restore_config(edev);
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000783}
784
785/**
786 * eeh_pe_restore_bars - Restore the PCI config space info
787 * @pe: EEH PE
788 *
789 * This routine performs a recursive walk to the children
790 * of this device as well.
791 */
792void eeh_pe_restore_bars(struct eeh_pe *pe)
793{
Gavin Shanea812452012-09-11 19:16:18 +0000794 /*
795 * We needn't take the EEH lock since eeh_pe_dev_traverse()
796 * will take that.
797 */
Gavin Shan9e6d2cf2012-09-07 22:44:15 +0000798 eeh_pe_dev_traverse(pe, eeh_restore_one_device_bars, NULL);
799}
Gavin Shan9b3c76f2012-09-07 22:44:19 +0000800
801/**
Gavin Shan357b2f32014-06-11 18:26:44 +1000802 * eeh_pe_loc_get - Retrieve location code binding to the given PE
803 * @pe: EEH PE
804 *
805 * Retrieve the location code of the given PE. If the primary PE bus
806 * is root bus, we will grab location code from PHB device tree node
807 * or root port. Otherwise, the upstream bridge's device tree node
808 * of the primary PE bus will be checked for the location code.
809 */
810const char *eeh_pe_loc_get(struct eeh_pe *pe)
811{
Gavin Shan357b2f32014-06-11 18:26:44 +1000812 struct pci_bus *bus = eeh_pe_bus_get(pe);
Gavin Shan7e56f622015-12-02 16:25:32 +1100813 struct device_node *dn;
Mike Qiu9e5c6e52014-07-15 01:42:22 -0400814 const char *loc = NULL;
Gavin Shan357b2f32014-06-11 18:26:44 +1000815
Gavin Shan7e56f622015-12-02 16:25:32 +1100816 while (bus) {
817 dn = pci_bus_to_OF_node(bus);
818 if (!dn) {
819 bus = bus->parent;
820 continue;
821 }
Gavin Shan357b2f32014-06-11 18:26:44 +1000822
Gavin Shan7e56f622015-12-02 16:25:32 +1100823 if (pci_is_root_bus(bus))
Mike Qiu9e5c6e52014-07-15 01:42:22 -0400824 loc = of_get_property(dn, "ibm,io-base-loc-code", NULL);
Gavin Shan7e56f622015-12-02 16:25:32 +1100825 else
826 loc = of_get_property(dn, "ibm,slot-location-code",
827 NULL);
Gavin Shan357b2f32014-06-11 18:26:44 +1000828
Gavin Shan7e56f622015-12-02 16:25:32 +1100829 if (loc)
830 return loc;
831
832 bus = bus->parent;
Gavin Shan357b2f32014-06-11 18:26:44 +1000833 }
834
Gavin Shan7e56f622015-12-02 16:25:32 +1100835 return "N/A";
Gavin Shan357b2f32014-06-11 18:26:44 +1000836}
837
838/**
Gavin Shan9b3c76f2012-09-07 22:44:19 +0000839 * eeh_pe_bus_get - Retrieve PCI bus according to the given PE
840 * @pe: EEH PE
841 *
842 * Retrieve the PCI bus according to the given PE. Basically,
843 * there're 3 types of PEs: PHB/Bus/Device. For PHB PE, the
844 * primary PCI bus will be retrieved. The parent bus will be
845 * returned for BUS PE. However, we don't have associated PCI
846 * bus for DEVICE PE.
847 */
848struct pci_bus *eeh_pe_bus_get(struct eeh_pe *pe)
849{
Gavin Shan9b3c76f2012-09-07 22:44:19 +0000850 struct eeh_dev *edev;
851 struct pci_dev *pdev;
852
Gavin Shan4eb07992016-02-09 15:50:23 +1100853 if (pe->type & EEH_PE_PHB)
854 return pe->phb->bus;
Gavin Shan8cdb2832013-06-20 13:20:55 +0800855
Gavin Shan4eb07992016-02-09 15:50:23 +1100856 /* The primary bus might be cached during probe time */
857 if (pe->state & EEH_PE_PRI_BUS)
858 return pe->bus;
Gavin Shan9b3c76f2012-09-07 22:44:19 +0000859
Gavin Shan4eb07992016-02-09 15:50:23 +1100860 /* Retrieve the parent PCI bus of first (top) PCI device */
Sam Bobroff80e65b02018-09-12 11:23:26 +1000861 edev = list_first_entry_or_null(&pe->edevs, struct eeh_dev, entry);
Gavin Shan4eb07992016-02-09 15:50:23 +1100862 pdev = eeh_dev_to_pci_dev(edev);
863 if (pdev)
864 return pdev->bus;
865
866 return NULL;
Gavin Shan9b3c76f2012-09-07 22:44:19 +0000867}