eeh_pseries.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565
  1. /*
  2. * The file intends to implement the platform dependent EEH operations on pseries.
  3. * Actually, the pseries platform is built based on RTAS heavily. That means the
  4. * pseries platform dependent EEH operations will be built on RTAS calls. The functions
  5. * are devired from arch/powerpc/platforms/pseries/eeh.c and necessary cleanup has
  6. * been done.
  7. *
  8. * Copyright Benjamin Herrenschmidt & Gavin Shan, IBM Corporation 2011.
  9. * Copyright IBM Corporation 2001, 2005, 2006
  10. * Copyright Dave Engebretsen & Todd Inglett 2001
  11. * Copyright Linas Vepstas 2005, 2006
  12. *
  13. * This program is free software; you can redistribute it and/or modify
  14. * it under the terms of the GNU General Public License as published by
  15. * the Free Software Foundation; either version 2 of the License, or
  16. * (at your option) any later version.
  17. *
  18. * This program is distributed in the hope that it will be useful,
  19. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  20. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  21. * GNU General Public License for more details.
  22. *
  23. * You should have received a copy of the GNU General Public License
  24. * along with this program; if not, write to the Free Software
  25. * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  26. */
  27. #include <linux/atomic.h>
  28. #include <linux/delay.h>
  29. #include <linux/export.h>
  30. #include <linux/init.h>
  31. #include <linux/list.h>
  32. #include <linux/of.h>
  33. #include <linux/pci.h>
  34. #include <linux/proc_fs.h>
  35. #include <linux/rbtree.h>
  36. #include <linux/sched.h>
  37. #include <linux/seq_file.h>
  38. #include <linux/spinlock.h>
  39. #include <asm/eeh.h>
  40. #include <asm/eeh_event.h>
  41. #include <asm/io.h>
  42. #include <asm/machdep.h>
  43. #include <asm/ppc-pci.h>
  44. #include <asm/rtas.h>
  45. /* RTAS tokens */
  46. static int ibm_set_eeh_option;
  47. static int ibm_set_slot_reset;
  48. static int ibm_read_slot_reset_state;
  49. static int ibm_read_slot_reset_state2;
  50. static int ibm_slot_error_detail;
  51. static int ibm_get_config_addr_info;
  52. static int ibm_get_config_addr_info2;
  53. static int ibm_configure_bridge;
  54. static int ibm_configure_pe;
  55. /*
  56. * Buffer for reporting slot-error-detail rtas calls. Its here
  57. * in BSS, and not dynamically alloced, so that it ends up in
  58. * RMO where RTAS can access it.
  59. */
  60. static unsigned char slot_errbuf[RTAS_ERROR_LOG_MAX];
  61. static DEFINE_SPINLOCK(slot_errbuf_lock);
  62. static int eeh_error_buf_size;
  63. /**
  64. * pseries_eeh_init - EEH platform dependent initialization
  65. *
  66. * EEH platform dependent initialization on pseries.
  67. */
  68. static int pseries_eeh_init(void)
  69. {
  70. /* figure out EEH RTAS function call tokens */
  71. ibm_set_eeh_option = rtas_token("ibm,set-eeh-option");
  72. ibm_set_slot_reset = rtas_token("ibm,set-slot-reset");
  73. ibm_read_slot_reset_state2 = rtas_token("ibm,read-slot-reset-state2");
  74. ibm_read_slot_reset_state = rtas_token("ibm,read-slot-reset-state");
  75. ibm_slot_error_detail = rtas_token("ibm,slot-error-detail");
  76. ibm_get_config_addr_info2 = rtas_token("ibm,get-config-addr-info2");
  77. ibm_get_config_addr_info = rtas_token("ibm,get-config-addr-info");
  78. ibm_configure_pe = rtas_token("ibm,configure-pe");
  79. ibm_configure_bridge = rtas_token ("ibm,configure-bridge");
  80. /*
  81. * Necessary sanity check. We needn't check "get-config-addr-info"
  82. * and its variant since the old firmware probably support address
  83. * of domain/bus/slot/function for EEH RTAS operations.
  84. */
  85. if (ibm_set_eeh_option == RTAS_UNKNOWN_SERVICE) {
  86. pr_warning("%s: RTAS service <ibm,set-eeh-option> invalid\n",
  87. __func__);
  88. return -EINVAL;
  89. } else if (ibm_set_slot_reset == RTAS_UNKNOWN_SERVICE) {
  90. pr_warning("%s: RTAS service <ibm, set-slot-reset> invalid\n",
  91. __func__);
  92. return -EINVAL;
  93. } else if (ibm_read_slot_reset_state2 == RTAS_UNKNOWN_SERVICE &&
  94. ibm_read_slot_reset_state == RTAS_UNKNOWN_SERVICE) {
  95. pr_warning("%s: RTAS service <ibm,read-slot-reset-state2> and "
  96. "<ibm,read-slot-reset-state> invalid\n",
  97. __func__);
  98. return -EINVAL;
  99. } else if (ibm_slot_error_detail == RTAS_UNKNOWN_SERVICE) {
  100. pr_warning("%s: RTAS service <ibm,slot-error-detail> invalid\n",
  101. __func__);
  102. return -EINVAL;
  103. } else if (ibm_configure_pe == RTAS_UNKNOWN_SERVICE &&
  104. ibm_configure_bridge == RTAS_UNKNOWN_SERVICE) {
  105. pr_warning("%s: RTAS service <ibm,configure-pe> and "
  106. "<ibm,configure-bridge> invalid\n",
  107. __func__);
  108. return -EINVAL;
  109. }
  110. /* Initialize error log lock and size */
  111. spin_lock_init(&slot_errbuf_lock);
  112. eeh_error_buf_size = rtas_token("rtas-error-log-max");
  113. if (eeh_error_buf_size == RTAS_UNKNOWN_SERVICE) {
  114. pr_warning("%s: unknown EEH error log size\n",
  115. __func__);
  116. eeh_error_buf_size = 1024;
  117. } else if (eeh_error_buf_size > RTAS_ERROR_LOG_MAX) {
  118. pr_warning("%s: EEH error log size %d exceeds the maximal %d\n",
  119. __func__, eeh_error_buf_size, RTAS_ERROR_LOG_MAX);
  120. eeh_error_buf_size = RTAS_ERROR_LOG_MAX;
  121. }
  122. return 0;
  123. }
  124. /**
  125. * pseries_eeh_set_option - Initialize EEH or MMIO/DMA reenable
  126. * @dn: device node
  127. * @option: operation to be issued
  128. *
  129. * The function is used to control the EEH functionality globally.
  130. * Currently, following options are support according to PAPR:
  131. * Enable EEH, Disable EEH, Enable MMIO and Enable DMA
  132. */
  133. static int pseries_eeh_set_option(struct device_node *dn, int option)
  134. {
  135. int ret = 0;
  136. struct eeh_dev *edev;
  137. const u32 *reg;
  138. int config_addr;
  139. edev = of_node_to_eeh_dev(dn);
  140. /*
  141. * When we're enabling or disabling EEH functioality on
  142. * the particular PE, the PE config address is possibly
  143. * unavailable. Therefore, we have to figure it out from
  144. * the FDT node.
  145. */
  146. switch (option) {
  147. case EEH_OPT_DISABLE:
  148. case EEH_OPT_ENABLE:
  149. reg = of_get_property(dn, "reg", NULL);
  150. config_addr = reg[0];
  151. break;
  152. case EEH_OPT_THAW_MMIO:
  153. case EEH_OPT_THAW_DMA:
  154. config_addr = edev->config_addr;
  155. if (edev->pe_config_addr)
  156. config_addr = edev->pe_config_addr;
  157. break;
  158. default:
  159. pr_err("%s: Invalid option %d\n",
  160. __func__, option);
  161. return -EINVAL;
  162. }
  163. ret = rtas_call(ibm_set_eeh_option, 4, 1, NULL,
  164. config_addr, BUID_HI(edev->phb->buid),
  165. BUID_LO(edev->phb->buid), option);
  166. return ret;
  167. }
  168. /**
  169. * pseries_eeh_get_pe_addr - Retrieve PE address
  170. * @dn: device node
  171. *
  172. * Retrieve the assocated PE address. Actually, there're 2 RTAS
  173. * function calls dedicated for the purpose. We need implement
  174. * it through the new function and then the old one. Besides,
  175. * you should make sure the config address is figured out from
  176. * FDT node before calling the function.
  177. *
  178. * It's notable that zero'ed return value means invalid PE config
  179. * address.
  180. */
  181. static int pseries_eeh_get_pe_addr(struct device_node *dn)
  182. {
  183. struct eeh_dev *edev;
  184. int ret = 0;
  185. int rets[3];
  186. edev = of_node_to_eeh_dev(dn);
  187. if (ibm_get_config_addr_info2 != RTAS_UNKNOWN_SERVICE) {
  188. /*
  189. * First of all, we need to make sure there has one PE
  190. * associated with the device. Otherwise, PE address is
  191. * meaningless.
  192. */
  193. ret = rtas_call(ibm_get_config_addr_info2, 4, 2, rets,
  194. edev->config_addr, BUID_HI(edev->phb->buid),
  195. BUID_LO(edev->phb->buid), 1);
  196. if (ret || (rets[0] == 0))
  197. return 0;
  198. /* Retrieve the associated PE config address */
  199. ret = rtas_call(ibm_get_config_addr_info2, 4, 2, rets,
  200. edev->config_addr, BUID_HI(edev->phb->buid),
  201. BUID_LO(edev->phb->buid), 0);
  202. if (ret) {
  203. pr_warning("%s: Failed to get PE address for %s\n",
  204. __func__, dn->full_name);
  205. return 0;
  206. }
  207. return rets[0];
  208. }
  209. if (ibm_get_config_addr_info != RTAS_UNKNOWN_SERVICE) {
  210. ret = rtas_call(ibm_get_config_addr_info, 4, 2, rets,
  211. edev->config_addr, BUID_HI(edev->phb->buid),
  212. BUID_LO(edev->phb->buid), 0);
  213. if (ret) {
  214. pr_warning("%s: Failed to get PE address for %s\n",
  215. __func__, dn->full_name);
  216. return 0;
  217. }
  218. return rets[0];
  219. }
  220. return ret;
  221. }
  222. /**
  223. * pseries_eeh_get_state - Retrieve PE state
  224. * @dn: PE associated device node
  225. * @state: return value
  226. *
  227. * Retrieve the state of the specified PE. On RTAS compliant
  228. * pseries platform, there already has one dedicated RTAS function
  229. * for the purpose. It's notable that the associated PE config address
  230. * might be ready when calling the function. Therefore, endeavour to
  231. * use the PE config address if possible. Further more, there're 2
  232. * RTAS calls for the purpose, we need to try the new one and back
  233. * to the old one if the new one couldn't work properly.
  234. */
  235. static int pseries_eeh_get_state(struct device_node *dn, int *state)
  236. {
  237. struct eeh_dev *edev;
  238. int config_addr;
  239. int ret;
  240. int rets[4];
  241. int result;
  242. /* Figure out PE config address if possible */
  243. edev = of_node_to_eeh_dev(dn);
  244. config_addr = edev->config_addr;
  245. if (edev->pe_config_addr)
  246. config_addr = edev->pe_config_addr;
  247. if (ibm_read_slot_reset_state2 != RTAS_UNKNOWN_SERVICE) {
  248. ret = rtas_call(ibm_read_slot_reset_state2, 3, 4, rets,
  249. config_addr, BUID_HI(edev->phb->buid),
  250. BUID_LO(edev->phb->buid));
  251. } else if (ibm_read_slot_reset_state != RTAS_UNKNOWN_SERVICE) {
  252. /* Fake PE unavailable info */
  253. rets[2] = 0;
  254. ret = rtas_call(ibm_read_slot_reset_state, 3, 3, rets,
  255. config_addr, BUID_HI(edev->phb->buid),
  256. BUID_LO(edev->phb->buid));
  257. } else {
  258. return EEH_STATE_NOT_SUPPORT;
  259. }
  260. if (ret)
  261. return ret;
  262. /* Parse the result out */
  263. result = 0;
  264. if (rets[1]) {
  265. switch(rets[0]) {
  266. case 0:
  267. result &= ~EEH_STATE_RESET_ACTIVE;
  268. result |= EEH_STATE_MMIO_ACTIVE;
  269. result |= EEH_STATE_DMA_ACTIVE;
  270. break;
  271. case 1:
  272. result |= EEH_STATE_RESET_ACTIVE;
  273. result |= EEH_STATE_MMIO_ACTIVE;
  274. result |= EEH_STATE_DMA_ACTIVE;
  275. break;
  276. case 2:
  277. result &= ~EEH_STATE_RESET_ACTIVE;
  278. result &= ~EEH_STATE_MMIO_ACTIVE;
  279. result &= ~EEH_STATE_DMA_ACTIVE;
  280. break;
  281. case 4:
  282. result &= ~EEH_STATE_RESET_ACTIVE;
  283. result &= ~EEH_STATE_MMIO_ACTIVE;
  284. result &= ~EEH_STATE_DMA_ACTIVE;
  285. result |= EEH_STATE_MMIO_ENABLED;
  286. break;
  287. case 5:
  288. if (rets[2]) {
  289. if (state) *state = rets[2];
  290. result = EEH_STATE_UNAVAILABLE;
  291. } else {
  292. result = EEH_STATE_NOT_SUPPORT;
  293. }
  294. break;
  295. default:
  296. result = EEH_STATE_NOT_SUPPORT;
  297. }
  298. } else {
  299. result = EEH_STATE_NOT_SUPPORT;
  300. }
  301. return result;
  302. }
  303. /**
  304. * pseries_eeh_reset - Reset the specified PE
  305. * @dn: PE associated device node
  306. * @option: reset option
  307. *
  308. * Reset the specified PE
  309. */
  310. static int pseries_eeh_reset(struct device_node *dn, int option)
  311. {
  312. struct eeh_dev *edev;
  313. int config_addr;
  314. int ret;
  315. /* Figure out PE address */
  316. edev = of_node_to_eeh_dev(dn);
  317. config_addr = edev->config_addr;
  318. if (edev->pe_config_addr)
  319. config_addr = edev->pe_config_addr;
  320. /* Reset PE through RTAS call */
  321. ret = rtas_call(ibm_set_slot_reset, 4, 1, NULL,
  322. config_addr, BUID_HI(edev->phb->buid),
  323. BUID_LO(edev->phb->buid), option);
  324. /* If fundamental-reset not supported, try hot-reset */
  325. if (option == EEH_RESET_FUNDAMENTAL &&
  326. ret == -8) {
  327. ret = rtas_call(ibm_set_slot_reset, 4, 1, NULL,
  328. config_addr, BUID_HI(edev->phb->buid),
  329. BUID_LO(edev->phb->buid), EEH_RESET_HOT);
  330. }
  331. return ret;
  332. }
  333. /**
  334. * pseries_eeh_wait_state - Wait for PE state
  335. * @dn: PE associated device node
  336. * @max_wait: maximal period in microsecond
  337. *
  338. * Wait for the state of associated PE. It might take some time
  339. * to retrieve the PE's state.
  340. */
  341. static int pseries_eeh_wait_state(struct device_node *dn, int max_wait)
  342. {
  343. int ret;
  344. int mwait;
  345. /*
  346. * According to PAPR, the state of PE might be temporarily
  347. * unavailable. Under the circumstance, we have to wait
  348. * for indicated time determined by firmware. The maximal
  349. * wait time is 5 minutes, which is acquired from the original
  350. * EEH implementation. Also, the original implementation
  351. * also defined the minimal wait time as 1 second.
  352. */
  353. #define EEH_STATE_MIN_WAIT_TIME (1000)
  354. #define EEH_STATE_MAX_WAIT_TIME (300 * 1000)
  355. while (1) {
  356. ret = pseries_eeh_get_state(dn, &mwait);
  357. /*
  358. * If the PE's state is temporarily unavailable,
  359. * we have to wait for the specified time. Otherwise,
  360. * the PE's state will be returned immediately.
  361. */
  362. if (ret != EEH_STATE_UNAVAILABLE)
  363. return ret;
  364. if (max_wait <= 0) {
  365. pr_warning("%s: Timeout when getting PE's state (%d)\n",
  366. __func__, max_wait);
  367. return EEH_STATE_NOT_SUPPORT;
  368. }
  369. if (mwait <= 0) {
  370. pr_warning("%s: Firmware returned bad wait value %d\n",
  371. __func__, mwait);
  372. mwait = EEH_STATE_MIN_WAIT_TIME;
  373. } else if (mwait > EEH_STATE_MAX_WAIT_TIME) {
  374. pr_warning("%s: Firmware returned too long wait value %d\n",
  375. __func__, mwait);
  376. mwait = EEH_STATE_MAX_WAIT_TIME;
  377. }
  378. max_wait -= mwait;
  379. msleep(mwait);
  380. }
  381. return EEH_STATE_NOT_SUPPORT;
  382. }
  383. /**
  384. * pseries_eeh_get_log - Retrieve error log
  385. * @dn: device node
  386. * @severity: temporary or permanent error log
  387. * @drv_log: driver log to be combined with retrieved error log
  388. * @len: length of driver log
  389. *
  390. * Retrieve the temporary or permanent error from the PE.
  391. * Actually, the error will be retrieved through the dedicated
  392. * RTAS call.
  393. */
  394. static int pseries_eeh_get_log(struct device_node *dn, int severity, char *drv_log, unsigned long len)
  395. {
  396. struct eeh_dev *edev;
  397. int config_addr;
  398. unsigned long flags;
  399. int ret;
  400. edev = of_node_to_eeh_dev(dn);
  401. spin_lock_irqsave(&slot_errbuf_lock, flags);
  402. memset(slot_errbuf, 0, eeh_error_buf_size);
  403. /* Figure out the PE address */
  404. config_addr = edev->config_addr;
  405. if (edev->pe_config_addr)
  406. config_addr = edev->pe_config_addr;
  407. ret = rtas_call(ibm_slot_error_detail, 8, 1, NULL, config_addr,
  408. BUID_HI(edev->phb->buid), BUID_LO(edev->phb->buid),
  409. virt_to_phys(drv_log), len,
  410. virt_to_phys(slot_errbuf), eeh_error_buf_size,
  411. severity);
  412. if (!ret)
  413. log_error(slot_errbuf, ERR_TYPE_RTAS_LOG, 0);
  414. spin_unlock_irqrestore(&slot_errbuf_lock, flags);
  415. return ret;
  416. }
  417. /**
  418. * pseries_eeh_configure_bridge - Configure PCI bridges in the indicated PE
  419. * @dn: PE associated device node
  420. *
  421. * The function will be called to reconfigure the bridges included
  422. * in the specified PE so that the mulfunctional PE would be recovered
  423. * again.
  424. */
  425. static int pseries_eeh_configure_bridge(struct device_node *dn)
  426. {
  427. struct eeh_dev *edev;
  428. int config_addr;
  429. int ret;
  430. /* Figure out the PE address */
  431. edev = of_node_to_eeh_dev(dn);
  432. config_addr = edev->config_addr;
  433. if (edev->pe_config_addr)
  434. config_addr = edev->pe_config_addr;
  435. /* Use new configure-pe function, if supported */
  436. if (ibm_configure_pe != RTAS_UNKNOWN_SERVICE) {
  437. ret = rtas_call(ibm_configure_pe, 3, 1, NULL,
  438. config_addr, BUID_HI(edev->phb->buid),
  439. BUID_LO(edev->phb->buid));
  440. } else if (ibm_configure_bridge != RTAS_UNKNOWN_SERVICE) {
  441. ret = rtas_call(ibm_configure_bridge, 3, 1, NULL,
  442. config_addr, BUID_HI(edev->phb->buid),
  443. BUID_LO(edev->phb->buid));
  444. } else {
  445. return -EFAULT;
  446. }
  447. if (ret)
  448. pr_warning("%s: Unable to configure bridge %d for %s\n",
  449. __func__, ret, dn->full_name);
  450. return ret;
  451. }
  452. /**
  453. * pseries_eeh_read_config - Read PCI config space
  454. * @dn: device node
  455. * @where: PCI address
  456. * @size: size to read
  457. * @val: return value
  458. *
  459. * Read config space from the speicifed device
  460. */
  461. static int pseries_eeh_read_config(struct device_node *dn, int where, int size, u32 *val)
  462. {
  463. struct pci_dn *pdn;
  464. pdn = PCI_DN(dn);
  465. return rtas_read_config(pdn, where, size, val);
  466. }
  467. /**
  468. * pseries_eeh_write_config - Write PCI config space
  469. * @dn: device node
  470. * @where: PCI address
  471. * @size: size to write
  472. * @val: value to be written
  473. *
  474. * Write config space to the specified device
  475. */
  476. static int pseries_eeh_write_config(struct device_node *dn, int where, int size, u32 val)
  477. {
  478. struct pci_dn *pdn;
  479. pdn = PCI_DN(dn);
  480. return rtas_write_config(pdn, where, size, val);
  481. }
  482. static struct eeh_ops pseries_eeh_ops = {
  483. .name = "pseries",
  484. .init = pseries_eeh_init,
  485. .set_option = pseries_eeh_set_option,
  486. .get_pe_addr = pseries_eeh_get_pe_addr,
  487. .get_state = pseries_eeh_get_state,
  488. .reset = pseries_eeh_reset,
  489. .wait_state = pseries_eeh_wait_state,
  490. .get_log = pseries_eeh_get_log,
  491. .configure_bridge = pseries_eeh_configure_bridge,
  492. .read_config = pseries_eeh_read_config,
  493. .write_config = pseries_eeh_write_config
  494. };
  495. /**
  496. * eeh_pseries_init - Register platform dependent EEH operations
  497. *
  498. * EEH initialization on pseries platform. This function should be
  499. * called before any EEH related functions.
  500. */
  501. int __init eeh_pseries_init(void)
  502. {
  503. return eeh_ops_register(&pseries_eeh_ops);
  504. }