bte.h 7.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236
  1. /*
  2. * This file is subject to the terms and conditions of the GNU General Public
  3. * License. See the file "COPYING" in the main directory of this archive
  4. * for more details.
  5. *
  6. * Copyright (c) 2000-2007 Silicon Graphics, Inc. All Rights Reserved.
  7. */
  8. #ifndef _ASM_IA64_SN_BTE_H
  9. #define _ASM_IA64_SN_BTE_H
  10. #include <linux/timer.h>
  11. #include <linux/spinlock.h>
  12. #include <linux/cache.h>
  13. #include <asm/sn/pda.h>
  14. #include <asm/sn/types.h>
  15. #include <asm/sn/shub_mmr.h>
  16. struct nodepda_s;
  17. #define IBCT_NOTIFY (0x1UL << 4)
  18. #define IBCT_ZFIL_MODE (0x1UL << 0)
  19. /* #define BTE_DEBUG */
  20. /* #define BTE_DEBUG_VERBOSE */
  21. #ifdef BTE_DEBUG
  22. # define BTE_PRINTK(x) printk x /* Terse */
  23. # ifdef BTE_DEBUG_VERBOSE
  24. # define BTE_PRINTKV(x) printk x /* Verbose */
  25. # else
  26. # define BTE_PRINTKV(x)
  27. # endif /* BTE_DEBUG_VERBOSE */
  28. #else
  29. # define BTE_PRINTK(x)
  30. # define BTE_PRINTKV(x)
  31. #endif /* BTE_DEBUG */
  32. /* BTE status register only supports 16 bits for length field */
  33. #define BTE_LEN_BITS (16)
  34. #define BTE_LEN_MASK ((1 << BTE_LEN_BITS) - 1)
  35. #define BTE_MAX_XFER (BTE_LEN_MASK << L1_CACHE_SHIFT)
  36. /* Define hardware */
  37. #define BTES_PER_NODE (is_shub2() ? 4 : 2)
  38. #define MAX_BTES_PER_NODE 4
  39. #define BTE2OFF_CTRL 0
  40. #define BTE2OFF_SRC (SH2_BT_ENG_SRC_ADDR_0 - SH2_BT_ENG_CSR_0)
  41. #define BTE2OFF_DEST (SH2_BT_ENG_DEST_ADDR_0 - SH2_BT_ENG_CSR_0)
  42. #define BTE2OFF_NOTIFY (SH2_BT_ENG_NOTIF_ADDR_0 - SH2_BT_ENG_CSR_0)
  43. #define BTE_BASE_ADDR(interface) \
  44. (is_shub2() ? (interface == 0) ? SH2_BT_ENG_CSR_0 : \
  45. (interface == 1) ? SH2_BT_ENG_CSR_1 : \
  46. (interface == 2) ? SH2_BT_ENG_CSR_2 : \
  47. SH2_BT_ENG_CSR_3 \
  48. : (interface == 0) ? IIO_IBLS0 : IIO_IBLS1)
  49. #define BTE_SOURCE_ADDR(base) \
  50. (is_shub2() ? base + (BTE2OFF_SRC/8) \
  51. : base + (BTEOFF_SRC/8))
  52. #define BTE_DEST_ADDR(base) \
  53. (is_shub2() ? base + (BTE2OFF_DEST/8) \
  54. : base + (BTEOFF_DEST/8))
  55. #define BTE_CTRL_ADDR(base) \
  56. (is_shub2() ? base + (BTE2OFF_CTRL/8) \
  57. : base + (BTEOFF_CTRL/8))
  58. #define BTE_NOTIF_ADDR(base) \
  59. (is_shub2() ? base + (BTE2OFF_NOTIFY/8) \
  60. : base + (BTEOFF_NOTIFY/8))
  61. /* Define hardware modes */
  62. #define BTE_NOTIFY IBCT_NOTIFY
  63. #define BTE_NORMAL BTE_NOTIFY
  64. #define BTE_ZERO_FILL (BTE_NOTIFY | IBCT_ZFIL_MODE)
  65. /* Use a reserved bit to let the caller specify a wait for any BTE */
  66. #define BTE_WACQUIRE 0x4000
  67. /* Use the BTE on the node with the destination memory */
  68. #define BTE_USE_DEST (BTE_WACQUIRE << 1)
  69. /* Use any available BTE interface on any node for the transfer */
  70. #define BTE_USE_ANY (BTE_USE_DEST << 1)
  71. /* macro to force the IBCT0 value valid */
  72. #define BTE_VALID_MODE(x) ((x) & (IBCT_NOTIFY | IBCT_ZFIL_MODE))
  73. #define BTE_ACTIVE (IBLS_BUSY | IBLS_ERROR)
  74. #define BTE_WORD_AVAILABLE (IBLS_BUSY << 1)
  75. #define BTE_WORD_BUSY (~BTE_WORD_AVAILABLE)
  76. /*
  77. * Some macros to simplify reading.
  78. * Start with macros to locate the BTE control registers.
  79. */
  80. #define BTE_LNSTAT_LOAD(_bte) \
  81. HUB_L(_bte->bte_base_addr)
  82. #define BTE_LNSTAT_STORE(_bte, _x) \
  83. HUB_S(_bte->bte_base_addr, (_x))
  84. #define BTE_SRC_STORE(_bte, _x) \
  85. ({ \
  86. u64 __addr = ((_x) & ~AS_MASK); \
  87. if (is_shub2()) \
  88. __addr = SH2_TIO_PHYS_TO_DMA(__addr); \
  89. HUB_S(_bte->bte_source_addr, __addr); \
  90. })
  91. #define BTE_DEST_STORE(_bte, _x) \
  92. ({ \
  93. u64 __addr = ((_x) & ~AS_MASK); \
  94. if (is_shub2()) \
  95. __addr = SH2_TIO_PHYS_TO_DMA(__addr); \
  96. HUB_S(_bte->bte_destination_addr, __addr); \
  97. })
  98. #define BTE_CTRL_STORE(_bte, _x) \
  99. HUB_S(_bte->bte_control_addr, (_x))
  100. #define BTE_NOTIF_STORE(_bte, _x) \
  101. ({ \
  102. u64 __addr = ia64_tpa((_x) & ~AS_MASK); \
  103. if (is_shub2()) \
  104. __addr = SH2_TIO_PHYS_TO_DMA(__addr); \
  105. HUB_S(_bte->bte_notify_addr, __addr); \
  106. })
  107. #define BTE_START_TRANSFER(_bte, _len, _mode) \
  108. is_shub2() ? BTE_CTRL_STORE(_bte, IBLS_BUSY | (_mode << 24) | _len) \
  109. : BTE_LNSTAT_STORE(_bte, _len); \
  110. BTE_CTRL_STORE(_bte, _mode)
  111. /* Possible results from bte_copy and bte_unaligned_copy */
  112. /* The following error codes map into the BTE hardware codes
  113. * IIO_ICRB_ECODE_* (in shubio.h). The hardware uses
  114. * an error code of 0 (IIO_ICRB_ECODE_DERR), but we want zero
  115. * to mean BTE_SUCCESS, so add one (BTEFAIL_OFFSET) to the error
  116. * codes to give the following error codes.
  117. */
  118. #define BTEFAIL_OFFSET 1
  119. typedef enum {
  120. BTE_SUCCESS, /* 0 is success */
  121. BTEFAIL_DIR, /* Directory error due to IIO access*/
  122. BTEFAIL_POISON, /* poison error on IO access (write to poison page) */
  123. BTEFAIL_WERR, /* Write error (ie WINV to a Read only line) */
  124. BTEFAIL_ACCESS, /* access error (protection violation) */
  125. BTEFAIL_PWERR, /* Partial Write Error */
  126. BTEFAIL_PRERR, /* Partial Read Error */
  127. BTEFAIL_TOUT, /* CRB Time out */
  128. BTEFAIL_XTERR, /* Incoming xtalk pkt had error bit */
  129. BTEFAIL_NOTAVAIL, /* BTE not available */
  130. } bte_result_t;
  131. #define BTEFAIL_SH2_RESP_SHORT 0x1 /* bit 000001 */
  132. #define BTEFAIL_SH2_RESP_LONG 0x2 /* bit 000010 */
  133. #define BTEFAIL_SH2_RESP_DSP 0x4 /* bit 000100 */
  134. #define BTEFAIL_SH2_RESP_ACCESS 0x8 /* bit 001000 */
  135. #define BTEFAIL_SH2_CRB_TO 0x10 /* bit 010000 */
  136. #define BTEFAIL_SH2_NACK_LIMIT 0x20 /* bit 100000 */
  137. #define BTEFAIL_SH2_ALL 0x3F /* bit 111111 */
  138. #define BTE_ERR_BITS 0x3FUL
  139. #define BTE_ERR_SHIFT 36
  140. #define BTE_ERR_MASK (BTE_ERR_BITS << BTE_ERR_SHIFT)
  141. #define BTE_ERROR_RETRY(value) \
  142. (is_shub2() ? (value != BTEFAIL_SH2_CRB_TO) \
  143. : (value != BTEFAIL_TOUT))
  144. /*
  145. * On shub1 BTE_ERR_MASK will always be false, so no need for is_shub2()
  146. */
  147. #define BTE_SHUB2_ERROR(_status) \
  148. ((_status & BTE_ERR_MASK) \
  149. ? (((_status >> BTE_ERR_SHIFT) & BTE_ERR_BITS) | IBLS_ERROR) \
  150. : _status)
  151. #define BTE_GET_ERROR_STATUS(_status) \
  152. (BTE_SHUB2_ERROR(_status) & ~IBLS_ERROR)
  153. #define BTE_VALID_SH2_ERROR(value) \
  154. ((value >= BTEFAIL_SH2_RESP_SHORT) && (value <= BTEFAIL_SH2_ALL))
  155. /*
  156. * Structure defining a bte. An instance of this
  157. * structure is created in the nodepda for each
  158. * bte on that node (as defined by BTES_PER_NODE)
  159. * This structure contains everything necessary
  160. * to work with a BTE.
  161. */
  162. struct bteinfo_s {
  163. volatile u64 notify ____cacheline_aligned;
  164. u64 *bte_base_addr ____cacheline_aligned;
  165. u64 *bte_source_addr;
  166. u64 *bte_destination_addr;
  167. u64 *bte_control_addr;
  168. u64 *bte_notify_addr;
  169. spinlock_t spinlock;
  170. cnodeid_t bte_cnode; /* cnode */
  171. int bte_error_count; /* Number of errors encountered */
  172. int bte_num; /* 0 --> BTE0, 1 --> BTE1 */
  173. int cleanup_active; /* Interface is locked for cleanup */
  174. volatile bte_result_t bh_error; /* error while processing */
  175. volatile u64 *most_rcnt_na;
  176. struct bteinfo_s *btes_to_try[MAX_BTES_PER_NODE];
  177. };
  178. /*
  179. * Function prototypes (functions defined in bte.c, used elsewhere)
  180. */
  181. extern bte_result_t bte_copy(u64, u64, u64, u64, void *);
  182. extern bte_result_t bte_unaligned_copy(u64, u64, u64, u64);
  183. extern void bte_error_handler(struct nodepda_s *);
  184. #define bte_zero(dest, len, mode, notification) \
  185. bte_copy(0, dest, len, ((mode) | BTE_ZERO_FILL), notification)
  186. /*
  187. * The following is the preferred way of calling bte_unaligned_copy
  188. * If the copy is fully cache line aligned, then bte_copy is
  189. * used instead. Since bte_copy is inlined, this saves a call
  190. * stack. NOTE: bte_copy is called synchronously and does block
  191. * until the transfer is complete. In order to get the asynch
  192. * version of bte_copy, you must perform this check yourself.
  193. */
  194. #define BTE_UNALIGNED_COPY(src, dest, len, mode) \
  195. (((len & (L1_CACHE_BYTES - 1)) || \
  196. (src & (L1_CACHE_BYTES - 1)) || \
  197. (dest & (L1_CACHE_BYTES - 1))) ? \
  198. bte_unaligned_copy(src, dest, len, mode) : \
  199. bte_copy(src, dest, len, mode, NULL))
  200. #endif /* _ASM_IA64_SN_BTE_H */