uv_bau.h 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331
  1. /*
  2. * This file is subject to the terms and conditions of the GNU General Public
  3. * License. See the file "COPYING" in the main directory of this archive
  4. * for more details.
  5. *
  6. * SGI UV Broadcast Assist Unit definitions
  7. *
  8. * Copyright (C) 2008 Silicon Graphics, Inc. All rights reserved.
  9. */
  10. #ifndef __ASM_X86_UV_BAU__
  11. #define __ASM_X86_UV_BAU__
  12. #include <linux/bitmap.h>
  13. #define BITSPERBYTE 8
  14. /* Broadcast Assist Unit messaging structures */
  15. /*
  16. * Selective Broadcast activations are induced by software action
  17. * specifying a particular 8-descriptor "set" via a 6-bit index written
  18. * to an MMR.
  19. * Thus there are 64 unique 512-byte sets of SB descriptors - one set for
  20. * each 6-bit index value. These descriptor sets are mapped in sequence
  21. * starting with set 0 located at the address specified in the
  22. * BAU_SB_DESCRIPTOR_BASE register, set 1 is located at BASE + 512,
  23. * set 2 is at BASE + 2*512, set 3 at BASE + 3*512, and so on.
  24. *
  25. * We will use 31 sets, one for sending BAU messages from each of the 32
  26. * cpu's on the node.
  27. *
  28. * TLB shootdown will use the first of the 8 descriptors of each set.
  29. * Each of the descriptors is 64 bytes in size (8*64 = 512 bytes in a set).
  30. */
  31. #define UV_ITEMS_PER_DESCRIPTOR 8
  32. #define UV_CPUS_PER_ACT_STATUS 32
  33. #define UV_ACT_STATUS_MASK 0x3
  34. #define UV_ACT_STATUS_SIZE 2
  35. #define UV_ACTIVATION_DESCRIPTOR_SIZE 32
  36. #define UV_DISTRIBUTION_SIZE 256
  37. #define UV_SW_ACK_NPENDING 8
  38. #define UV_BAU_MESSAGE 200 /* Messaging irq; see irq_64.h */
  39. /* and include/asm-x86/hw_irq_64.h */
  40. /* To be dynamically allocated in the future */
  41. #define UV_NET_ENDPOINT_INTD 0x38
  42. #define UV_DESC_BASE_PNODE_SHIFT 49 /* position of pnode (nasid>>1) in MMR */
  43. #define UV_PAYLOADQ_PNODE_SHIFT 49
  44. #define UV_PTC_BASENAME "sgi_uv/ptc_statistics"
  45. #define uv_physnodeaddr(x) ((__pa((unsigned long)(x)) & uv_mmask))
  46. /* bits in UVH_LB_BAU_SB_ACTIVATION_STATUS_0/1 */
  47. #define DESC_STATUS_IDLE 0
  48. #define DESC_STATUS_ACTIVE 1
  49. #define DESC_STATUS_DESTINATION_TIMEOUT 2
  50. #define DESC_STATUS_SOURCE_TIMEOUT 3
  51. /* source side threshholds at which message retries print a warning */
  52. #define SOURCE_TIMEOUT_LIMIT 20
  53. #define DESTINATION_TIMEOUT_LIMIT 20
  54. /* number of entries in the destination side payload queue */
  55. #define DESTINATION_PAYLOAD_QUEUE_SIZE 17
  56. /* number of destination side software ack resources */
  57. #define DESTINATION_NUM_RESOURCES 8
  58. #define MAX_CPUS_PER_NODE 32
  59. /* Distribution: 32 bytes (256 bits) (bytes 0-0x1f of descriptor) */
  60. /* If the 'multilevel' flag in the header portion of the descriptor
  61. * has been set to 0, then endpoint multi-unicast mode is selected.
  62. * The distribution specification (32 bytes) is interpreted as a 256-bit
  63. * distribution vector. Adjacent bits correspond to consecutive even numbered
  64. * nodeIDs. The result of adding the index of a given bit to the 15-bit
  65. * 'base_dest_nodeid' field of the header corresponds to the
  66. * destination nodeID associated with that specified bit. */
  67. struct bau_target_nodemask {
  68. unsigned long bits[BITS_TO_LONGS(256)];
  69. };
  70. /* mask of cpu's on a node */
  71. /* (during initialization we need to check that unsigned long has
  72. enough bits for max. cpu's per node) */
  73. struct bau_local_cpumask {
  74. unsigned long bits;
  75. };
  76. /*
  77. * Payload: 16 bytes (128 bits) (bytes 0x20-0x2f of descriptor)
  78. * only 12 bytes (96 bits) of the payload area are usable.
  79. * An additional 3 bytes (bits 27:4) of the header address are carried
  80. * to the next bytes of the destination payload queue.
  81. * And an additional 2 bytes of the header Suppl_A field are also
  82. * carried to the destination payload queue.
  83. * But the first byte of the Suppl_A becomes bits 127:120 (the 16th byte)
  84. * of the destination payload queue, which is written by the hardware
  85. * with the s/w ack resource bit vector.
  86. * [ effective message contents (16 bytes (128 bits) maximum), not counting
  87. * the s/w ack bit vector ]
  88. */
  89. /* The payload is software-defined for INTD transactions */
  90. struct bau_msg_payload {
  91. unsigned long address; /* signifies a page or all TLB's
  92. of the cpu */
  93. /* 64 bits */
  94. unsigned short sending_cpu; /* filled in by sender */
  95. /* 16 bits */
  96. unsigned short acknowledge_count;/* filled in by destination */
  97. /* 16 bits */
  98. unsigned int reserved1:32; /* not usable */
  99. };
  100. /* Message header: 16 bytes (128 bits) (bytes 0x30-0x3f of descriptor) */
  101. /* see table 4.2.3.0.1 in broacast_assist spec. */
  102. struct bau_msg_header {
  103. int dest_subnodeid:6; /* must be zero */
  104. /* bits 5:0 */
  105. int base_dest_nodeid:15; /* nasid>>1 (pnode) of first bit in node_map */
  106. /* bits 20:6 */
  107. int command:8; /* message type */
  108. /* bits 28:21 */
  109. /* 0x38: SN3net EndPoint Message */
  110. int rsvd_1:3; /* must be zero */
  111. /* bits 31:29 */
  112. /* int will align on 32 bits */
  113. int rsvd_2:9; /* must be zero */
  114. /* bits 40:32 */
  115. /* Suppl_A is 56-41 */
  116. int payload_2a:8; /* becomes byte 16 of msg */
  117. /* bits 48:41 */ /* not currently using */
  118. int payload_2b:8; /* becomes byte 17 of msg */
  119. /* bits 56:49 */ /* not currently using */
  120. /* Address field (96:57) is never used as an
  121. address (these are address bits 42:3) */
  122. int rsvd_3:1; /* must be zero */
  123. /* bit 57 */
  124. /* address bits 27:4 are payload */
  125. /* these 24 bits become bytes 12-14 of msg */
  126. int replied_to:1; /* sent as 0 by the source to byte 12 */
  127. /* bit 58 */
  128. int payload_1a:5; /* not currently used */
  129. /* bits 63:59 */
  130. int payload_1b:8; /* not currently used */
  131. /* bits 71:64 */
  132. int payload_1c:8; /* not currently used */
  133. /* bits 79:72 */
  134. int payload_1d:2; /* not currently used */
  135. /* bits 81:80 */
  136. int rsvd_4:7; /* must be zero */
  137. /* bits 88:82 */
  138. int sw_ack_flag:1; /* software acknowledge flag */
  139. /* bit 89 */
  140. /* INTD trasactions at destination are to
  141. wait for software acknowledge */
  142. int rsvd_5:6; /* must be zero */
  143. /* bits 95:90 */
  144. int rsvd_6:5; /* must be zero */
  145. /* bits 100:96 */
  146. int int_both:1; /* if 1, interrupt both sockets on the blade */
  147. /* bit 101*/
  148. int fairness:3; /* usually zero */
  149. /* bits 104:102 */
  150. int multilevel:1; /* multi-level multicast format */
  151. /* bit 105 */
  152. /* 0 for TLB: endpoint multi-unicast messages */
  153. int chaining:1; /* next descriptor is part of this activation*/
  154. /* bit 106 */
  155. int rsvd_7:21; /* must be zero */
  156. /* bits 127:107 */
  157. };
  158. /* The format of the message to send, plus all accompanying control */
  159. /* Should be 64 bytes */
  160. struct bau_activation_descriptor {
  161. struct bau_target_nodemask distribution;
  162. /* message template, consisting of header and payload: */
  163. struct bau_msg_header header;
  164. struct bau_msg_payload payload;
  165. };
  166. /*
  167. * -payload-- ---------header------
  168. * bytes 0-11 bits 41-56 bits 58-81
  169. * A B (2) C (3)
  170. *
  171. * A/B/C are moved to:
  172. * A C B
  173. * bytes 0-11 bytes 12-14 bytes 16-17 (byte 15 filled in by hw as vector)
  174. * ------------payload queue-----------
  175. */
  176. /*
  177. * The payload queue on the destination side is an array of these.
  178. * With BAU_MISC_CONTROL set for software acknowledge mode, the messages
  179. * are 32 bytes (2 micropackets) (256 bits) in length, but contain only 17
  180. * bytes of usable data, including the sw ack vector in byte 15 (bits 127:120)
  181. * (12 bytes come from bau_msg_payload, 3 from payload_1, 2 from
  182. * sw_ack_vector and payload_2)
  183. * "Enabling Software Acknowledgment mode (see Section 4.3.3 Software
  184. * Acknowledge Processing) also selects 32 byte (17 bytes usable) payload
  185. * operation."
  186. */
  187. struct bau_payload_queue_entry {
  188. unsigned long address; /* signifies a page or all TLB's
  189. of the cpu */
  190. /* 64 bits, bytes 0-7 */
  191. unsigned short sending_cpu; /* cpu that sent the message */
  192. /* 16 bits, bytes 8-9 */
  193. unsigned short acknowledge_count; /* filled in by destination */
  194. /* 16 bits, bytes 10-11 */
  195. unsigned short replied_to:1; /* sent as 0 by the source */
  196. /* 1 bit */
  197. unsigned short unused1:7; /* not currently using */
  198. /* 7 bits: byte 12) */
  199. unsigned char unused2[2]; /* not currently using */
  200. /* bytes 13-14 */
  201. unsigned char sw_ack_vector; /* filled in by the hardware */
  202. /* byte 15 (bits 127:120) */
  203. unsigned char unused4[3]; /* not currently using bytes 17-19 */
  204. /* bytes 17-19 */
  205. int number_of_cpus; /* filled in at destination */
  206. /* 32 bits, bytes 20-23 (aligned) */
  207. unsigned char unused5[8]; /* not using */
  208. /* bytes 24-31 */
  209. };
  210. /* one for every slot in the destination payload queue */
  211. struct bau_msg_status {
  212. struct bau_local_cpumask seen_by; /* map of cpu's */
  213. };
  214. /* one for every slot in the destination software ack resources */
  215. struct bau_sw_ack_status {
  216. struct bau_payload_queue_entry *msg; /* associated message */
  217. int watcher; /* cpu monitoring, or -1 */
  218. };
  219. /* one on every node and per-cpu; to locate the software tables */
  220. struct bau_control {
  221. struct bau_activation_descriptor *descriptor_base;
  222. struct bau_payload_queue_entry *bau_msg_head;
  223. struct bau_payload_queue_entry *va_queue_first;
  224. struct bau_payload_queue_entry *va_queue_last;
  225. struct bau_msg_status *msg_statuses;
  226. int *watching; /* pointer to array */
  227. };
  228. /*
  229. * This structure is allocated per_cpu for UV TLB shootdown statistics.
  230. */
  231. struct ptc_stats {
  232. unsigned long ptc_i; /* number of IPI-style flushes */
  233. unsigned long requestor; /* number of nodes this cpu sent to */
  234. unsigned long requestee; /* times cpu was remotely requested */
  235. unsigned long alltlb; /* times all tlb's on this cpu were flushed */
  236. unsigned long onetlb; /* times just one tlb on this cpu was flushed */
  237. unsigned long s_retry; /* retries on source side timeouts */
  238. unsigned long d_retry; /* retries on destination side timeouts */
  239. unsigned long sflush_ns;/* nanoseconds spent in uv_flush_tlb_others */
  240. unsigned long dflush_ns;/* nanoseconds spent destination side */
  241. unsigned long retriesok; /* successes on retries */
  242. unsigned long nomsg; /* interrupts with no message */
  243. unsigned long multmsg; /* interrupts with multiple messages */
  244. unsigned long ntargeted;/* nodes targeted */
  245. };
  246. static inline int bau_node_isset(int node, struct bau_target_nodemask *dstp)
  247. {
  248. return constant_test_bit(node, &dstp->bits[0]);
  249. }
  250. static inline void bau_node_set(int node, struct bau_target_nodemask *dstp)
  251. {
  252. __set_bit(node, &dstp->bits[0]);
  253. }
  254. static inline void bau_nodes_clear(struct bau_target_nodemask *dstp, int nbits)
  255. {
  256. bitmap_zero(&dstp->bits[0], nbits);
  257. }
  258. static inline void bau_cpubits_clear(struct bau_local_cpumask *dstp, int nbits)
  259. {
  260. bitmap_zero(&dstp->bits, nbits);
  261. }
  262. /*
  263. * atomic increment of a short integer
  264. * (rather than using the __sync_add_and_fetch() intrinsic)
  265. *
  266. * returns the new value of the variable
  267. */
  268. static inline short int atomic_inc_short(short int *v)
  269. {
  270. asm volatile("movw $1, %%cx\n"
  271. "lock ; xaddw %%cx, %0\n"
  272. : "+m" (*v) /* outputs */
  273. : : "%cx", "memory"); /* inputs : clobbereds */
  274. return *v;
  275. }
  276. /*
  277. * atomic OR of two long integers
  278. * (rather than using the __sync_or_and_fetch() intrinsic)
  279. */
  280. static inline void atomic_or_long(unsigned long *v1, unsigned long v2)
  281. {
  282. asm volatile("movq %0, %%rax; lea %1, %%rdx\n"
  283. "lock ; orq %%rax, %%rdx\n"
  284. : "+m" (*v1) /* outputs */
  285. : "m" (v1), "m" (v2) /* inputs */
  286. : "memory"); /* clobbereds */
  287. }
  288. #define cpubit_isset(cpu, bau_local_cpumask) \
  289. test_bit((cpu), (bau_local_cpumask).bits)
  290. int uv_flush_tlb_others(cpumask_t *, struct mm_struct *, unsigned long);
  291. void uv_bau_message_intr1(void);
  292. void uv_bau_timeout_intr1(void);
  293. #endif /* __ASM_X86_UV_BAU__ */