1 /*
2 * This file is subject to the terms and conditions of the GNU General Public
3 * License. See the file "COPYING" in the main directory of this archive
4 * for more details.
5 *
6 * SGI UV Broadcast Assist Unit definitions
7 *
8 * Copyright (C) 2008-2011 Silicon Graphics, Inc. All rights reserved.
9 */
10
11 #ifndef _ASM_X86_UV_UV_BAU_H
12 #define _ASM_X86_UV_UV_BAU_H
13
14 #include <linux/bitmap.h>
15 #define BITSPERBYTE 8
16
17 /*
18 * Broadcast Assist Unit messaging structures
19 *
20 * Selective Broadcast activations are induced by software action
21 * specifying a particular 8-descriptor "set" via a 6-bit index written
22 * to an MMR.
23 * Thus there are 64 unique 512-byte sets of SB descriptors - one set for
24 * each 6-bit index value. These descriptor sets are mapped in sequence
25 * starting with set 0 located at the address specified in the
26 * BAU_SB_DESCRIPTOR_BASE register, set 1 is located at BASE + 512,
27 * set 2 is at BASE + 2*512, set 3 at BASE + 3*512, and so on.
28 *
29 * We will use one set for sending BAU messages from each of the
30 * cpu's on the uvhub.
31 *
32 * TLB shootdown will use the first of the 8 descriptors of each set.
33 * Each of the descriptors is 64 bytes in size (8*64 = 512 bytes in a set).
34 */
35
36 #define MAX_CPUS_PER_UVHUB 128
37 #define MAX_CPUS_PER_SOCKET 64
38 #define ADP_SZ 64 /* hardware-provided max. */
39 #define UV_CPUS_PER_AS 32 /* hardware-provided max. */
40 #define ITEMS_PER_DESC 8
41 /* the 'throttle' to prevent the hardware stay-busy bug */
42 #define MAX_BAU_CONCURRENT 3
43 #define UV_ACT_STATUS_MASK 0x3
44 #define UV_ACT_STATUS_SIZE 2
45 #define UV_DISTRIBUTION_SIZE 256
46 #define UV_SW_ACK_NPENDING 8
47 #define UV1_NET_ENDPOINT_INTD 0x38
48 #define UV2_NET_ENDPOINT_INTD 0x28
49 #define UV_NET_ENDPOINT_INTD (is_uv1_hub() ? \
50 UV1_NET_ENDPOINT_INTD : UV2_NET_ENDPOINT_INTD)
51 #define UV_DESC_PSHIFT 49
52 #define UV_PAYLOADQ_PNODE_SHIFT 49
53 #define UV_PTC_BASENAME "sgi_uv/ptc_statistics"
54 #define UV_BAU_BASENAME "sgi_uv/bau_tunables"
55 #define UV_BAU_TUNABLES_DIR "sgi_uv"
56 #define UV_BAU_TUNABLES_FILE "bau_tunables"
57 #define WHITESPACE " \t\n"
58 #define uv_mmask ((1UL << uv_hub_info->m_val) - 1)
59 #define uv_physnodeaddr(x) ((__pa((unsigned long)(x)) & uv_mmask))
60 #define cpubit_isset(cpu, bau_local_cpumask) \
61 test_bit((cpu), (bau_local_cpumask).bits)
62
63 /* [19:16] SOFT_ACK timeout period 19: 1 is urgency 7 17:16 1 is multiplier */
64 /*
65 * UV2: Bit 19 selects between
66 * (0): 10 microsecond timebase and
67 * (1): 80 microseconds
68 * we're using 560us, similar to UV1: 65 units of 10us
69 */
70 #define UV1_INTD_SOFT_ACK_TIMEOUT_PERIOD (9UL)
71 #define UV2_INTD_SOFT_ACK_TIMEOUT_PERIOD (15UL)
72
73 #define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD (is_uv1_hub() ? \
74 UV1_INTD_SOFT_ACK_TIMEOUT_PERIOD : \
75 UV2_INTD_SOFT_ACK_TIMEOUT_PERIOD)
76 /* assuming UV3 is the same */
77
78 #define BAU_MISC_CONTROL_MULT_MASK 3
79
80 #define UVH_AGING_PRESCALE_SEL 0x000000b000UL
81 /* [30:28] URGENCY_7 an index into a table of times */
82 #define BAU_URGENCY_7_SHIFT 28
83 #define BAU_URGENCY_7_MASK 7
84
85 #define UVH_TRANSACTION_TIMEOUT 0x000000b200UL
86 /* [45:40] BAU - BAU transaction timeout select - a multiplier */
87 #define BAU_TRANS_SHIFT 40
88 #define BAU_TRANS_MASK 0x3f
89
90 /*
91 * shorten some awkward names
92 */
93 #define AS_PUSH_SHIFT UVH_LB_BAU_SB_ACTIVATION_CONTROL_PUSH_SHFT
94 #define SOFTACK_MSHIFT UVH_LB_BAU_MISC_CONTROL_ENABLE_INTD_SOFT_ACK_MODE_SHFT
95 #define SOFTACK_PSHIFT UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHFT
96 #define SOFTACK_TIMEOUT_PERIOD UV_INTD_SOFT_ACK_TIMEOUT_PERIOD
97 #define PREFETCH_HINT_SHFT UV3H_LB_BAU_MISC_CONTROL_ENABLE_INTD_PREFETCH_HINT_SHFT
98 #define SB_STATUS_SHFT UV3H_LB_BAU_MISC_CONTROL_ENABLE_EXTENDED_SB_STATUS_SHFT
99 #define write_gmmr uv_write_global_mmr64
100 #define write_lmmr uv_write_local_mmr
101 #define read_lmmr uv_read_local_mmr
102 #define read_gmmr uv_read_global_mmr64
103
104 /*
105 * bits in UVH_LB_BAU_SB_ACTIVATION_STATUS_0/1
106 */
107 #define DS_IDLE 0
108 #define DS_ACTIVE 1
109 #define DS_DESTINATION_TIMEOUT 2
110 #define DS_SOURCE_TIMEOUT 3
111 /*
112 * bits put together from HRP_LB_BAU_SB_ACTIVATION_STATUS_0/1/2
113 * values 1 and 3 will not occur
114 * Decoded meaning ERROR BUSY AUX ERR
115 * ------------------------------- ---- ----- -------
116 * IDLE 0 0 0
117 * BUSY (active) 0 1 0
118 * SW Ack Timeout (destination) 1 0 0
119 * SW Ack INTD rejected (strong NACK) 1 0 1
120 * Source Side Time Out Detected 1 1 0
121 * Destination Side PUT Failed 1 1 1
122 */
123 #define UV2H_DESC_IDLE 0
124 #define UV2H_DESC_BUSY 2
125 #define UV2H_DESC_DEST_TIMEOUT 4
126 #define UV2H_DESC_DEST_STRONG_NACK 5
127 #define UV2H_DESC_SOURCE_TIMEOUT 6
128 #define UV2H_DESC_DEST_PUT_ERR 7
129
130 /*
131 * delay for 'plugged' timeout retries, in microseconds
132 */
133 #define PLUGGED_DELAY 10
134
135 /*
136 * threshholds at which to use IPI to free resources
137 */
138 /* after this # consecutive 'plugged' timeouts, use IPI to release resources */
139 #define PLUGSB4RESET 100
140 /* after this many consecutive timeouts, use IPI to release resources */
141 #define TIMEOUTSB4RESET 1
142 /* at this number uses of IPI to release resources, giveup the request */
143 #define IPI_RESET_LIMIT 1
144 /* after this # consecutive successes, bump up the throttle if it was lowered */
145 #define COMPLETE_THRESHOLD 5
146 /* after this # of giveups (fall back to kernel IPI's) disable the use of
147 the BAU for a period of time */
148 #define GIVEUP_LIMIT 100
149
150 #define UV_LB_SUBNODEID 0x10
151
152 /* these two are the same for UV1 and UV2: */
153 #define UV_SA_SHFT UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHFT
154 #define UV_SA_MASK UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_MASK
155 /* 4 bits of software ack period */
156 #define UV2_ACK_MASK 0x7UL
157 #define UV2_ACK_UNITS_SHFT 3
158 #define UV2_EXT_SHFT UV2H_LB_BAU_MISC_CONTROL_ENABLE_EXTENDED_SB_STATUS_SHFT
159
160 /*
161 * number of entries in the destination side payload queue
162 */
163 #define DEST_Q_SIZE 20
164 /*
165 * number of destination side software ack resources
166 */
167 #define DEST_NUM_RESOURCES 8
168 /*
169 * completion statuses for sending a TLB flush message
170 */
171 #define FLUSH_RETRY_PLUGGED 1
172 #define FLUSH_RETRY_TIMEOUT 2
173 #define FLUSH_GIVEUP 3
174 #define FLUSH_COMPLETE 4
175
176 /*
177 * tuning the action when the numalink network is extremely delayed
178 */
179 #define CONGESTED_RESPONSE_US 1000 /* 'long' response time, in
180 microseconds */
181 #define CONGESTED_REPS 10 /* long delays averaged over
182 this many broadcasts */
183 #define DISABLED_PERIOD 10 /* time for the bau to be
184 disabled, in seconds */
185 /* see msg_type: */
186 #define MSG_NOOP 0
187 #define MSG_REGULAR 1
188 #define MSG_RETRY 2
189
190 /*
191 * Distribution: 32 bytes (256 bits) (bytes 0-0x1f of descriptor)
192 * If the 'multilevel' flag in the header portion of the descriptor
193 * has been set to 0, then endpoint multi-unicast mode is selected.
194 * The distribution specification (32 bytes) is interpreted as a 256-bit
195 * distribution vector. Adjacent bits correspond to consecutive even numbered
196 * nodeIDs. The result of adding the index of a given bit to the 15-bit
197 * 'base_dest_nasid' field of the header corresponds to the
198 * destination nodeID associated with that specified bit.
199 */
200 struct pnmask {
201 unsigned long bits[BITS_TO_LONGS(UV_DISTRIBUTION_SIZE)];
202 };
203
204 /*
205 * mask of cpu's on a uvhub
206 * (during initialization we need to check that unsigned long has
207 * enough bits for max. cpu's per uvhub)
208 */
209 struct bau_local_cpumask {
210 unsigned long bits;
211 };
212
213 /*
214 * Payload: 16 bytes (128 bits) (bytes 0x20-0x2f of descriptor)
215 * only 12 bytes (96 bits) of the payload area are usable.
216 * An additional 3 bytes (bits 27:4) of the header address are carried
217 * to the next bytes of the destination payload queue.
218 * And an additional 2 bytes of the header Suppl_A field are also
219 * carried to the destination payload queue.
220 * But the first byte of the Suppl_A becomes bits 127:120 (the 16th byte)
221 * of the destination payload queue, which is written by the hardware
222 * with the s/w ack resource bit vector.
223 * [ effective message contents (16 bytes (128 bits) maximum), not counting
224 * the s/w ack bit vector ]
225 */
226
227 /*
228 * The payload is software-defined for INTD transactions
229 */
230 struct bau_msg_payload {
231 unsigned long address; /* signifies a page or all
232 TLB's of the cpu */
233 /* 64 bits */
234 unsigned short sending_cpu; /* filled in by sender */
235 /* 16 bits */
236 unsigned short acknowledge_count; /* filled in by destination */
237 /* 16 bits */
238 unsigned int reserved1:32; /* not usable */
239 };
240
241
242 /*
243 * UV1 Message header: 16 bytes (128 bits) (bytes 0x30-0x3f of descriptor)
244 * see table 4.2.3.0.1 in broacast_assist spec.
245 */
246 struct uv1_bau_msg_header {
247 unsigned int dest_subnodeid:6; /* must be 0x10, for the LB */
248 /* bits 5:0 */
249 unsigned int base_dest_nasid:15; /* nasid of the first bit */
250 /* bits 20:6 */ /* in uvhub map */
251 unsigned int command:8; /* message type */
252 /* bits 28:21 */
253 /* 0x38: SN3net EndPoint Message */
254 unsigned int rsvd_1:3; /* must be zero */
255 /* bits 31:29 */
256 /* int will align on 32 bits */
257 unsigned int rsvd_2:9; /* must be zero */
258 /* bits 40:32 */
259 /* Suppl_A is 56-41 */
260 unsigned int sequence:16; /* message sequence number */
261 /* bits 56:41 */ /* becomes bytes 16-17 of msg */
262 /* Address field (96:57) is
263 never used as an address
264 (these are address bits
265 42:3) */
266
267 unsigned int rsvd_3:1; /* must be zero */
268 /* bit 57 */
269 /* address bits 27:4 are payload */
270 /* these next 24 (58-81) bits become bytes 12-14 of msg */
271 /* bits 65:58 land in byte 12 */
272 unsigned int replied_to:1; /* sent as 0 by the source to
273 byte 12 */
274 /* bit 58 */
275 unsigned int msg_type:3; /* software type of the
276 message */
277 /* bits 61:59 */
278 unsigned int canceled:1; /* message canceled, resource
279 is to be freed*/
280 /* bit 62 */
281 unsigned int payload_1a:1; /* not currently used */
282 /* bit 63 */
283 unsigned int payload_1b:2; /* not currently used */
284 /* bits 65:64 */
285
286 /* bits 73:66 land in byte 13 */
287 unsigned int payload_1ca:6; /* not currently used */
288 /* bits 71:66 */
289 unsigned int payload_1c:2; /* not currently used */
290 /* bits 73:72 */
291
292 /* bits 81:74 land in byte 14 */
293 unsigned int payload_1d:6; /* not currently used */
294 /* bits 79:74 */
295 unsigned int payload_1e:2; /* not currently used */
296 /* bits 81:80 */
297
298 unsigned int rsvd_4:7; /* must be zero */
299 /* bits 88:82 */
300 unsigned int swack_flag:1; /* software acknowledge flag */
301 /* bit 89 */
302 /* INTD trasactions at
303 destination are to wait for
304 software acknowledge */
305 unsigned int rsvd_5:6; /* must be zero */
306 /* bits 95:90 */
307 unsigned int rsvd_6:5; /* must be zero */
308 /* bits 100:96 */
309 unsigned int int_both:1; /* if 1, interrupt both sockets
310 on the uvhub */
311 /* bit 101*/
312 unsigned int fairness:3; /* usually zero */
313 /* bits 104:102 */
314 unsigned int multilevel:1; /* multi-level multicast
315 format */
316 /* bit 105 */
317 /* 0 for TLB: endpoint multi-unicast messages */
318 unsigned int chaining:1; /* next descriptor is part of
319 this activation*/
320 /* bit 106 */
321 unsigned int rsvd_7:21; /* must be zero */
322 /* bits 127:107 */
323 };
324
325 /*
326 * UV2 Message header: 16 bytes (128 bits) (bytes 0x30-0x3f of descriptor)
327 * see figure 9-2 of harp_sys.pdf
328 * assuming UV3 is the same
329 */
330 struct uv2_3_bau_msg_header {
331 unsigned int base_dest_nasid:15; /* nasid of the first bit */
332 /* bits 14:0 */ /* in uvhub map */
333 unsigned int dest_subnodeid:5; /* must be 0x10, for the LB */
334 /* bits 19:15 */
335 unsigned int rsvd_1:1; /* must be zero */
336 /* bit 20 */
337 /* Address bits 59:21 */
338 /* bits 25:2 of address (44:21) are payload */
339 /* these next 24 bits become bytes 12-14 of msg */
340 /* bits 28:21 land in byte 12 */
341 unsigned int replied_to:1; /* sent as 0 by the source to
342 byte 12 */
343 /* bit 21 */
344 unsigned int msg_type:3; /* software type of the
345 message */
346 /* bits 24:22 */
347 unsigned int canceled:1; /* message canceled, resource
348 is to be freed*/
349 /* bit 25 */
350 unsigned int payload_1:3; /* not currently used */
351 /* bits 28:26 */
352
353 /* bits 36:29 land in byte 13 */
354 unsigned int payload_2a:3; /* not currently used */
355 unsigned int payload_2b:5; /* not currently used */
356 /* bits 36:29 */
357
358 /* bits 44:37 land in byte 14 */
359 unsigned int payload_3:8; /* not currently used */
360 /* bits 44:37 */
361
362 unsigned int rsvd_2:7; /* reserved */
363 /* bits 51:45 */
364 unsigned int swack_flag:1; /* software acknowledge flag */
365 /* bit 52 */
366 unsigned int rsvd_3a:3; /* must be zero */
367 unsigned int rsvd_3b:8; /* must be zero */
368 unsigned int rsvd_3c:8; /* must be zero */
369 unsigned int rsvd_3d:3; /* must be zero */
370 /* bits 74:53 */
371 unsigned int fairness:3; /* usually zero */
372 /* bits 77:75 */
373
374 unsigned int sequence:16; /* message sequence number */
375 /* bits 93:78 Suppl_A */
376 unsigned int chaining:1; /* next descriptor is part of
377 this activation*/
378 /* bit 94 */
379 unsigned int multilevel:1; /* multi-level multicast
380 format */
381 /* bit 95 */
382 unsigned int rsvd_4:24; /* ordered / source node /
383 source subnode / aging
384 must be zero */
385 /* bits 119:96 */
386 unsigned int command:8; /* message type */
387 /* bits 127:120 */
388 };
389
390 /*
391 * The activation descriptor:
392 * The format of the message to send, plus all accompanying control
393 * Should be 64 bytes
394 */
395 struct bau_desc {
396 struct pnmask distribution;
397 /*
398 * message template, consisting of header and payload:
399 */
400 union bau_msg_header {
401 struct uv1_bau_msg_header uv1_hdr;
402 struct uv2_3_bau_msg_header uv2_3_hdr;
403 } header;
404
405 struct bau_msg_payload payload;
406 };
407 /* UV1:
408 * -payload-- ---------header------
409 * bytes 0-11 bits 41-56 bits 58-81
410 * A B (2) C (3)
411 *
412 * A/B/C are moved to:
413 * A C B
414 * bytes 0-11 bytes 12-14 bytes 16-17 (byte 15 filled in by hw as vector)
415 * ------------payload queue-----------
416 */
417 /* UV2:
418 * -payload-- ---------header------
419 * bytes 0-11 bits 70-78 bits 21-44
420 * A B (2) C (3)
421 *
422 * A/B/C are moved to:
423 * A C B
424 * bytes 0-11 bytes 12-14 bytes 16-17 (byte 15 filled in by hw as vector)
425 * ------------payload queue-----------
426 */
427
428 /*
429 * The payload queue on the destination side is an array of these.
430 * With BAU_MISC_CONTROL set for software acknowledge mode, the messages
431 * are 32 bytes (2 micropackets) (256 bits) in length, but contain only 17
432 * bytes of usable data, including the sw ack vector in byte 15 (bits 127:120)
433 * (12 bytes come from bau_msg_payload, 3 from payload_1, 2 from
434 * swack_vec and payload_2)
435 * "Enabling Software Acknowledgment mode (see Section 4.3.3 Software
436 * Acknowledge Processing) also selects 32 byte (17 bytes usable) payload
437 * operation."
438 */
439 struct bau_pq_entry {
440 unsigned long address; /* signifies a page or all TLB's
441 of the cpu */
442 /* 64 bits, bytes 0-7 */
443 unsigned short sending_cpu; /* cpu that sent the message */
444 /* 16 bits, bytes 8-9 */
445 unsigned short acknowledge_count; /* filled in by destination */
446 /* 16 bits, bytes 10-11 */
447 /* these next 3 bytes come from bits 58-81 of the message header */
448 unsigned short replied_to:1; /* sent as 0 by the source */
449 unsigned short msg_type:3; /* software message type */
450 unsigned short canceled:1; /* sent as 0 by the source */
451 unsigned short unused1:3; /* not currently using */
452 /* byte 12 */
453 unsigned char unused2a; /* not currently using */
454 /* byte 13 */
455 unsigned char unused2; /* not currently using */
456 /* byte 14 */
457 unsigned char swack_vec; /* filled in by the hardware */
458 /* byte 15 (bits 127:120) */
459 unsigned short sequence; /* message sequence number */
460 /* bytes 16-17 */
461 unsigned char unused4[2]; /* not currently using bytes 18-19 */
462 /* bytes 18-19 */
463 int number_of_cpus; /* filled in at destination */
464 /* 32 bits, bytes 20-23 (aligned) */
465 unsigned char unused5[8]; /* not using */
466 /* bytes 24-31 */
467 };
468
469 struct msg_desc {
470 struct bau_pq_entry *msg;
471 int msg_slot;
472 struct bau_pq_entry *queue_first;
473 struct bau_pq_entry *queue_last;
474 };
475
476 struct reset_args {
477 int sender;
478 };
479
480 /*
481 * This structure is allocated per_cpu for UV TLB shootdown statistics.
482 */
483 struct ptc_stats {
484 /* sender statistics */
485 unsigned long s_giveup; /* number of fall backs to
486 IPI-style flushes */
487 unsigned long s_requestor; /* number of shootdown
488 requests */
489 unsigned long s_stimeout; /* source side timeouts */
490 unsigned long s_dtimeout; /* destination side timeouts */
491 unsigned long s_strongnacks; /* number of strong nack's */
492 unsigned long s_time; /* time spent in sending side */
493 unsigned long s_retriesok; /* successful retries */
494 unsigned long s_ntargcpu; /* total number of cpu's
495 targeted */
496 unsigned long s_ntargself; /* times the sending cpu was
497 targeted */
498 unsigned long s_ntarglocals; /* targets of cpus on the local
499 blade */
500 unsigned long s_ntargremotes; /* targets of cpus on remote
501 blades */
502 unsigned long s_ntarglocaluvhub; /* targets of the local hub */
503 unsigned long s_ntargremoteuvhub; /* remotes hubs targeted */
504 unsigned long s_ntarguvhub; /* total number of uvhubs
505 targeted */
506 unsigned long s_ntarguvhub16; /* number of times target
507 hubs >= 16*/
508 unsigned long s_ntarguvhub8; /* number of times target
509 hubs >= 8 */
510 unsigned long s_ntarguvhub4; /* number of times target
511 hubs >= 4 */
512 unsigned long s_ntarguvhub2; /* number of times target
513 hubs >= 2 */
514 unsigned long s_ntarguvhub1; /* number of times target
515 hubs == 1 */
516 unsigned long s_resets_plug; /* ipi-style resets from plug
517 state */
518 unsigned long s_resets_timeout; /* ipi-style resets from
519 timeouts */
520 unsigned long s_busy; /* status stayed busy past
521 s/w timer */
522 unsigned long s_throttles; /* waits in throttle */
523 unsigned long s_retry_messages; /* retry broadcasts */
524 unsigned long s_bau_reenabled; /* for bau enable/disable */
525 unsigned long s_bau_disabled; /* for bau enable/disable */
526 unsigned long s_uv2_wars; /* uv2 workaround, perm. busy */
527 unsigned long s_uv2_wars_hw; /* uv2 workaround, hiwater */
528 unsigned long s_uv2_war_waits; /* uv2 workaround, long waits */
529 unsigned long s_overipilimit; /* over the ipi reset limit */
530 unsigned long s_giveuplimit; /* disables, over giveup limit*/
531 unsigned long s_enters; /* entries to the driver */
532 unsigned long s_ipifordisabled; /* fall back to IPI; disabled */
533 unsigned long s_plugged; /* plugged by h/w bug*/
534 unsigned long s_congested; /* giveup on long wait */
535 /* destination statistics */
536 unsigned long d_alltlb; /* times all tlb's on this
537 cpu were flushed */
538 unsigned long d_onetlb; /* times just one tlb on this
539 cpu was flushed */
540 unsigned long d_multmsg; /* interrupts with multiple
541 messages */
542 unsigned long d_nomsg; /* interrupts with no message */
543 unsigned long d_time; /* time spent on destination
544 side */
545 unsigned long d_requestee; /* number of messages
546 processed */
547 unsigned long d_retries; /* number of retry messages
548 processed */
549 unsigned long d_canceled; /* number of messages canceled
550 by retries */
551 unsigned long d_nocanceled; /* retries that found nothing
552 to cancel */
553 unsigned long d_resets; /* number of ipi-style requests
554 processed */
555 unsigned long d_rcanceled; /* number of messages canceled
556 by resets */
557 };
558
559 struct tunables {
560 int *tunp;
561 int deflt;
562 };
563
564 struct hub_and_pnode {
565 short uvhub;
566 short pnode;
567 };
568
569 struct socket_desc {
570 short num_cpus;
571 short cpu_number[MAX_CPUS_PER_SOCKET];
572 };
573
574 struct uvhub_desc {
575 unsigned short socket_mask;
576 short num_cpus;
577 short uvhub;
578 short pnode;
579 struct socket_desc socket[2];
580 };
581
582 /*
583 * one per-cpu; to locate the software tables
584 */
585 struct bau_control {
586 struct bau_desc *descriptor_base;
587 struct bau_pq_entry *queue_first;
588 struct bau_pq_entry *queue_last;
589 struct bau_pq_entry *bau_msg_head;
590 struct bau_control *uvhub_master;
591 struct bau_control *socket_master;
592 struct ptc_stats *statp;
593 cpumask_t *cpumask;
594 unsigned long timeout_interval;
595 unsigned long set_bau_on_time;
596 atomic_t active_descriptor_count;
597 int plugged_tries;
598 int timeout_tries;
599 int ipi_attempts;
600 int conseccompletes;
601 short nobau;
602 short baudisabled;
603 short cpu;
604 short osnode;
605 short uvhub_cpu;
606 short uvhub;
607 short uvhub_version;
608 short cpus_in_socket;
609 short cpus_in_uvhub;
610 short partition_base_pnode;
611 short busy; /* all were busy (war) */
612 unsigned short message_number;
613 unsigned short uvhub_quiesce;
614 short socket_acknowledge_count[DEST_Q_SIZE];
615 cycles_t send_message;
616 cycles_t period_end;
617 cycles_t period_time;
618 spinlock_t uvhub_lock;
619 spinlock_t queue_lock;
620 spinlock_t disable_lock;
621 /* tunables */
622 int max_concurr;
623 int max_concurr_const;
624 int plugged_delay;
625 int plugsb4reset;
626 int timeoutsb4reset;
627 int ipi_reset_limit;
628 int complete_threshold;
629 int cong_response_us;
630 int cong_reps;
631 cycles_t disabled_period;
632 int period_giveups;
633 int giveup_limit;
634 long period_requests;
635 struct hub_and_pnode *thp;
636 };
637
write_mmr_data_broadcast(int pnode,unsigned long mmr_image)638 static inline void write_mmr_data_broadcast(int pnode, unsigned long mmr_image)
639 {
640 write_gmmr(pnode, UVH_BAU_DATA_BROADCAST, mmr_image);
641 }
642
write_mmr_descriptor_base(int pnode,unsigned long mmr_image)643 static inline void write_mmr_descriptor_base(int pnode, unsigned long mmr_image)
644 {
645 write_gmmr(pnode, UVH_LB_BAU_SB_DESCRIPTOR_BASE, mmr_image);
646 }
647
write_mmr_activation(unsigned long index)648 static inline void write_mmr_activation(unsigned long index)
649 {
650 write_lmmr(UVH_LB_BAU_SB_ACTIVATION_CONTROL, index);
651 }
652
write_gmmr_activation(int pnode,unsigned long mmr_image)653 static inline void write_gmmr_activation(int pnode, unsigned long mmr_image)
654 {
655 write_gmmr(pnode, UVH_LB_BAU_SB_ACTIVATION_CONTROL, mmr_image);
656 }
657
write_mmr_payload_first(int pnode,unsigned long mmr_image)658 static inline void write_mmr_payload_first(int pnode, unsigned long mmr_image)
659 {
660 write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_FIRST, mmr_image);
661 }
662
write_mmr_payload_tail(int pnode,unsigned long mmr_image)663 static inline void write_mmr_payload_tail(int pnode, unsigned long mmr_image)
664 {
665 write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_TAIL, mmr_image);
666 }
667
write_mmr_payload_last(int pnode,unsigned long mmr_image)668 static inline void write_mmr_payload_last(int pnode, unsigned long mmr_image)
669 {
670 write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_LAST, mmr_image);
671 }
672
write_mmr_misc_control(int pnode,unsigned long mmr_image)673 static inline void write_mmr_misc_control(int pnode, unsigned long mmr_image)
674 {
675 write_gmmr(pnode, UVH_LB_BAU_MISC_CONTROL, mmr_image);
676 }
677
read_mmr_misc_control(int pnode)678 static inline unsigned long read_mmr_misc_control(int pnode)
679 {
680 return read_gmmr(pnode, UVH_LB_BAU_MISC_CONTROL);
681 }
682
write_mmr_sw_ack(unsigned long mr)683 static inline void write_mmr_sw_ack(unsigned long mr)
684 {
685 uv_write_local_mmr(UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE_ALIAS, mr);
686 }
687
write_gmmr_sw_ack(int pnode,unsigned long mr)688 static inline void write_gmmr_sw_ack(int pnode, unsigned long mr)
689 {
690 write_gmmr(pnode, UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE_ALIAS, mr);
691 }
692
read_mmr_sw_ack(void)693 static inline unsigned long read_mmr_sw_ack(void)
694 {
695 return read_lmmr(UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE);
696 }
697
read_gmmr_sw_ack(int pnode)698 static inline unsigned long read_gmmr_sw_ack(int pnode)
699 {
700 return read_gmmr(pnode, UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE);
701 }
702
write_mmr_data_config(int pnode,unsigned long mr)703 static inline void write_mmr_data_config(int pnode, unsigned long mr)
704 {
705 uv_write_global_mmr64(pnode, UVH_BAU_DATA_CONFIG, mr);
706 }
707
bau_uvhub_isset(int uvhub,struct pnmask * dstp)708 static inline int bau_uvhub_isset(int uvhub, struct pnmask *dstp)
709 {
710 return constant_test_bit(uvhub, &dstp->bits[0]);
711 }
bau_uvhub_set(int pnode,struct pnmask * dstp)712 static inline void bau_uvhub_set(int pnode, struct pnmask *dstp)
713 {
714 __set_bit(pnode, &dstp->bits[0]);
715 }
bau_uvhubs_clear(struct pnmask * dstp,int nbits)716 static inline void bau_uvhubs_clear(struct pnmask *dstp,
717 int nbits)
718 {
719 bitmap_zero(&dstp->bits[0], nbits);
720 }
bau_uvhub_weight(struct pnmask * dstp)721 static inline int bau_uvhub_weight(struct pnmask *dstp)
722 {
723 return bitmap_weight((unsigned long *)&dstp->bits[0],
724 UV_DISTRIBUTION_SIZE);
725 }
726
bau_cpubits_clear(struct bau_local_cpumask * dstp,int nbits)727 static inline void bau_cpubits_clear(struct bau_local_cpumask *dstp, int nbits)
728 {
729 bitmap_zero(&dstp->bits, nbits);
730 }
731
732 extern void uv_bau_message_intr1(void);
733 #ifdef CONFIG_TRACING
734 #define trace_uv_bau_message_intr1 uv_bau_message_intr1
735 #endif
736 extern void uv_bau_timeout_intr1(void);
737
738 struct atomic_short {
739 short counter;
740 };
741
742 /*
743 * atomic_read_short - read a short atomic variable
744 * @v: pointer of type atomic_short
745 *
746 * Atomically reads the value of @v.
747 */
atomic_read_short(const struct atomic_short * v)748 static inline int atomic_read_short(const struct atomic_short *v)
749 {
750 return v->counter;
751 }
752
753 /*
754 * atom_asr - add and return a short int
755 * @i: short value to add
756 * @v: pointer of type atomic_short
757 *
758 * Atomically adds @i to @v and returns @i + @v
759 */
atom_asr(short i,struct atomic_short * v)760 static inline int atom_asr(short i, struct atomic_short *v)
761 {
762 short __i = i;
763 asm volatile(LOCK_PREFIX "xaddw %0, %1"
764 : "+r" (i), "+m" (v->counter)
765 : : "memory");
766 return i + __i;
767 }
768
769 /*
770 * conditionally add 1 to *v, unless *v is >= u
771 * return 0 if we cannot add 1 to *v because it is >= u
772 * return 1 if we can add 1 to *v because it is < u
773 * the add is atomic
774 *
775 * This is close to atomic_add_unless(), but this allows the 'u' value
776 * to be lowered below the current 'v'. atomic_add_unless can only stop
777 * on equal.
778 */
atomic_inc_unless_ge(spinlock_t * lock,atomic_t * v,int u)779 static inline int atomic_inc_unless_ge(spinlock_t *lock, atomic_t *v, int u)
780 {
781 spin_lock(lock);
782 if (atomic_read(v) >= u) {
783 spin_unlock(lock);
784 return 0;
785 }
786 atomic_inc(v);
787 spin_unlock(lock);
788 return 1;
789 }
790
791 #endif /* _ASM_X86_UV_UV_BAU_H */
792