]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - arch/x86/include/asm/uv/uv_bau.h
Merge git://git.kernel.org/pub/scm/linux/kernel/git/davem/net-next
[mirror_ubuntu-artful-kernel.git] / arch / x86 / include / asm / uv / uv_bau.h
CommitLineData
1812924b
CW
1/*
2 * This file is subject to the terms and conditions of the GNU General Public
3 * License. See the file "COPYING" in the main directory of this archive
4 * for more details.
5 *
6 * SGI UV Broadcast Assist Unit definitions
7 *
f073cc8f 8 * Copyright (C) 2008-2011 Silicon Graphics, Inc. All rights reserved.
1812924b
CW
9 */
10
05e4d316
PA
11#ifndef _ASM_X86_UV_UV_BAU_H
12#define _ASM_X86_UV_UV_BAU_H
1812924b
CW
13
14#include <linux/bitmap.h>
15#define BITSPERBYTE 8
16
1812924b 17/*
b194b120
CW
18 * Broadcast Assist Unit messaging structures
19 *
1812924b
CW
20 * Selective Broadcast activations are induced by software action
21 * specifying a particular 8-descriptor "set" via a 6-bit index written
22 * to an MMR.
23 * Thus there are 64 unique 512-byte sets of SB descriptors - one set for
24 * each 6-bit index value. These descriptor sets are mapped in sequence
25 * starting with set 0 located at the address specified in the
26 * BAU_SB_DESCRIPTOR_BASE register, set 1 is located at BASE + 512,
27 * set 2 is at BASE + 2*512, set 3 at BASE + 3*512, and so on.
28 *
cfa60917 29 * We will use one set for sending BAU messages from each of the
b8f7fb13 30 * cpu's on the uvhub.
1812924b
CW
31 *
32 * TLB shootdown will use the first of the 8 descriptors of each set.
33 * Each of the descriptors is 64 bytes in size (8*64 = 512 bytes in a set).
34 */
35
3ab0c49f
JC
36#define MAX_CPUS_PER_UVHUB 128
37#define MAX_CPUS_PER_SOCKET 64
f073cc8f
CW
38#define ADP_SZ 64 /* hardware-provided max. */
39#define UV_CPUS_PER_AS 32 /* hardware-provided max. */
40#define ITEMS_PER_DESC 8
50fb55ac 41/* the 'throttle' to prevent the hardware stay-busy bug */
b8f7fb13 42#define MAX_BAU_CONCURRENT 3
b194b120
CW
43#define UV_ACT_STATUS_MASK 0x3
44#define UV_ACT_STATUS_SIZE 2
b194b120
CW
45#define UV_DISTRIBUTION_SIZE 256
46#define UV_SW_ACK_NPENDING 8
2a919596
JS
47#define UV1_NET_ENDPOINT_INTD 0x38
48#define UV2_NET_ENDPOINT_INTD 0x28
49#define UV_NET_ENDPOINT_INTD (is_uv1_hub() ? \
50 UV1_NET_ENDPOINT_INTD : UV2_NET_ENDPOINT_INTD)
f073cc8f 51#define UV_DESC_PSHIFT 49
b194b120
CW
52#define UV_PAYLOADQ_PNODE_SHIFT 49
53#define UV_PTC_BASENAME "sgi_uv/ptc_statistics"
e8e5e8a8
CW
54#define UV_BAU_BASENAME "sgi_uv/bau_tunables"
55#define UV_BAU_TUNABLES_DIR "sgi_uv"
56#define UV_BAU_TUNABLES_FILE "bau_tunables"
57#define WHITESPACE " \t\n"
6a469e46 58#define uv_mmask ((1UL << uv_hub_info->m_val) - 1)
b194b120 59#define uv_physnodeaddr(x) ((__pa((unsigned long)(x)) & uv_mmask))
f073cc8f
CW
60#define cpubit_isset(cpu, bau_local_cpumask) \
61 test_bit((cpu), (bau_local_cpumask).bits)
2a919596 62
12a6611f 63/* [19:16] SOFT_ACK timeout period 19: 1 is urgency 7 17:16 1 is multiplier */
2a919596
JS
64/*
65 * UV2: Bit 19 selects between
66 * (0): 10 microsecond timebase and
67 * (1): 80 microseconds
da87c937 68 * we're using 560us, similar to UV1: 65 units of 10us
2a919596
JS
69 */
70#define UV1_INTD_SOFT_ACK_TIMEOUT_PERIOD (9UL)
ae90c232 71#define UV2_INTD_SOFT_ACK_TIMEOUT_PERIOD (15UL)
2a919596
JS
72
73#define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD (is_uv1_hub() ? \
74 UV1_INTD_SOFT_ACK_TIMEOUT_PERIOD : \
75 UV2_INTD_SOFT_ACK_TIMEOUT_PERIOD)
a26fd719 76/* assuming UV3 is the same */
2a919596 77
f073cc8f 78#define BAU_MISC_CONTROL_MULT_MASK 3
12a6611f 79
f073cc8f 80#define UVH_AGING_PRESCALE_SEL 0x000000b000UL
12a6611f 81/* [30:28] URGENCY_7 an index into a table of times */
f073cc8f
CW
82#define BAU_URGENCY_7_SHIFT 28
83#define BAU_URGENCY_7_MASK 7
12a6611f 84
f073cc8f 85#define UVH_TRANSACTION_TIMEOUT 0x000000b200UL
12a6611f 86/* [45:40] BAU - BAU transaction timeout select - a multiplier */
f073cc8f
CW
87#define BAU_TRANS_SHIFT 40
88#define BAU_TRANS_MASK 0x3f
89
90/*
91 * shorten some awkward names
92 */
93#define AS_PUSH_SHIFT UVH_LB_BAU_SB_ACTIVATION_CONTROL_PUSH_SHFT
94#define SOFTACK_MSHIFT UVH_LB_BAU_MISC_CONTROL_ENABLE_INTD_SOFT_ACK_MODE_SHFT
95#define SOFTACK_PSHIFT UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHFT
96#define SOFTACK_TIMEOUT_PERIOD UV_INTD_SOFT_ACK_TIMEOUT_PERIOD
a26fd719
CW
97#define PREFETCH_HINT_SHFT UV3H_LB_BAU_MISC_CONTROL_ENABLE_INTD_PREFETCH_HINT_SHFT
98#define SB_STATUS_SHFT UV3H_LB_BAU_MISC_CONTROL_ENABLE_EXTENDED_SB_STATUS_SHFT
f073cc8f
CW
99#define write_gmmr uv_write_global_mmr64
100#define write_lmmr uv_write_local_mmr
101#define read_lmmr uv_read_local_mmr
102#define read_gmmr uv_read_global_mmr64
b194b120
CW
103
104/*
105 * bits in UVH_LB_BAU_SB_ACTIVATION_STATUS_0/1
106 */
f073cc8f
CW
107#define DS_IDLE 0
108#define DS_ACTIVE 1
109#define DS_DESTINATION_TIMEOUT 2
110#define DS_SOURCE_TIMEOUT 3
2a919596
JS
111/*
112 * bits put together from HRP_LB_BAU_SB_ACTIVATION_STATUS_0/1/2
ae90c232 113 * values 1 and 3 will not occur
114 * Decoded meaning ERROR BUSY AUX ERR
115 * ------------------------------- ---- ----- -------
116 * IDLE 0 0 0
117 * BUSY (active) 0 1 0
118 * SW Ack Timeout (destination) 1 0 0
119 * SW Ack INTD rejected (strong NACK) 1 0 1
120 * Source Side Time Out Detected 1 1 0
121 * Destination Side PUT Failed 1 1 1
2a919596
JS
122 */
123#define UV2H_DESC_IDLE 0
ae90c232 124#define UV2H_DESC_BUSY 2
125#define UV2H_DESC_DEST_TIMEOUT 4
126#define UV2H_DESC_DEST_STRONG_NACK 5
2a919596
JS
127#define UV2H_DESC_SOURCE_TIMEOUT 6
128#define UV2H_DESC_DEST_PUT_ERR 7
1812924b 129
b194b120 130/*
e8e5e8a8 131 * delay for 'plugged' timeout retries, in microseconds
b8f7fb13 132 */
e8e5e8a8 133#define PLUGGED_DELAY 10
b8f7fb13
CW
134
135/*
136 * threshholds at which to use IPI to free resources
137 */
e8e5e8a8 138/* after this # consecutive 'plugged' timeouts, use IPI to release resources */
f073cc8f 139#define PLUGSB4RESET 100
e8e5e8a8 140/* after this many consecutive timeouts, use IPI to release resources */
f073cc8f 141#define TIMEOUTSB4RESET 1
e8e5e8a8 142/* at this number uses of IPI to release resources, giveup the request */
f073cc8f 143#define IPI_RESET_LIMIT 1
e8e5e8a8 144/* after this # consecutive successes, bump up the throttle if it was lowered */
f073cc8f 145#define COMPLETE_THRESHOLD 5
8b6e511e
CW
146/* after this # of giveups (fall back to kernel IPI's) disable the use of
147 the BAU for a period of time */
148#define GIVEUP_LIMIT 100
b8f7fb13 149
f073cc8f 150#define UV_LB_SUBNODEID 0x10
77ed23f8 151
2a919596
JS
152/* these two are the same for UV1 and UV2: */
153#define UV_SA_SHFT UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHFT
154#define UV_SA_MASK UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_MASK
155/* 4 bits of software ack period */
f073cc8f
CW
156#define UV2_ACK_MASK 0x7UL
157#define UV2_ACK_UNITS_SHFT 3
2a919596
JS
158#define UV2_EXT_SHFT UV2H_LB_BAU_MISC_CONTROL_ENABLE_EXTENDED_SB_STATUS_SHFT
159
b194b120
CW
160/*
161 * number of entries in the destination side payload queue
162 */
b8f7fb13 163#define DEST_Q_SIZE 20
b194b120
CW
164/*
165 * number of destination side software ack resources
166 */
dc163a41 167#define DEST_NUM_RESOURCES 8
b194b120
CW
168/*
169 * completion statuses for sending a TLB flush message
170 */
b8f7fb13
CW
171#define FLUSH_RETRY_PLUGGED 1
172#define FLUSH_RETRY_TIMEOUT 2
173#define FLUSH_GIVEUP 3
174#define FLUSH_COMPLETE 4
1812924b 175
e8e5e8a8
CW
176/*
177 * tuning the action when the numalink network is extremely delayed
178 */
f073cc8f
CW
179#define CONGESTED_RESPONSE_US 1000 /* 'long' response time, in
180 microseconds */
181#define CONGESTED_REPS 10 /* long delays averaged over
182 this many broadcasts */
8b6e511e 183#define DISABLED_PERIOD 10 /* time for the bau to be
f073cc8f
CW
184 disabled, in seconds */
185/* see msg_type: */
186#define MSG_NOOP 0
187#define MSG_REGULAR 1
188#define MSG_RETRY 2
e8e5e8a8 189
b194b120
CW
190/*
191 * Distribution: 32 bytes (256 bits) (bytes 0-0x1f of descriptor)
192 * If the 'multilevel' flag in the header portion of the descriptor
1812924b
CW
193 * has been set to 0, then endpoint multi-unicast mode is selected.
194 * The distribution specification (32 bytes) is interpreted as a 256-bit
195 * distribution vector. Adjacent bits correspond to consecutive even numbered
196 * nodeIDs. The result of adding the index of a given bit to the 15-bit
77ed23f8 197 * 'base_dest_nasid' field of the header corresponds to the
b194b120
CW
198 * destination nodeID associated with that specified bit.
199 */
a456eaab 200struct pnmask {
f073cc8f 201 unsigned long bits[BITS_TO_LONGS(UV_DISTRIBUTION_SIZE)];
1812924b
CW
202};
203
b194b120 204/*
b8f7fb13 205 * mask of cpu's on a uvhub
b194b120 206 * (during initialization we need to check that unsigned long has
b8f7fb13 207 * enough bits for max. cpu's per uvhub)
b194b120 208 */
1812924b 209struct bau_local_cpumask {
f073cc8f 210 unsigned long bits;
1812924b
CW
211};
212
213/*
214 * Payload: 16 bytes (128 bits) (bytes 0x20-0x2f of descriptor)
215 * only 12 bytes (96 bits) of the payload area are usable.
216 * An additional 3 bytes (bits 27:4) of the header address are carried
217 * to the next bytes of the destination payload queue.
218 * And an additional 2 bytes of the header Suppl_A field are also
219 * carried to the destination payload queue.
220 * But the first byte of the Suppl_A becomes bits 127:120 (the 16th byte)
221 * of the destination payload queue, which is written by the hardware
222 * with the s/w ack resource bit vector.
223 * [ effective message contents (16 bytes (128 bits) maximum), not counting
224 * the s/w ack bit vector ]
225 */
226
b194b120
CW
227/*
228 * The payload is software-defined for INTD transactions
229 */
1812924b 230struct bau_msg_payload {
f073cc8f
CW
231 unsigned long address; /* signifies a page or all
232 TLB's of the cpu */
1812924b 233 /* 64 bits */
f073cc8f 234 unsigned short sending_cpu; /* filled in by sender */
1812924b 235 /* 16 bits */
f073cc8f 236 unsigned short acknowledge_count; /* filled in by destination */
1812924b 237 /* 16 bits */
f073cc8f 238 unsigned int reserved1:32; /* not usable */
1812924b
CW
239};
240
241
b194b120 242/*
da87c937 243 * UV1 Message header: 16 bytes (128 bits) (bytes 0x30-0x3f of descriptor)
b194b120
CW
244 * see table 4.2.3.0.1 in broacast_assist spec.
245 */
da87c937 246struct uv1_bau_msg_header {
f073cc8f 247 unsigned int dest_subnodeid:6; /* must be 0x10, for the LB */
1812924b 248 /* bits 5:0 */
f073cc8f
CW
249 unsigned int base_dest_nasid:15; /* nasid of the first bit */
250 /* bits 20:6 */ /* in uvhub map */
251 unsigned int command:8; /* message type */
1812924b 252 /* bits 28:21 */
f073cc8f
CW
253 /* 0x38: SN3net EndPoint Message */
254 unsigned int rsvd_1:3; /* must be zero */
1812924b 255 /* bits 31:29 */
f073cc8f
CW
256 /* int will align on 32 bits */
257 unsigned int rsvd_2:9; /* must be zero */
1812924b 258 /* bits 40:32 */
f073cc8f
CW
259 /* Suppl_A is 56-41 */
260 unsigned int sequence:16; /* message sequence number */
261 /* bits 56:41 */ /* becomes bytes 16-17 of msg */
262 /* Address field (96:57) is
263 never used as an address
264 (these are address bits
265 42:3) */
266
267 unsigned int rsvd_3:1; /* must be zero */
1812924b 268 /* bit 57 */
f073cc8f 269 /* address bits 27:4 are payload */
b8f7fb13 270 /* these next 24 (58-81) bits become bytes 12-14 of msg */
b8f7fb13 271 /* bits 65:58 land in byte 12 */
f073cc8f
CW
272 unsigned int replied_to:1; /* sent as 0 by the source to
273 byte 12 */
1812924b 274 /* bit 58 */
f073cc8f
CW
275 unsigned int msg_type:3; /* software type of the
276 message */
b8f7fb13 277 /* bits 61:59 */
f073cc8f
CW
278 unsigned int canceled:1; /* message canceled, resource
279 is to be freed*/
b8f7fb13 280 /* bit 62 */
f073cc8f 281 unsigned int payload_1a:1; /* not currently used */
b8f7fb13 282 /* bit 63 */
f073cc8f 283 unsigned int payload_1b:2; /* not currently used */
b8f7fb13
CW
284 /* bits 65:64 */
285
286 /* bits 73:66 land in byte 13 */
f073cc8f 287 unsigned int payload_1ca:6; /* not currently used */
b8f7fb13 288 /* bits 71:66 */
f073cc8f 289 unsigned int payload_1c:2; /* not currently used */
b8f7fb13
CW
290 /* bits 73:72 */
291
292 /* bits 81:74 land in byte 14 */
f073cc8f 293 unsigned int payload_1d:6; /* not currently used */
b8f7fb13 294 /* bits 79:74 */
f073cc8f 295 unsigned int payload_1e:2; /* not currently used */
1812924b
CW
296 /* bits 81:80 */
297
f073cc8f 298 unsigned int rsvd_4:7; /* must be zero */
1812924b 299 /* bits 88:82 */
f073cc8f 300 unsigned int swack_flag:1; /* software acknowledge flag */
1812924b 301 /* bit 89 */
f073cc8f
CW
302 /* INTD trasactions at
303 destination are to wait for
304 software acknowledge */
305 unsigned int rsvd_5:6; /* must be zero */
1812924b 306 /* bits 95:90 */
f073cc8f 307 unsigned int rsvd_6:5; /* must be zero */
1812924b 308 /* bits 100:96 */
f073cc8f
CW
309 unsigned int int_both:1; /* if 1, interrupt both sockets
310 on the uvhub */
1812924b 311 /* bit 101*/
f073cc8f 312 unsigned int fairness:3; /* usually zero */
1812924b 313 /* bits 104:102 */
f073cc8f
CW
314 unsigned int multilevel:1; /* multi-level multicast
315 format */
1812924b 316 /* bit 105 */
f073cc8f
CW
317 /* 0 for TLB: endpoint multi-unicast messages */
318 unsigned int chaining:1; /* next descriptor is part of
319 this activation*/
1812924b 320 /* bit 106 */
f073cc8f 321 unsigned int rsvd_7:21; /* must be zero */
1812924b
CW
322 /* bits 127:107 */
323};
324
da87c937
CW
325/*
326 * UV2 Message header: 16 bytes (128 bits) (bytes 0x30-0x3f of descriptor)
327 * see figure 9-2 of harp_sys.pdf
a26fd719 328 * assuming UV3 is the same
da87c937 329 */
a26fd719 330struct uv2_3_bau_msg_header {
da87c937
CW
331 unsigned int base_dest_nasid:15; /* nasid of the first bit */
332 /* bits 14:0 */ /* in uvhub map */
333 unsigned int dest_subnodeid:5; /* must be 0x10, for the LB */
334 /* bits 19:15 */
335 unsigned int rsvd_1:1; /* must be zero */
336 /* bit 20 */
337 /* Address bits 59:21 */
338 /* bits 25:2 of address (44:21) are payload */
339 /* these next 24 bits become bytes 12-14 of msg */
340 /* bits 28:21 land in byte 12 */
341 unsigned int replied_to:1; /* sent as 0 by the source to
342 byte 12 */
343 /* bit 21 */
344 unsigned int msg_type:3; /* software type of the
345 message */
346 /* bits 24:22 */
347 unsigned int canceled:1; /* message canceled, resource
348 is to be freed*/
349 /* bit 25 */
350 unsigned int payload_1:3; /* not currently used */
351 /* bits 28:26 */
352
353 /* bits 36:29 land in byte 13 */
354 unsigned int payload_2a:3; /* not currently used */
355 unsigned int payload_2b:5; /* not currently used */
356 /* bits 36:29 */
357
358 /* bits 44:37 land in byte 14 */
359 unsigned int payload_3:8; /* not currently used */
360 /* bits 44:37 */
361
362 unsigned int rsvd_2:7; /* reserved */
363 /* bits 51:45 */
364 unsigned int swack_flag:1; /* software acknowledge flag */
365 /* bit 52 */
366 unsigned int rsvd_3a:3; /* must be zero */
367 unsigned int rsvd_3b:8; /* must be zero */
368 unsigned int rsvd_3c:8; /* must be zero */
369 unsigned int rsvd_3d:3; /* must be zero */
370 /* bits 74:53 */
371 unsigned int fairness:3; /* usually zero */
372 /* bits 77:75 */
373
374 unsigned int sequence:16; /* message sequence number */
375 /* bits 93:78 Suppl_A */
376 unsigned int chaining:1; /* next descriptor is part of
377 this activation*/
378 /* bit 94 */
379 unsigned int multilevel:1; /* multi-level multicast
380 format */
381 /* bit 95 */
382 unsigned int rsvd_4:24; /* ordered / source node /
383 source subnode / aging
384 must be zero */
385 /* bits 119:96 */
386 unsigned int command:8; /* message type */
387 /* bits 127:120 */
388};
389
b194b120 390/*
dc163a41 391 * The activation descriptor:
b194b120
CW
392 * The format of the message to send, plus all accompanying control
393 * Should be 64 bytes
394 */
dc163a41 395struct bau_desc {
da87c937 396 struct pnmask distribution;
b194b120
CW
397 /*
398 * message template, consisting of header and payload:
399 */
da87c937
CW
400 union bau_msg_header {
401 struct uv1_bau_msg_header uv1_hdr;
a26fd719 402 struct uv2_3_bau_msg_header uv2_3_hdr;
da87c937
CW
403 } header;
404
405 struct bau_msg_payload payload;
1812924b 406};
da87c937 407/* UV1:
1812924b
CW
408 * -payload-- ---------header------
409 * bytes 0-11 bits 41-56 bits 58-81
410 * A B (2) C (3)
411 *
412 * A/B/C are moved to:
413 * A C B
414 * bytes 0-11 bytes 12-14 bytes 16-17 (byte 15 filled in by hw as vector)
415 * ------------payload queue-----------
416 */
da87c937
CW
417/* UV2:
418 * -payload-- ---------header------
419 * bytes 0-11 bits 70-78 bits 21-44
420 * A B (2) C (3)
421 *
422 * A/B/C are moved to:
423 * A C B
424 * bytes 0-11 bytes 12-14 bytes 16-17 (byte 15 filled in by hw as vector)
425 * ------------payload queue-----------
426 */
1812924b
CW
427
428/*
429 * The payload queue on the destination side is an array of these.
430 * With BAU_MISC_CONTROL set for software acknowledge mode, the messages
431 * are 32 bytes (2 micropackets) (256 bits) in length, but contain only 17
432 * bytes of usable data, including the sw ack vector in byte 15 (bits 127:120)
433 * (12 bytes come from bau_msg_payload, 3 from payload_1, 2 from
f073cc8f 434 * swack_vec and payload_2)
1812924b
CW
435 * "Enabling Software Acknowledgment mode (see Section 4.3.3 Software
436 * Acknowledge Processing) also selects 32 byte (17 bytes usable) payload
437 * operation."
438 */
f073cc8f
CW
439struct bau_pq_entry {
440 unsigned long address; /* signifies a page or all TLB's
441 of the cpu */
1812924b 442 /* 64 bits, bytes 0-7 */
f073cc8f 443 unsigned short sending_cpu; /* cpu that sent the message */
1812924b 444 /* 16 bits, bytes 8-9 */
f073cc8f 445 unsigned short acknowledge_count; /* filled in by destination */
1812924b 446 /* 16 bits, bytes 10-11 */
b8f7fb13 447 /* these next 3 bytes come from bits 58-81 of the message header */
f073cc8f
CW
448 unsigned short replied_to:1; /* sent as 0 by the source */
449 unsigned short msg_type:3; /* software message type */
450 unsigned short canceled:1; /* sent as 0 by the source */
451 unsigned short unused1:3; /* not currently using */
b8f7fb13 452 /* byte 12 */
f073cc8f 453 unsigned char unused2a; /* not currently using */
b8f7fb13 454 /* byte 13 */
f073cc8f 455 unsigned char unused2; /* not currently using */
b8f7fb13 456 /* byte 14 */
f073cc8f 457 unsigned char swack_vec; /* filled in by the hardware */
1812924b 458 /* byte 15 (bits 127:120) */
f073cc8f 459 unsigned short sequence; /* message sequence number */
b8f7fb13 460 /* bytes 16-17 */
f073cc8f 461 unsigned char unused4[2]; /* not currently using bytes 18-19 */
b8f7fb13 462 /* bytes 18-19 */
f073cc8f 463 int number_of_cpus; /* filled in at destination */
1812924b 464 /* 32 bits, bytes 20-23 (aligned) */
f073cc8f 465 unsigned char unused5[8]; /* not using */
1812924b
CW
466 /* bytes 24-31 */
467};
468
4faca155 469struct msg_desc {
f073cc8f
CW
470 struct bau_pq_entry *msg;
471 int msg_slot;
f073cc8f
CW
472 struct bau_pq_entry *queue_first;
473 struct bau_pq_entry *queue_last;
4faca155
CW
474};
475
476struct reset_args {
f073cc8f 477 int sender;
4faca155
CW
478};
479
480/*
481 * This structure is allocated per_cpu for UV TLB shootdown statistics.
482 */
483struct ptc_stats {
484 /* sender statistics */
f073cc8f
CW
485 unsigned long s_giveup; /* number of fall backs to
486 IPI-style flushes */
487 unsigned long s_requestor; /* number of shootdown
488 requests */
489 unsigned long s_stimeout; /* source side timeouts */
490 unsigned long s_dtimeout; /* destination side timeouts */
b54bd9be 491 unsigned long s_strongnacks; /* number of strong nack's */
f073cc8f
CW
492 unsigned long s_time; /* time spent in sending side */
493 unsigned long s_retriesok; /* successful retries */
494 unsigned long s_ntargcpu; /* total number of cpu's
495 targeted */
496 unsigned long s_ntargself; /* times the sending cpu was
497 targeted */
498 unsigned long s_ntarglocals; /* targets of cpus on the local
499 blade */
500 unsigned long s_ntargremotes; /* targets of cpus on remote
501 blades */
502 unsigned long s_ntarglocaluvhub; /* targets of the local hub */
503 unsigned long s_ntargremoteuvhub; /* remotes hubs targeted */
504 unsigned long s_ntarguvhub; /* total number of uvhubs
505 targeted */
506 unsigned long s_ntarguvhub16; /* number of times target
507 hubs >= 16*/
508 unsigned long s_ntarguvhub8; /* number of times target
509 hubs >= 8 */
510 unsigned long s_ntarguvhub4; /* number of times target
511 hubs >= 4 */
512 unsigned long s_ntarguvhub2; /* number of times target
513 hubs >= 2 */
514 unsigned long s_ntarguvhub1; /* number of times target
515 hubs == 1 */
516 unsigned long s_resets_plug; /* ipi-style resets from plug
517 state */
518 unsigned long s_resets_timeout; /* ipi-style resets from
519 timeouts */
520 unsigned long s_busy; /* status stayed busy past
521 s/w timer */
522 unsigned long s_throttles; /* waits in throttle */
523 unsigned long s_retry_messages; /* retry broadcasts */
524 unsigned long s_bau_reenabled; /* for bau enable/disable */
525 unsigned long s_bau_disabled; /* for bau enable/disable */
c5d35d39
CW
526 unsigned long s_uv2_wars; /* uv2 workaround, perm. busy */
527 unsigned long s_uv2_wars_hw; /* uv2 workaround, hiwater */
528 unsigned long s_uv2_war_waits; /* uv2 workaround, long waits */
8b6e511e
CW
529 unsigned long s_overipilimit; /* over the ipi reset limit */
530 unsigned long s_giveuplimit; /* disables, over giveup limit*/
531 unsigned long s_enters; /* entries to the driver */
532 unsigned long s_ipifordisabled; /* fall back to IPI; disabled */
533 unsigned long s_plugged; /* plugged by h/w bug*/
534 unsigned long s_congested; /* giveup on long wait */
4faca155 535 /* destination statistics */
f073cc8f
CW
536 unsigned long d_alltlb; /* times all tlb's on this
537 cpu were flushed */
538 unsigned long d_onetlb; /* times just one tlb on this
539 cpu was flushed */
540 unsigned long d_multmsg; /* interrupts with multiple
541 messages */
542 unsigned long d_nomsg; /* interrupts with no message */
543 unsigned long d_time; /* time spent on destination
544 side */
545 unsigned long d_requestee; /* number of messages
546 processed */
547 unsigned long d_retries; /* number of retry messages
548 processed */
549 unsigned long d_canceled; /* number of messages canceled
550 by retries */
551 unsigned long d_nocanceled; /* retries that found nothing
552 to cancel */
553 unsigned long d_resets; /* number of ipi-style requests
554 processed */
555 unsigned long d_rcanceled; /* number of messages canceled
556 by resets */
557};
558
559struct tunables {
560 int *tunp;
561 int deflt;
4faca155
CW
562};
563
77ed23f8 564struct hub_and_pnode {
f073cc8f
CW
565 short uvhub;
566 short pnode;
567};
568
569struct socket_desc {
570 short num_cpus;
571 short cpu_number[MAX_CPUS_PER_SOCKET];
572};
573
574struct uvhub_desc {
575 unsigned short socket_mask;
576 short num_cpus;
577 short uvhub;
578 short pnode;
579 struct socket_desc socket[2];
77ed23f8 580};
f073cc8f 581
b194b120 582/*
b8f7fb13 583 * one per-cpu; to locate the software tables
b194b120 584 */
1812924b 585struct bau_control {
f073cc8f
CW
586 struct bau_desc *descriptor_base;
587 struct bau_pq_entry *queue_first;
588 struct bau_pq_entry *queue_last;
589 struct bau_pq_entry *bau_msg_head;
590 struct bau_control *uvhub_master;
591 struct bau_control *socket_master;
592 struct ptc_stats *statp;
442d3924 593 cpumask_t *cpumask;
f073cc8f
CW
594 unsigned long timeout_interval;
595 unsigned long set_bau_on_time;
596 atomic_t active_descriptor_count;
597 int plugged_tries;
598 int timeout_tries;
599 int ipi_attempts;
600 int conseccompletes;
1c532e00 601 bool nobau;
8b6e511e 602 short baudisabled;
f073cc8f
CW
603 short cpu;
604 short osnode;
605 short uvhub_cpu;
606 short uvhub;
da87c937 607 short uvhub_version;
f073cc8f
CW
608 short cpus_in_socket;
609 short cpus_in_uvhub;
610 short partition_base_pnode;
8b6e511e 611 short busy; /* all were busy (war) */
f073cc8f
CW
612 unsigned short message_number;
613 unsigned short uvhub_quiesce;
614 short socket_acknowledge_count[DEST_Q_SIZE];
615 cycles_t send_message;
8b6e511e
CW
616 cycles_t period_end;
617 cycles_t period_time;
f073cc8f
CW
618 spinlock_t uvhub_lock;
619 spinlock_t queue_lock;
8b6e511e 620 spinlock_t disable_lock;
e8e5e8a8 621 /* tunables */
f073cc8f
CW
622 int max_concurr;
623 int max_concurr_const;
624 int plugged_delay;
625 int plugsb4reset;
626 int timeoutsb4reset;
627 int ipi_reset_limit;
628 int complete_threshold;
629 int cong_response_us;
630 int cong_reps;
8b6e511e
CW
631 cycles_t disabled_period;
632 int period_giveups;
633 int giveup_limit;
f073cc8f
CW
634 long period_requests;
635 struct hub_and_pnode *thp;
1812924b
CW
636};
637
b18fb2c0 638static inline void write_mmr_data_broadcast(int pnode, unsigned long mmr_image)
f073cc8f
CW
639{
640 write_gmmr(pnode, UVH_BAU_DATA_BROADCAST, mmr_image);
641}
642
b18fb2c0 643static inline void write_mmr_descriptor_base(int pnode, unsigned long mmr_image)
f073cc8f
CW
644{
645 write_gmmr(pnode, UVH_LB_BAU_SB_DESCRIPTOR_BASE, mmr_image);
646}
647
b18fb2c0 648static inline void write_mmr_activation(unsigned long index)
f073cc8f
CW
649{
650 write_lmmr(UVH_LB_BAU_SB_ACTIVATION_CONTROL, index);
651}
652
b18fb2c0 653static inline void write_gmmr_activation(int pnode, unsigned long mmr_image)
f073cc8f
CW
654{
655 write_gmmr(pnode, UVH_LB_BAU_SB_ACTIVATION_CONTROL, mmr_image);
656}
657
b18fb2c0 658static inline void write_mmr_payload_first(int pnode, unsigned long mmr_image)
f073cc8f
CW
659{
660 write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_FIRST, mmr_image);
661}
662
b18fb2c0 663static inline void write_mmr_payload_tail(int pnode, unsigned long mmr_image)
f073cc8f
CW
664{
665 write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_TAIL, mmr_image);
666}
667
b18fb2c0 668static inline void write_mmr_payload_last(int pnode, unsigned long mmr_image)
f073cc8f
CW
669{
670 write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_LAST, mmr_image);
671}
672
b18fb2c0 673static inline void write_mmr_misc_control(int pnode, unsigned long mmr_image)
f073cc8f
CW
674{
675 write_gmmr(pnode, UVH_LB_BAU_MISC_CONTROL, mmr_image);
676}
677
b18fb2c0 678static inline unsigned long read_mmr_misc_control(int pnode)
f073cc8f
CW
679{
680 return read_gmmr(pnode, UVH_LB_BAU_MISC_CONTROL);
681}
682
b18fb2c0 683static inline void write_mmr_sw_ack(unsigned long mr)
f073cc8f
CW
684{
685 uv_write_local_mmr(UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE_ALIAS, mr);
686}
687
c5d35d39
CW
688static inline void write_gmmr_sw_ack(int pnode, unsigned long mr)
689{
690 write_gmmr(pnode, UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE_ALIAS, mr);
691}
692
b18fb2c0 693static inline unsigned long read_mmr_sw_ack(void)
f073cc8f
CW
694{
695 return read_lmmr(UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE);
696}
697
b18fb2c0 698static inline unsigned long read_gmmr_sw_ack(int pnode)
f073cc8f
CW
699{
700 return read_gmmr(pnode, UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE);
701}
702
b18fb2c0 703static inline void write_mmr_data_config(int pnode, unsigned long mr)
f073cc8f
CW
704{
705 uv_write_global_mmr64(pnode, UVH_BAU_DATA_CONFIG, mr);
706}
707
a456eaab 708static inline int bau_uvhub_isset(int uvhub, struct pnmask *dstp)
1812924b 709{
b8f7fb13 710 return constant_test_bit(uvhub, &dstp->bits[0]);
1812924b 711}
a456eaab 712static inline void bau_uvhub_set(int pnode, struct pnmask *dstp)
1812924b 713{
77ed23f8 714 __set_bit(pnode, &dstp->bits[0]);
1812924b 715}
a456eaab 716static inline void bau_uvhubs_clear(struct pnmask *dstp,
b8f7fb13 717 int nbits)
1812924b
CW
718{
719 bitmap_zero(&dstp->bits[0], nbits);
720}
a456eaab 721static inline int bau_uvhub_weight(struct pnmask *dstp)
b8f7fb13
CW
722{
723 return bitmap_weight((unsigned long *)&dstp->bits[0],
724 UV_DISTRIBUTION_SIZE);
725}
1812924b
CW
726
727static inline void bau_cpubits_clear(struct bau_local_cpumask *dstp, int nbits)
728{
729 bitmap_zero(&dstp->bits, nbits);
730}
731
b194b120 732extern void uv_bau_message_intr1(void);
cf910e83
SA
733#ifdef CONFIG_TRACING
734#define trace_uv_bau_message_intr1 uv_bau_message_intr1
735#endif
b194b120 736extern void uv_bau_timeout_intr1(void);
1812924b 737
b8f7fb13
CW
738struct atomic_short {
739 short counter;
740};
741
f073cc8f 742/*
b8f7fb13
CW
743 * atomic_read_short - read a short atomic variable
744 * @v: pointer of type atomic_short
745 *
746 * Atomically reads the value of @v.
747 */
748static inline int atomic_read_short(const struct atomic_short *v)
749{
750 return v->counter;
751}
752
f073cc8f
CW
753/*
754 * atom_asr - add and return a short int
b8f7fb13
CW
755 * @i: short value to add
756 * @v: pointer of type atomic_short
757 *
758 * Atomically adds @i to @v and returns @i + @v
759 */
f073cc8f 760static inline int atom_asr(short i, struct atomic_short *v)
b8f7fb13 761{
a26fd719
CW
762 short __i = i;
763 asm volatile(LOCK_PREFIX "xaddw %0, %1"
764 : "+r" (i), "+m" (v->counter)
765 : : "memory");
766 return i + __i;
b8f7fb13
CW
767}
768
f073cc8f
CW
769/*
770 * conditionally add 1 to *v, unless *v is >= u
771 * return 0 if we cannot add 1 to *v because it is >= u
772 * return 1 if we can add 1 to *v because it is < u
773 * the add is atomic
774 *
775 * This is close to atomic_add_unless(), but this allows the 'u' value
776 * to be lowered below the current 'v'. atomic_add_unless can only stop
777 * on equal.
778 */
779static inline int atomic_inc_unless_ge(spinlock_t *lock, atomic_t *v, int u)
780{
781 spin_lock(lock);
782 if (atomic_read(v) >= u) {
783 spin_unlock(lock);
784 return 0;
785 }
786 atomic_inc(v);
787 spin_unlock(lock);
788 return 1;
789}
790
05e4d316 791#endif /* _ASM_X86_UV_UV_BAU_H */