1/*
2 * This file is subject to the terms and conditions of the GNU General Public
3 * License.  See the file "COPYING" in the main directory of this archive
4 * for more details.
5 *
6 * SGI UV Broadcast Assist Unit definitions
7 *
8 * Copyright (C) 2008-2011 Silicon Graphics, Inc. All rights reserved.
9 */
10
11#ifndef _ASM_X86_UV_UV_BAU_H
12#define _ASM_X86_UV_UV_BAU_H
13
14#include <linux/bitmap.h>
15#define BITSPERBYTE 8
16
17/*
18 * Broadcast Assist Unit messaging structures
19 *
20 * Selective Broadcast activations are induced by software action
21 * specifying a particular 8-descriptor "set" via a 6-bit index written
22 * to an MMR.
23 * Thus there are 64 unique 512-byte sets of SB descriptors - one set for
24 * each 6-bit index value. These descriptor sets are mapped in sequence
25 * starting with set 0 located at the address specified in the
26 * BAU_SB_DESCRIPTOR_BASE register, set 1 is located at BASE + 512,
27 * set 2 is at BASE + 2*512, set 3 at BASE + 3*512, and so on.
28 *
29 * We will use one set for sending BAU messages from each of the
30 * cpu's on the uvhub.
31 *
32 * TLB shootdown will use the first of the 8 descriptors of each set.
33 * Each of the descriptors is 64 bytes in size (8*64 = 512 bytes in a set).
34 */
35
36#define MAX_CPUS_PER_UVHUB		128
37#define MAX_CPUS_PER_SOCKET		64
38#define ADP_SZ				64 /* hardware-provided max. */
39#define UV_CPUS_PER_AS			32 /* hardware-provided max. */
40#define ITEMS_PER_DESC			8
41/* the 'throttle' to prevent the hardware stay-busy bug */
42#define MAX_BAU_CONCURRENT		3
43#define UV_ACT_STATUS_MASK		0x3
44#define UV_ACT_STATUS_SIZE		2
45#define UV_DISTRIBUTION_SIZE		256
46#define UV_SW_ACK_NPENDING		8
47#define UV1_NET_ENDPOINT_INTD		0x38
48#define UV2_NET_ENDPOINT_INTD		0x28
49#define UV_NET_ENDPOINT_INTD		(is_uv1_hub() ?			\
50			UV1_NET_ENDPOINT_INTD : UV2_NET_ENDPOINT_INTD)
51#define UV_DESC_PSHIFT			49
52#define UV_PAYLOADQ_PNODE_SHIFT		49
53#define UV_PTC_BASENAME			"sgi_uv/ptc_statistics"
54#define UV_BAU_BASENAME			"sgi_uv/bau_tunables"
55#define UV_BAU_TUNABLES_DIR		"sgi_uv"
56#define UV_BAU_TUNABLES_FILE		"bau_tunables"
57#define WHITESPACE			" \t\n"
58#define uv_mmask			((1UL << uv_hub_info->m_val) - 1)
59#define uv_physnodeaddr(x)		((__pa((unsigned long)(x)) & uv_mmask))
60#define cpubit_isset(cpu, bau_local_cpumask) \
61	test_bit((cpu), (bau_local_cpumask).bits)
62
63/* [19:16] SOFT_ACK timeout period  19: 1 is urgency 7  17:16 1 is multiplier */
64/*
65 * UV2: Bit 19 selects between
66 *  (0): 10 microsecond timebase and
67 *  (1): 80 microseconds
68 *  we're using 560us, similar to UV1: 65 units of 10us
69 */
70#define UV1_INTD_SOFT_ACK_TIMEOUT_PERIOD (9UL)
71#define UV2_INTD_SOFT_ACK_TIMEOUT_PERIOD (15UL)
72
73#define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD	(is_uv1_hub() ?			\
74		UV1_INTD_SOFT_ACK_TIMEOUT_PERIOD :			\
75		UV2_INTD_SOFT_ACK_TIMEOUT_PERIOD)
76/* assuming UV3 is the same */
77
78#define BAU_MISC_CONTROL_MULT_MASK	3
79
80#define UVH_AGING_PRESCALE_SEL		0x000000b000UL
81/* [30:28] URGENCY_7  an index into a table of times */
82#define BAU_URGENCY_7_SHIFT		28
83#define BAU_URGENCY_7_MASK		7
84
85#define UVH_TRANSACTION_TIMEOUT		0x000000b200UL
86/* [45:40] BAU - BAU transaction timeout select - a multiplier */
87#define BAU_TRANS_SHIFT			40
88#define BAU_TRANS_MASK			0x3f
89
90/*
91 * shorten some awkward names
92 */
93#define AS_PUSH_SHIFT UVH_LB_BAU_SB_ACTIVATION_CONTROL_PUSH_SHFT
94#define SOFTACK_MSHIFT UVH_LB_BAU_MISC_CONTROL_ENABLE_INTD_SOFT_ACK_MODE_SHFT
95#define SOFTACK_PSHIFT UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHFT
96#define SOFTACK_TIMEOUT_PERIOD UV_INTD_SOFT_ACK_TIMEOUT_PERIOD
97#define PREFETCH_HINT_SHFT UV3H_LB_BAU_MISC_CONTROL_ENABLE_INTD_PREFETCH_HINT_SHFT
98#define SB_STATUS_SHFT UV3H_LB_BAU_MISC_CONTROL_ENABLE_EXTENDED_SB_STATUS_SHFT
99#define write_gmmr	uv_write_global_mmr64
100#define write_lmmr	uv_write_local_mmr
101#define read_lmmr	uv_read_local_mmr
102#define read_gmmr	uv_read_global_mmr64
103
104/*
105 * bits in UVH_LB_BAU_SB_ACTIVATION_STATUS_0/1
106 */
107#define DS_IDLE				0
108#define DS_ACTIVE			1
109#define DS_DESTINATION_TIMEOUT		2
110#define DS_SOURCE_TIMEOUT		3
111/*
112 * bits put together from HRP_LB_BAU_SB_ACTIVATION_STATUS_0/1/2
113 * values 1 and 3 will not occur
114 *        Decoded meaning              ERROR  BUSY    AUX ERR
115 * -------------------------------     ----   -----   -------
116 * IDLE                                 0       0        0
117 * BUSY (active)                        0       1        0
118 * SW Ack Timeout (destination)         1       0        0
119 * SW Ack INTD rejected (strong NACK)   1       0        1
120 * Source Side Time Out Detected        1       1        0
121 * Destination Side PUT Failed          1       1        1
122 */
123#define UV2H_DESC_IDLE			0
124#define UV2H_DESC_BUSY			2
125#define UV2H_DESC_DEST_TIMEOUT		4
126#define UV2H_DESC_DEST_STRONG_NACK	5
127#define UV2H_DESC_SOURCE_TIMEOUT	6
128#define UV2H_DESC_DEST_PUT_ERR		7
129
130/*
131 * delay for 'plugged' timeout retries, in microseconds
132 */
133#define PLUGGED_DELAY			10
134
135/*
136 * threshholds at which to use IPI to free resources
137 */
138/* after this # consecutive 'plugged' timeouts, use IPI to release resources */
139#define PLUGSB4RESET			100
140/* after this many consecutive timeouts, use IPI to release resources */
141#define TIMEOUTSB4RESET			1
142/* at this number uses of IPI to release resources, giveup the request */
143#define IPI_RESET_LIMIT			1
144/* after this # consecutive successes, bump up the throttle if it was lowered */
145#define COMPLETE_THRESHOLD		5
146/* after this # of giveups (fall back to kernel IPI's) disable the use of
147   the BAU for a period of time */
148#define GIVEUP_LIMIT			100
149
150#define UV_LB_SUBNODEID			0x10
151
152/* these two are the same for UV1 and UV2: */
153#define UV_SA_SHFT UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHFT
154#define UV_SA_MASK UVH_LB_BAU_MISC_CONTROL_INTD_SOFT_ACK_TIMEOUT_PERIOD_MASK
155/* 4 bits of software ack period */
156#define UV2_ACK_MASK			0x7UL
157#define UV2_ACK_UNITS_SHFT		3
158#define UV2_EXT_SHFT UV2H_LB_BAU_MISC_CONTROL_ENABLE_EXTENDED_SB_STATUS_SHFT
159
160/*
161 * number of entries in the destination side payload queue
162 */
163#define DEST_Q_SIZE			20
164/*
165 * number of destination side software ack resources
166 */
167#define DEST_NUM_RESOURCES		8
168/*
169 * completion statuses for sending a TLB flush message
170 */
171#define FLUSH_RETRY_PLUGGED		1
172#define FLUSH_RETRY_TIMEOUT		2
173#define FLUSH_GIVEUP			3
174#define FLUSH_COMPLETE			4
175
176/*
177 * tuning the action when the numalink network is extremely delayed
178 */
179#define CONGESTED_RESPONSE_US		1000	/* 'long' response time, in
180						   microseconds */
181#define CONGESTED_REPS			10	/* long delays averaged over
182						   this many broadcasts */
183#define DISABLED_PERIOD			10	/* time for the bau to be
184						   disabled, in seconds */
185/* see msg_type: */
186#define MSG_NOOP			0
187#define MSG_REGULAR			1
188#define MSG_RETRY			2
189
190/*
191 * Distribution: 32 bytes (256 bits) (bytes 0-0x1f of descriptor)
192 * If the 'multilevel' flag in the header portion of the descriptor
193 * has been set to 0, then endpoint multi-unicast mode is selected.
194 * The distribution specification (32 bytes) is interpreted as a 256-bit
195 * distribution vector. Adjacent bits correspond to consecutive even numbered
196 * nodeIDs. The result of adding the index of a given bit to the 15-bit
197 * 'base_dest_nasid' field of the header corresponds to the
198 * destination nodeID associated with that specified bit.
199 */
200struct pnmask {
201	unsigned long		bits[BITS_TO_LONGS(UV_DISTRIBUTION_SIZE)];
202};
203
204/*
205 * mask of cpu's on a uvhub
206 * (during initialization we need to check that unsigned long has
207 *  enough bits for max. cpu's per uvhub)
208 */
209struct bau_local_cpumask {
210	unsigned long		bits;
211};
212
213/*
214 * Payload: 16 bytes (128 bits) (bytes 0x20-0x2f of descriptor)
215 * only 12 bytes (96 bits) of the payload area are usable.
216 * An additional 3 bytes (bits 27:4) of the header address are carried
217 * to the next bytes of the destination payload queue.
218 * And an additional 2 bytes of the header Suppl_A field are also
219 * carried to the destination payload queue.
220 * But the first byte of the Suppl_A becomes bits 127:120 (the 16th byte)
221 * of the destination payload queue, which is written by the hardware
222 * with the s/w ack resource bit vector.
223 * [ effective message contents (16 bytes (128 bits) maximum), not counting
224 *   the s/w ack bit vector  ]
225 */
226
227/*
228 * The payload is software-defined for INTD transactions
229 */
230struct bau_msg_payload {
231	unsigned long	address;		/* signifies a page or all
232						   TLB's of the cpu */
233	/* 64 bits */
234	unsigned short	sending_cpu;		/* filled in by sender */
235	/* 16 bits */
236	unsigned short	acknowledge_count;	/* filled in by destination */
237	/* 16 bits */
238	unsigned int	reserved1:32;		/* not usable */
239};
240
241
242/*
243 * UV1 Message header:  16 bytes (128 bits) (bytes 0x30-0x3f of descriptor)
244 * see table 4.2.3.0.1 in broacast_assist spec.
245 */
246struct uv1_bau_msg_header {
247	unsigned int	dest_subnodeid:6;	/* must be 0x10, for the LB */
248	/* bits 5:0 */
249	unsigned int	base_dest_nasid:15;	/* nasid of the first bit */
250	/* bits 20:6 */				/* in uvhub map */
251	unsigned int	command:8;		/* message type */
252	/* bits 28:21 */
253	/* 0x38: SN3net EndPoint Message */
254	unsigned int	rsvd_1:3;		/* must be zero */
255	/* bits 31:29 */
256	/* int will align on 32 bits */
257	unsigned int	rsvd_2:9;		/* must be zero */
258	/* bits 40:32 */
259	/* Suppl_A is 56-41 */
260	unsigned int	sequence:16;		/* message sequence number */
261	/* bits 56:41 */			/* becomes bytes 16-17 of msg */
262						/* Address field (96:57) is
263						   never used as an address
264						   (these are address bits
265						   42:3) */
266
267	unsigned int	rsvd_3:1;		/* must be zero */
268	/* bit 57 */
269	/* address bits 27:4 are payload */
270	/* these next 24  (58-81) bits become bytes 12-14 of msg */
271	/* bits 65:58 land in byte 12 */
272	unsigned int	replied_to:1;		/* sent as 0 by the source to
273						   byte 12 */
274	/* bit 58 */
275	unsigned int	msg_type:3;		/* software type of the
276						   message */
277	/* bits 61:59 */
278	unsigned int	canceled:1;		/* message canceled, resource
279						   is to be freed*/
280	/* bit 62 */
281	unsigned int	payload_1a:1;		/* not currently used */
282	/* bit 63 */
283	unsigned int	payload_1b:2;		/* not currently used */
284	/* bits 65:64 */
285
286	/* bits 73:66 land in byte 13 */
287	unsigned int	payload_1ca:6;		/* not currently used */
288	/* bits 71:66 */
289	unsigned int	payload_1c:2;		/* not currently used */
290	/* bits 73:72 */
291
292	/* bits 81:74 land in byte 14 */
293	unsigned int	payload_1d:6;		/* not currently used */
294	/* bits 79:74 */
295	unsigned int	payload_1e:2;		/* not currently used */
296	/* bits 81:80 */
297
298	unsigned int	rsvd_4:7;		/* must be zero */
299	/* bits 88:82 */
300	unsigned int	swack_flag:1;		/* software acknowledge flag */
301	/* bit 89 */
302						/* INTD trasactions at
303						   destination are to wait for
304						   software acknowledge */
305	unsigned int	rsvd_5:6;		/* must be zero */
306	/* bits 95:90 */
307	unsigned int	rsvd_6:5;		/* must be zero */
308	/* bits 100:96 */
309	unsigned int	int_both:1;		/* if 1, interrupt both sockets
310						   on the uvhub */
311	/* bit 101*/
312	unsigned int	fairness:3;		/* usually zero */
313	/* bits 104:102 */
314	unsigned int	multilevel:1;		/* multi-level multicast
315						   format */
316	/* bit 105 */
317	/* 0 for TLB: endpoint multi-unicast messages */
318	unsigned int	chaining:1;		/* next descriptor is part of
319						   this activation*/
320	/* bit 106 */
321	unsigned int	rsvd_7:21;		/* must be zero */
322	/* bits 127:107 */
323};
324
325/*
326 * UV2 Message header:  16 bytes (128 bits) (bytes 0x30-0x3f of descriptor)
327 * see figure 9-2 of harp_sys.pdf
328 * assuming UV3 is the same
329 */
330struct uv2_3_bau_msg_header {
331	unsigned int	base_dest_nasid:15;	/* nasid of the first bit */
332	/* bits 14:0 */				/* in uvhub map */
333	unsigned int	dest_subnodeid:5;	/* must be 0x10, for the LB */
334	/* bits 19:15 */
335	unsigned int	rsvd_1:1;		/* must be zero */
336	/* bit 20 */
337	/* Address bits 59:21 */
338	/* bits 25:2 of address (44:21) are payload */
339	/* these next 24 bits become bytes 12-14 of msg */
340	/* bits 28:21 land in byte 12 */
341	unsigned int	replied_to:1;		/* sent as 0 by the source to
342						   byte 12 */
343	/* bit 21 */
344	unsigned int	msg_type:3;		/* software type of the
345						   message */
346	/* bits 24:22 */
347	unsigned int	canceled:1;		/* message canceled, resource
348						   is to be freed*/
349	/* bit 25 */
350	unsigned int	payload_1:3;		/* not currently used */
351	/* bits 28:26 */
352
353	/* bits 36:29 land in byte 13 */
354	unsigned int	payload_2a:3;		/* not currently used */
355	unsigned int	payload_2b:5;		/* not currently used */
356	/* bits 36:29 */
357
358	/* bits 44:37 land in byte 14 */
359	unsigned int	payload_3:8;		/* not currently used */
360	/* bits 44:37 */
361
362	unsigned int	rsvd_2:7;		/* reserved */
363	/* bits 51:45 */
364	unsigned int	swack_flag:1;		/* software acknowledge flag */
365	/* bit 52 */
366	unsigned int	rsvd_3a:3;		/* must be zero */
367	unsigned int	rsvd_3b:8;		/* must be zero */
368	unsigned int	rsvd_3c:8;		/* must be zero */
369	unsigned int	rsvd_3d:3;		/* must be zero */
370	/* bits 74:53 */
371	unsigned int	fairness:3;		/* usually zero */
372	/* bits 77:75 */
373
374	unsigned int	sequence:16;		/* message sequence number */
375	/* bits 93:78  Suppl_A  */
376	unsigned int	chaining:1;		/* next descriptor is part of
377						   this activation*/
378	/* bit 94 */
379	unsigned int	multilevel:1;		/* multi-level multicast
380						   format */
381	/* bit 95 */
382	unsigned int	rsvd_4:24;		/* ordered / source node /
383						   source subnode / aging
384						   must be zero */
385	/* bits 119:96 */
386	unsigned int	command:8;		/* message type */
387	/* bits 127:120 */
388};
389
390/*
391 * The activation descriptor:
392 * The format of the message to send, plus all accompanying control
393 * Should be 64 bytes
394 */
395struct bau_desc {
396	struct pnmask				distribution;
397	/*
398	 * message template, consisting of header and payload:
399	 */
400	union bau_msg_header {
401		struct uv1_bau_msg_header	uv1_hdr;
402		struct uv2_3_bau_msg_header	uv2_3_hdr;
403	} header;
404
405	struct bau_msg_payload			payload;
406};
407/* UV1:
408 *   -payload--    ---------header------
409 *   bytes 0-11    bits 41-56  bits 58-81
410 *       A           B  (2)      C (3)
411 *
412 *            A/B/C are moved to:
413 *       A            C          B
414 *   bytes 0-11  bytes 12-14  bytes 16-17  (byte 15 filled in by hw as vector)
415 *   ------------payload queue-----------
416 */
417/* UV2:
418 *   -payload--    ---------header------
419 *   bytes 0-11    bits 70-78  bits 21-44
420 *       A           B  (2)      C (3)
421 *
422 *            A/B/C are moved to:
423 *       A            C          B
424 *   bytes 0-11  bytes 12-14  bytes 16-17  (byte 15 filled in by hw as vector)
425 *   ------------payload queue-----------
426 */
427
428/*
429 * The payload queue on the destination side is an array of these.
430 * With BAU_MISC_CONTROL set for software acknowledge mode, the messages
431 * are 32 bytes (2 micropackets) (256 bits) in length, but contain only 17
432 * bytes of usable data, including the sw ack vector in byte 15 (bits 127:120)
433 * (12 bytes come from bau_msg_payload, 3 from payload_1, 2 from
434 *  swack_vec and payload_2)
435 * "Enabling Software Acknowledgment mode (see Section 4.3.3 Software
436 *  Acknowledge Processing) also selects 32 byte (17 bytes usable) payload
437 *  operation."
438 */
439struct bau_pq_entry {
440	unsigned long	address;	/* signifies a page or all TLB's
441					   of the cpu */
442	/* 64 bits, bytes 0-7 */
443	unsigned short	sending_cpu;	/* cpu that sent the message */
444	/* 16 bits, bytes 8-9 */
445	unsigned short	acknowledge_count; /* filled in by destination */
446	/* 16 bits, bytes 10-11 */
447	/* these next 3 bytes come from bits 58-81 of the message header */
448	unsigned short	replied_to:1;	/* sent as 0 by the source */
449	unsigned short	msg_type:3;	/* software message type */
450	unsigned short	canceled:1;	/* sent as 0 by the source */
451	unsigned short	unused1:3;	/* not currently using */
452	/* byte 12 */
453	unsigned char	unused2a;	/* not currently using */
454	/* byte 13 */
455	unsigned char	unused2;	/* not currently using */
456	/* byte 14 */
457	unsigned char	swack_vec;	/* filled in by the hardware */
458	/* byte 15 (bits 127:120) */
459	unsigned short	sequence;	/* message sequence number */
460	/* bytes 16-17 */
461	unsigned char	unused4[2];	/* not currently using bytes 18-19 */
462	/* bytes 18-19 */
463	int		number_of_cpus;	/* filled in at destination */
464	/* 32 bits, bytes 20-23 (aligned) */
465	unsigned char	unused5[8];	/* not using */
466	/* bytes 24-31 */
467};
468
469struct msg_desc {
470	struct bau_pq_entry	*msg;
471	int			msg_slot;
472	struct bau_pq_entry	*queue_first;
473	struct bau_pq_entry	*queue_last;
474};
475
476struct reset_args {
477	int			sender;
478};
479
480/*
481 * This structure is allocated per_cpu for UV TLB shootdown statistics.
482 */
483struct ptc_stats {
484	/* sender statistics */
485	unsigned long	s_giveup;		/* number of fall backs to
486						   IPI-style flushes */
487	unsigned long	s_requestor;		/* number of shootdown
488						   requests */
489	unsigned long	s_stimeout;		/* source side timeouts */
490	unsigned long	s_dtimeout;		/* destination side timeouts */
491	unsigned long	s_strongnacks;		/* number of strong nack's */
492	unsigned long	s_time;			/* time spent in sending side */
493	unsigned long	s_retriesok;		/* successful retries */
494	unsigned long	s_ntargcpu;		/* total number of cpu's
495						   targeted */
496	unsigned long	s_ntargself;		/* times the sending cpu was
497						   targeted */
498	unsigned long	s_ntarglocals;		/* targets of cpus on the local
499						   blade */
500	unsigned long	s_ntargremotes;		/* targets of cpus on remote
501						   blades */
502	unsigned long	s_ntarglocaluvhub;	/* targets of the local hub */
503	unsigned long	s_ntargremoteuvhub;	/* remotes hubs targeted */
504	unsigned long	s_ntarguvhub;		/* total number of uvhubs
505						   targeted */
506	unsigned long	s_ntarguvhub16;		/* number of times target
507						   hubs >= 16*/
508	unsigned long	s_ntarguvhub8;		/* number of times target
509						   hubs >= 8 */
510	unsigned long	s_ntarguvhub4;		/* number of times target
511						   hubs >= 4 */
512	unsigned long	s_ntarguvhub2;		/* number of times target
513						   hubs >= 2 */
514	unsigned long	s_ntarguvhub1;		/* number of times target
515						   hubs == 1 */
516	unsigned long	s_resets_plug;		/* ipi-style resets from plug
517						   state */
518	unsigned long	s_resets_timeout;	/* ipi-style resets from
519						   timeouts */
520	unsigned long	s_busy;			/* status stayed busy past
521						   s/w timer */
522	unsigned long	s_throttles;		/* waits in throttle */
523	unsigned long	s_retry_messages;	/* retry broadcasts */
524	unsigned long	s_bau_reenabled;	/* for bau enable/disable */
525	unsigned long	s_bau_disabled;		/* for bau enable/disable */
526	unsigned long	s_uv2_wars;		/* uv2 workaround, perm. busy */
527	unsigned long	s_uv2_wars_hw;		/* uv2 workaround, hiwater */
528	unsigned long	s_uv2_war_waits;	/* uv2 workaround, long waits */
529	unsigned long	s_overipilimit;		/* over the ipi reset limit */
530	unsigned long	s_giveuplimit;		/* disables, over giveup limit*/
531	unsigned long	s_enters;		/* entries to the driver */
532	unsigned long	s_ipifordisabled;	/* fall back to IPI; disabled */
533	unsigned long	s_plugged;		/* plugged by h/w bug*/
534	unsigned long	s_congested;		/* giveup on long wait */
535	/* destination statistics */
536	unsigned long	d_alltlb;		/* times all tlb's on this
537						   cpu were flushed */
538	unsigned long	d_onetlb;		/* times just one tlb on this
539						   cpu was flushed */
540	unsigned long	d_multmsg;		/* interrupts with multiple
541						   messages */
542	unsigned long	d_nomsg;		/* interrupts with no message */
543	unsigned long	d_time;			/* time spent on destination
544						   side */
545	unsigned long	d_requestee;		/* number of messages
546						   processed */
547	unsigned long	d_retries;		/* number of retry messages
548						   processed */
549	unsigned long	d_canceled;		/* number of messages canceled
550						   by retries */
551	unsigned long	d_nocanceled;		/* retries that found nothing
552						   to cancel */
553	unsigned long	d_resets;		/* number of ipi-style requests
554						   processed */
555	unsigned long	d_rcanceled;		/* number of messages canceled
556						   by resets */
557};
558
559struct tunables {
560	int			*tunp;
561	int			deflt;
562};
563
564struct hub_and_pnode {
565	short			uvhub;
566	short			pnode;
567};
568
569struct socket_desc {
570	short			num_cpus;
571	short			cpu_number[MAX_CPUS_PER_SOCKET];
572};
573
574struct uvhub_desc {
575	unsigned short		socket_mask;
576	short			num_cpus;
577	short			uvhub;
578	short			pnode;
579	struct socket_desc	socket[2];
580};
581
582/*
583 * one per-cpu; to locate the software tables
584 */
585struct bau_control {
586	struct bau_desc		*descriptor_base;
587	struct bau_pq_entry	*queue_first;
588	struct bau_pq_entry	*queue_last;
589	struct bau_pq_entry	*bau_msg_head;
590	struct bau_control	*uvhub_master;
591	struct bau_control	*socket_master;
592	struct ptc_stats	*statp;
593	cpumask_t		*cpumask;
594	unsigned long		timeout_interval;
595	unsigned long		set_bau_on_time;
596	atomic_t		active_descriptor_count;
597	int			plugged_tries;
598	int			timeout_tries;
599	int			ipi_attempts;
600	int			conseccompletes;
601	short			nobau;
602	short			baudisabled;
603	short			cpu;
604	short			osnode;
605	short			uvhub_cpu;
606	short			uvhub;
607	short			uvhub_version;
608	short			cpus_in_socket;
609	short			cpus_in_uvhub;
610	short			partition_base_pnode;
611	short			busy;       /* all were busy (war) */
612	unsigned short		message_number;
613	unsigned short		uvhub_quiesce;
614	short			socket_acknowledge_count[DEST_Q_SIZE];
615	cycles_t		send_message;
616	cycles_t		period_end;
617	cycles_t		period_time;
618	spinlock_t		uvhub_lock;
619	spinlock_t		queue_lock;
620	spinlock_t		disable_lock;
621	/* tunables */
622	int			max_concurr;
623	int			max_concurr_const;
624	int			plugged_delay;
625	int			plugsb4reset;
626	int			timeoutsb4reset;
627	int			ipi_reset_limit;
628	int			complete_threshold;
629	int			cong_response_us;
630	int			cong_reps;
631	cycles_t		disabled_period;
632	int			period_giveups;
633	int			giveup_limit;
634	long			period_requests;
635	struct hub_and_pnode	*thp;
636};
637
638static inline void write_mmr_data_broadcast(int pnode, unsigned long mmr_image)
639{
640	write_gmmr(pnode, UVH_BAU_DATA_BROADCAST, mmr_image);
641}
642
643static inline void write_mmr_descriptor_base(int pnode, unsigned long mmr_image)
644{
645	write_gmmr(pnode, UVH_LB_BAU_SB_DESCRIPTOR_BASE, mmr_image);
646}
647
648static inline void write_mmr_activation(unsigned long index)
649{
650	write_lmmr(UVH_LB_BAU_SB_ACTIVATION_CONTROL, index);
651}
652
653static inline void write_gmmr_activation(int pnode, unsigned long mmr_image)
654{
655	write_gmmr(pnode, UVH_LB_BAU_SB_ACTIVATION_CONTROL, mmr_image);
656}
657
658static inline void write_mmr_payload_first(int pnode, unsigned long mmr_image)
659{
660	write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_FIRST, mmr_image);
661}
662
663static inline void write_mmr_payload_tail(int pnode, unsigned long mmr_image)
664{
665	write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_TAIL, mmr_image);
666}
667
668static inline void write_mmr_payload_last(int pnode, unsigned long mmr_image)
669{
670	write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_LAST, mmr_image);
671}
672
673static inline void write_mmr_misc_control(int pnode, unsigned long mmr_image)
674{
675	write_gmmr(pnode, UVH_LB_BAU_MISC_CONTROL, mmr_image);
676}
677
678static inline unsigned long read_mmr_misc_control(int pnode)
679{
680	return read_gmmr(pnode, UVH_LB_BAU_MISC_CONTROL);
681}
682
683static inline void write_mmr_sw_ack(unsigned long mr)
684{
685	uv_write_local_mmr(UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE_ALIAS, mr);
686}
687
688static inline void write_gmmr_sw_ack(int pnode, unsigned long mr)
689{
690	write_gmmr(pnode, UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE_ALIAS, mr);
691}
692
693static inline unsigned long read_mmr_sw_ack(void)
694{
695	return read_lmmr(UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE);
696}
697
698static inline unsigned long read_gmmr_sw_ack(int pnode)
699{
700	return read_gmmr(pnode, UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE);
701}
702
703static inline void write_mmr_data_config(int pnode, unsigned long mr)
704{
705	uv_write_global_mmr64(pnode, UVH_BAU_DATA_CONFIG, mr);
706}
707
708static inline int bau_uvhub_isset(int uvhub, struct pnmask *dstp)
709{
710	return constant_test_bit(uvhub, &dstp->bits[0]);
711}
712static inline void bau_uvhub_set(int pnode, struct pnmask *dstp)
713{
714	__set_bit(pnode, &dstp->bits[0]);
715}
716static inline void bau_uvhubs_clear(struct pnmask *dstp,
717				    int nbits)
718{
719	bitmap_zero(&dstp->bits[0], nbits);
720}
721static inline int bau_uvhub_weight(struct pnmask *dstp)
722{
723	return bitmap_weight((unsigned long *)&dstp->bits[0],
724				UV_DISTRIBUTION_SIZE);
725}
726
727static inline void bau_cpubits_clear(struct bau_local_cpumask *dstp, int nbits)
728{
729	bitmap_zero(&dstp->bits, nbits);
730}
731
732extern void uv_bau_message_intr1(void);
733#ifdef CONFIG_TRACING
734#define trace_uv_bau_message_intr1 uv_bau_message_intr1
735#endif
736extern void uv_bau_timeout_intr1(void);
737
738struct atomic_short {
739	short counter;
740};
741
742/*
743 * atomic_read_short - read a short atomic variable
744 * @v: pointer of type atomic_short
745 *
746 * Atomically reads the value of @v.
747 */
748static inline int atomic_read_short(const struct atomic_short *v)
749{
750	return v->counter;
751}
752
753/*
754 * atom_asr - add and return a short int
755 * @i: short value to add
756 * @v: pointer of type atomic_short
757 *
758 * Atomically adds @i to @v and returns @i + @v
759 */
760static inline int atom_asr(short i, struct atomic_short *v)
761{
762	short __i = i;
763	asm volatile(LOCK_PREFIX "xaddw %0, %1"
764			: "+r" (i), "+m" (v->counter)
765			: : "memory");
766	return i + __i;
767}
768
769/*
770 * conditionally add 1 to *v, unless *v is >= u
771 * return 0 if we cannot add 1 to *v because it is >= u
772 * return 1 if we can add 1 to *v because it is < u
773 * the add is atomic
774 *
775 * This is close to atomic_add_unless(), but this allows the 'u' value
776 * to be lowered below the current 'v'.  atomic_add_unless can only stop
777 * on equal.
778 */
779static inline int atomic_inc_unless_ge(spinlock_t *lock, atomic_t *v, int u)
780{
781	spin_lock(lock);
782	if (atomic_read(v) >= u) {
783		spin_unlock(lock);
784		return 0;
785	}
786	atomic_inc(v);
787	spin_unlock(lock);
788	return 1;
789}
790
791#endif /* _ASM_X86_UV_UV_BAU_H */
792