4 * Copyright(c) 2015-2017 Intel Corporation.
6 * This file is provided under a dual BSD/GPLv2 license. When using or
7 * redistributing this file, you may do so under either license.
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of version 2 of the GNU General Public License as
13 * published by the Free Software Foundation.
15 * This program is distributed in the hope that it will be useful, but
16 * WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 * General Public License for more details.
22 * Redistribution and use in source and binary forms, with or without
23 * modification, are permitted provided that the following conditions
26 * - Redistributions of source code must retain the above copyright
27 * notice, this list of conditions and the following disclaimer.
28 * - Redistributions in binary form must reproduce the above copyright
29 * notice, this list of conditions and the following disclaimer in
30 * the documentation and/or other materials provided with the
32 * - Neither the name of Intel Corporation nor the names of its
33 * contributors may be used to endorse or promote products derived
34 * from this software without specific prior written permission.
36 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
37 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
38 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
39 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
40 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
41 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
42 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
43 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
44 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
45 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
46 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
50 /* send context types */
54 #define SC_USER 3 /* must be the last one: it may take all left */
55 #define SC_MAX 4 /* count of send context types */
57 /* invalid send context index */
58 #define INVALID_SCI 0xff
60 /* PIO buffer release callback function */
61 typedef void (*pio_release_cb
)(void *arg
, int code
);
63 /* PIO release codes - in bits, as there could more than one that apply */
64 #define PRC_OK 0 /* no known error */
65 #define PRC_STATUS_ERR 0x01 /* credit return due to status error */
66 #define PRC_PBC 0x02 /* credit return due to PBC */
67 #define PRC_THRESHOLD 0x04 /* credit return due to threshold */
68 #define PRC_FILL_ERR 0x08 /* credit return due fill error */
69 #define PRC_FORCE 0x10 /* credit return due credit force */
70 #define PRC_SC_DISABLE 0x20 /* clean-up after a context disable */
79 /* an allocated PIO buffer */
81 struct send_context
*sc
;/* back pointer to owning send context */
82 pio_release_cb cb
; /* called when the buffer is released */
83 void *arg
; /* argument for cb */
84 void __iomem
*start
; /* buffer start address */
85 void __iomem
*end
; /* context end address */
86 unsigned long sent_at
; /* buffer is sent when <= free */
87 union mix carry
; /* pending unwritten bytes */
88 u16 qw_written
; /* QW written so far */
89 u8 carry_bytes
; /* number of valid bytes in carry */
92 /* cache line aligned pio buffer array */
93 union pio_shadow_ring
{
95 } ____cacheline_aligned
;
97 /* per-NUMA send context */
99 /* read-only after init */
100 struct hfi1_devdata
*dd
; /* device */
101 union pio_shadow_ring
*sr
; /* shadow ring */
102 void __iomem
*base_addr
; /* start of PIO memory */
103 u32 __percpu
*buffers_allocated
;/* count of buffers allocated */
104 u32 size
; /* context size, in bytes */
106 int node
; /* context home node */
107 u32 sr_size
; /* size of the shadow ring */
108 u16 flags
; /* flags */
109 u8 type
; /* context type */
110 u8 sw_index
; /* software index number */
111 u8 hw_context
; /* hardware context number */
112 u8 group
; /* credit return group */
114 /* allocator fields */
115 spinlock_t alloc_lock ____cacheline_aligned_in_smp
;
116 u32 sr_head
; /* shadow ring head */
117 unsigned long fill
; /* official alloc count */
118 unsigned long alloc_free
; /* copy of free (less cache thrash) */
119 u32 fill_wrap
; /* tracks fill within ring */
120 u32 credits
; /* number of blocks in context */
121 /* adding a new field here would make it part of this cacheline */
123 /* releaser fields */
124 spinlock_t release_lock ____cacheline_aligned_in_smp
;
125 u32 sr_tail
; /* shadow ring tail */
126 unsigned long free
; /* official free count */
127 volatile __le64
*hw_free
; /* HW free counter */
128 /* list for PIO waiters */
129 struct list_head piowait ____cacheline_aligned_in_smp
;
132 spinlock_t credit_ctrl_lock ____cacheline_aligned_in_smp
;
133 u32 credit_intr_count
; /* count of credit intr users */
134 u64 credit_ctrl
; /* cache for credit control */
135 wait_queue_head_t halt_wait
; /* wait until kernel sees interrupt */
136 struct work_struct halt_work
; /* halted context work queue entry */
139 /* send context flags */
140 #define SCF_ENABLED 0x01
141 #define SCF_IN_FREE 0x02
142 #define SCF_HALTED 0x04
143 #define SCF_FROZEN 0x08
144 #define SCF_LINK_DOWN 0x10
146 struct send_context_info
{
147 struct send_context
*sc
; /* allocated working context */
148 u16 allocated
; /* has this been allocated? */
149 u16 type
; /* context type */
150 u16 base
; /* base in PIO array */
151 u16 credits
; /* size in PIO array */
154 /* DMA credit return, index is always (context & 0x7) */
155 struct credit_return
{
156 volatile __le64 cr
[8];
159 /* NUMA indexed credit return array */
160 struct credit_return_base
{
161 struct credit_return
*va
;
165 /* send context configuration sizes (one per type) */
166 struct sc_config_sizes
{
172 * The diagram below details the relationship of the mapping structures
174 * Since the mapping now allows for non-uniform send contexts per vl, the
175 * number of send contexts for a vl is either the vl_scontexts[vl] or
176 * a computation based on num_kernel_send_contexts/num_vls:
179 * nactual = vl_scontexts ? vl_scontexts[vl] : num_kernel_send_contexts/num_vls
181 * n = roundup to next highest power of 2 using nactual
183 * In the case where there are num_kernel_send_contexts/num_vls doesn't divide
184 * evenly, the extras are added from the last vl downward.
186 * For the case where n > nactual, the send contexts are assigned
187 * in a round robin fashion wrapping back to the first send context
188 * for a particular vl.
192 * | +--------------------+
194 * pio_vl_map |--------------------|
195 * +--------------------------+ | ksc[0] -> sc 1 |
196 * | list (RCU) | |--------------------|
197 * |--------------------------| ->| ksc[1] -> sc 2 |
198 * | mask | --/ |--------------------|
199 * |--------------------------| -/ | * |
200 * | actual_vls (max 8) | -/ |--------------------|
201 * |--------------------------| --/ | ksc[n-1] -> sc n |
202 * | vls (max 8) | -/ +--------------------+
203 * |--------------------------| --/
205 * |--------------------------| +--------------------+
206 * | map[1] |--- | mask |
207 * |--------------------------| \---- |--------------------|
208 * | * | \-- | ksc[0] -> sc 1+n |
209 * | * | \---- |--------------------|
210 * | * | \->| ksc[1] -> sc 2+n |
211 * |--------------------------| |--------------------|
212 * | map[vls - 1] |- | * |
213 * +--------------------------+ \- |--------------------|
214 * \- | ksc[m-1] -> sc m+n |
215 * \ +--------------------+
218 * \- +----------------------+
220 * \ |----------------------|
221 * \- | ksc[0] -> sc 1+m+n |
222 * \- |----------------------|
223 * >| ksc[1] -> sc 2+m+n |
224 * |----------------------|
226 * |----------------------|
227 * | ksc[o-1] -> sc o+m+n |
228 * +----------------------+
232 /* Initial number of send contexts per VL */
233 #define INIT_SC_PER_VL 2
236 * struct pio_map_elem - mapping for a vl
237 * @mask - selector mask
238 * @ksc - array of kernel send contexts for this vl
240 * The mask is used to "mod" the selector to
241 * produce index into the trailing array of
244 struct pio_map_elem
{
246 struct send_context
*ksc
[0];
250 * struct pio_vl_map - mapping for a vl
251 * @list - rcu head for free callback
252 * @mask - vl mask to "mod" the vl to produce an index to map array
253 * @actual_vls - number of vls
254 * @vls - numbers of vls rounded to next power of 2
255 * @map - array of pio_map_elem entries
257 * This is the parent mapping structure. The trailing members of the
258 * struct point to pio_map_elem entries, which in turn point to an
259 * array of kscs for that vl.
262 struct rcu_head list
;
266 struct pio_map_elem
*map
[0];
269 int pio_map_init(struct hfi1_devdata
*dd
, u8 port
, u8 num_vls
,
271 void free_pio_map(struct hfi1_devdata
*dd
);
272 struct send_context
*pio_select_send_context_vl(struct hfi1_devdata
*dd
,
273 u32 selector
, u8 vl
);
274 struct send_context
*pio_select_send_context_sc(struct hfi1_devdata
*dd
,
275 u32 selector
, u8 sc5
);
277 /* send context functions */
278 int init_credit_return(struct hfi1_devdata
*dd
);
279 void free_credit_return(struct hfi1_devdata
*dd
);
280 int init_sc_pools_and_sizes(struct hfi1_devdata
*dd
);
281 int init_send_contexts(struct hfi1_devdata
*dd
);
282 int init_credit_return(struct hfi1_devdata
*dd
);
283 int init_pervl_scs(struct hfi1_devdata
*dd
);
284 struct send_context
*sc_alloc(struct hfi1_devdata
*dd
, int type
,
285 uint hdrqentsize
, int numa
);
286 void sc_free(struct send_context
*sc
);
287 int sc_enable(struct send_context
*sc
);
288 void sc_disable(struct send_context
*sc
);
289 int sc_restart(struct send_context
*sc
);
290 void sc_return_credits(struct send_context
*sc
);
291 void sc_flush(struct send_context
*sc
);
292 void sc_drop(struct send_context
*sc
);
293 void sc_stop(struct send_context
*sc
, int bit
);
294 struct pio_buf
*sc_buffer_alloc(struct send_context
*sc
, u32 dw_len
,
295 pio_release_cb cb
, void *arg
);
296 void sc_release_update(struct send_context
*sc
);
297 void sc_return_credits(struct send_context
*sc
);
298 void sc_group_release_update(struct hfi1_devdata
*dd
, u32 hw_context
);
299 void sc_add_credit_return_intr(struct send_context
*sc
);
300 void sc_del_credit_return_intr(struct send_context
*sc
);
301 void sc_set_cr_threshold(struct send_context
*sc
, u32 new_threshold
);
302 u32
sc_percent_to_threshold(struct send_context
*sc
, u32 percent
);
303 u32
sc_mtu_to_threshold(struct send_context
*sc
, u32 mtu
, u32 hdrqentsize
);
304 void hfi1_sc_wantpiobuf_intr(struct send_context
*sc
, u32 needint
);
305 void sc_wait(struct hfi1_devdata
*dd
);
306 void set_pio_integrity(struct send_context
*sc
);
308 /* support functions */
309 void pio_reset_all(struct hfi1_devdata
*dd
);
310 void pio_freeze(struct hfi1_devdata
*dd
);
311 void pio_kernel_unfreeze(struct hfi1_devdata
*dd
);
312 void pio_kernel_linkup(struct hfi1_devdata
*dd
);
314 /* global PIO send control operations */
315 #define PSC_GLOBAL_ENABLE 0
316 #define PSC_GLOBAL_DISABLE 1
317 #define PSC_GLOBAL_VLARB_ENABLE 2
318 #define PSC_GLOBAL_VLARB_DISABLE 3
319 #define PSC_CM_RESET 4
320 #define PSC_DATA_VL_ENABLE 5
321 #define PSC_DATA_VL_DISABLE 6
323 void __cm_reset(struct hfi1_devdata
*dd
, u64 sendctrl
);
324 void pio_send_control(struct hfi1_devdata
*dd
, int op
);
326 /* PIO copy routines */
327 void pio_copy(struct hfi1_devdata
*dd
, struct pio_buf
*pbuf
, u64 pbc
,
328 const void *from
, size_t count
);
329 void seg_pio_copy_start(struct pio_buf
*pbuf
, u64 pbc
,
330 const void *from
, size_t nbytes
);
331 void seg_pio_copy_mid(struct pio_buf
*pbuf
, const void *from
, size_t nbytes
);
332 void seg_pio_copy_end(struct pio_buf
*pbuf
);
334 void seqfile_dump_sci(struct seq_file
*s
, u32 i
,
335 struct send_context_info
*sci
);