/*
 * Copyright (c) 2006, 2007, 2009 QLogic Corporation. All rights reserved.
 * Copyright (c) 2005, 2006 PathScale, Inc. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

#include "qib.h"

/**
 * qib_alloc_lkey - allocate an lkey
 * @mr: memory region that this lkey protects
 * @dma_region: 0->normal key, 1->restricted DMA key
 *
 * Returns 0 if successful, otherwise returns -errno.
 *
 * Increments mr reference count as required.
 *
 * Sets the lkey field of mr for non-dma regions.
 */

int qib_alloc_lkey(struct qib_mregion *mr, int dma_region)
{
	unsigned long flags;
	u32 r;
	u32 n;
	int ret = 0;
	struct qib_ibdev *dev = to_idev(mr->pd->device);
	struct qib_lkey_table *rkt = &dev->lk_table;

	spin_lock_irqsave(&rkt->lock, flags);

	/* special case for dma_mr lkey == 0 */
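	/*
	 * LKEY 0 is the reserved "unrestricted" key used for kernel
	 * addresses (see the comments in qib_lkey_ok() and qib_rkey_ok()
	 * below and the "never zero" comment later in this function), so
	 * the DMA region is published through dev->dma_mr rather than
	 * occupying a slot in the lkey table.
	 */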
	if (dma_region) {
		struct qib_mregion *tmr;

		tmr = rcu_dereference(dev->dma_mr);
		if (!tmr) {
			qib_get_mr(mr);
			rcu_assign_pointer(dev->dma_mr, mr);
			mr->lkey_published = 1;
		}
		goto success;
	}

	/* Find the next available LKEY */
	r = rkt->next;
	n = r;
	for (;;) {
		if (rkt->table[r] == NULL)
			break;
		r = (r + 1) & (rkt->max - 1);
		if (r == n)
			goto bail;
	}
	rkt->next = (r + 1) & (rkt->max - 1);

	/*
	 * Make sure lkey is never zero which is reserved to indicate an
	 * unrestricted LKEY.
	 */
	rkt->gen++;
	mr->lkey = (r << (32 - ib_qib_lkey_table_size)) |
		((((1 << (24 - ib_qib_lkey_table_size)) - 1) & rkt->gen)
		 << 8);
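	/*
	 * Layout, assuming the default ib_qib_lkey_table_size of 16
	 * (illustrative; the module parameter may differ):
	 *   bits 31..16  table index r
	 *   bits 15..8   low 8 bits of rkt->gen (generation counter)
	 *   bits  7..0   zero
	 * e.g. r = 0x0003, gen = 0x5a  ->  lkey = 0x00035a00.
	 */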
	if (mr->lkey == 0) {
		mr->lkey |= 1 << 8;
		rkt->gen++;
	}
	qib_get_mr(mr);
	rcu_assign_pointer(rkt->table[r], mr);
	mr->lkey_published = 1;
success:
	spin_unlock_irqrestore(&rkt->lock, flags);
out:
	return ret;
bail:
	spin_unlock_irqrestore(&rkt->lock, flags);
	ret = -ENOMEM;
	goto out;
}
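
/*
 * Illustrative only (not a call site in this file): a registration path
 * would typically pair the two helpers roughly as follows, with
 * "new_mregion" standing in for however the caller obtains the region:
 *
 *	if (qib_alloc_lkey(new_mregion, 0))
 *		goto err;			// lkey table full
 *	...					// use new_mregion->lkey
 *	qib_free_lkey(new_mregion);		// unpublish before teardown
 */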

/**
 * qib_free_lkey - free an lkey
 * @mr: mr to free from tables
 */
void qib_free_lkey(struct qib_mregion *mr)
{
	unsigned long flags;
	u32 lkey = mr->lkey;
	u32 r;
	struct qib_ibdev *dev = to_idev(mr->pd->device);
	struct qib_lkey_table *rkt = &dev->lk_table;

	spin_lock_irqsave(&rkt->lock, flags);
	if (!mr->lkey_published)
		goto out;
	if (lkey == 0)
		rcu_assign_pointer(dev->dma_mr, NULL);
	else {
		r = lkey >> (32 - ib_qib_lkey_table_size);
		rcu_assign_pointer(rkt->table[r], NULL);
	}
	qib_put_mr(mr);
	mr->lkey_published = 0;
out:
	spin_unlock_irqrestore(&rkt->lock, flags);
}
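
/*
 * Note on qib_free_lkey(): it only unpublishes the key from the lookup
 * structures.  A reader that already took a reference with
 * atomic_inc_not_zero(&mr->refcount) keeps the region valid; the region
 * itself is released only when its reference count finally drops
 * (see qib_put_mr()).
 */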

/**
 * qib_lkey_ok - check IB SGE for validity and initialize
 * @rkt: table containing lkey to check SGE against
 * @pd: protection domain
 * @isge: outgoing internal SGE
 * @sge: SGE to check
 * @acc: access flags
 *
 * Return 1 if valid and successful, otherwise returns 0.
 *
 * increments the reference count upon success
 *
 * Check the IB SGE for validity and initialize our internal version
 * of it.
 */
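/*
 * Lookup pattern used below (and in qib_rkey_ok()): dereference the
 * table entry under rcu_read_lock(), validate key/PD/bounds/access, and
 * only then take a reference with atomic_inc_not_zero(), so a region
 * already racing toward free (refcount at zero) is rejected rather than
 * resurrected.
 */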
int qib_lkey_ok(struct qib_lkey_table *rkt, struct qib_pd *pd,
		struct qib_sge *isge, struct ib_sge *sge, int acc)
{
	struct qib_mregion *mr;
	unsigned n, m;
	size_t off;

	/*
	 * We use LKEY == zero for kernel virtual addresses
	 * (see qib_get_dma_mr and qib_dma.c).
	 */
	rcu_read_lock();
	if (sge->lkey == 0) {
		struct qib_ibdev *dev = to_idev(pd->ibpd.device);

		if (pd->user)
			goto bail;
		mr = rcu_dereference(dev->dma_mr);
		if (!mr)
			goto bail;
		if (unlikely(!atomic_inc_not_zero(&mr->refcount)))
			goto bail;
		rcu_read_unlock();

		isge->mr = mr;
		isge->vaddr = (void *) sge->addr;
		isge->length = sge->length;
		isge->sge_length = sge->length;
		isge->m = 0;
		isge->n = 0;
		goto ok;
	}
	mr = rcu_dereference(
		rkt->table[(sge->lkey >> (32 - ib_qib_lkey_table_size))]);
	if (unlikely(!mr || mr->lkey != sge->lkey || mr->pd != &pd->ibpd))
		goto bail;

	off = sge->addr - mr->user_base;
	if (unlikely(sge->addr < mr->user_base ||
		     off + sge->length > mr->length ||
		     (mr->access_flags & acc) != acc))
		goto bail;
	if (unlikely(!atomic_inc_not_zero(&mr->refcount)))
		goto bail;
	rcu_read_unlock();

	off += mr->offset;
	if (mr->page_shift) {
		/*
		page sizes are uniform power of 2 so no loop is necessary
		entries_spanned_by_off is the number of times the loop below
		would have executed.
		*/
		size_t entries_spanned_by_off;

		entries_spanned_by_off = off >> mr->page_shift;
		off -= (entries_spanned_by_off << mr->page_shift);
		m = entries_spanned_by_off/QIB_SEGSZ;
		n = entries_spanned_by_off%QIB_SEGSZ;
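		/*
		 * Worked example (illustrative numbers only): with
		 * page_shift == 12 and off == 0x5000, entries_spanned_by_off
		 * is 5, off becomes 0, and m/n select the 6th segment
		 * (m = 5 / QIB_SEGSZ, n = 5 % QIB_SEGSZ, assuming
		 * QIB_SEGSZ > 5).
		 */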
	} else {
		m = 0;
		n = 0;
		while (off >= mr->map[m]->segs[n].length) {
			off -= mr->map[m]->segs[n].length;
			n++;
			if (n >= QIB_SEGSZ) {
				m++;
				n = 0;
			}
		}
	}
	isge->mr = mr;
	isge->vaddr = mr->map[m]->segs[n].vaddr + off;
	isge->length = mr->map[m]->segs[n].length - off;
	isge->sge_length = sge->length;
	isge->m = m;
	isge->n = n;
ok:
	return 1;
bail:
	rcu_read_unlock();
	return 0;
}

/**
 * qib_rkey_ok - check the IB virtual address, length, and RKEY
 * @qp: qp for validation
 * @sge: SGE state
 * @len: length of data
 * @vaddr: virtual address to place data
 * @rkey: rkey to check
 * @acc: access flags
 *
 * Return 1 if successful, otherwise 0.
 *
 * increments the reference count upon success
 */
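/*
 * This is the responder-side counterpart of qib_lkey_ok(): the key and
 * virtual address arrive in an incoming RDMA request, so the bounds
 * check below is against mr->iova rather than mr->user_base.
 */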
int qib_rkey_ok(struct qib_qp *qp, struct qib_sge *sge,
		u32 len, u64 vaddr, u32 rkey, int acc)
{
	struct qib_lkey_table *rkt = &to_idev(qp->ibqp.device)->lk_table;
	struct qib_mregion *mr;
	unsigned n, m;
	size_t off;

	/*
	 * We use RKEY == zero for kernel virtual addresses
	 * (see qib_get_dma_mr and qib_dma.c).
	 */
	rcu_read_lock();
	if (rkey == 0) {
		struct qib_pd *pd = to_ipd(qp->ibqp.pd);
		struct qib_ibdev *dev = to_idev(pd->ibpd.device);

		if (pd->user)
			goto bail;
		mr = rcu_dereference(dev->dma_mr);
		if (!mr)
			goto bail;
		if (unlikely(!atomic_inc_not_zero(&mr->refcount)))
			goto bail;
		rcu_read_unlock();

		sge->mr = mr;
		sge->vaddr = (void *) vaddr;
		sge->length = len;
		sge->sge_length = len;
		sge->m = 0;
		sge->n = 0;
		goto ok;
	}

	mr = rcu_dereference(
		rkt->table[(rkey >> (32 - ib_qib_lkey_table_size))]);
	if (unlikely(!mr || mr->lkey != rkey || qp->ibqp.pd != mr->pd))
		goto bail;

	off = vaddr - mr->iova;
	if (unlikely(vaddr < mr->iova || off + len > mr->length ||
		     (mr->access_flags & acc) == 0))
		goto bail;
	if (unlikely(!atomic_inc_not_zero(&mr->refcount)))
		goto bail;
	rcu_read_unlock();

	off += mr->offset;
	if (mr->page_shift) {
		/*
		page sizes are uniform power of 2 so no loop is necessary
		entries_spanned_by_off is the number of times the loop below
		would have executed.
		*/
		size_t entries_spanned_by_off;

		entries_spanned_by_off = off >> mr->page_shift;
		off -= (entries_spanned_by_off << mr->page_shift);
		m = entries_spanned_by_off/QIB_SEGSZ;
		n = entries_spanned_by_off%QIB_SEGSZ;
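		/* Same segment arithmetic as in qib_lkey_ok() above. */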
	} else {
		m = 0;
		n = 0;
		while (off >= mr->map[m]->segs[n].length) {
			off -= mr->map[m]->segs[n].length;
			n++;
			if (n >= QIB_SEGSZ) {
				m++;
				n = 0;
			}
		}
	}
	sge->mr = mr;
	sge->vaddr = mr->map[m]->segs[n].vaddr + off;
	sge->length = mr->map[m]->segs[n].length - off;
	sge->sge_length = len;
	sge->m = m;
	sge->n = n;
ok:
	return 1;
bail:
	rcu_read_unlock();
	return 0;
}

/*
 * Initialize the memory region specified by the work request.
 */
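/*
 * Invoked when a fast-register work request is posted on a QP
 * (IB_WR_FAST_REG_MR in this kernel generation): the request names an
 * already-allocated MR by rkey, and this routine validates it against
 * the entry published in the lkey table, then copies the supplied page
 * list into the region's segment map.
 */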
int qib_fast_reg_mr(struct qib_qp *qp, struct ib_send_wr *wr)
{
	struct qib_lkey_table *rkt = &to_idev(qp->ibqp.device)->lk_table;
	struct qib_pd *pd = to_ipd(qp->ibqp.pd);
	struct qib_mregion *mr;
	u32 rkey = wr->wr.fast_reg.rkey;
	unsigned i, n, m;
	int ret = -EINVAL;
	unsigned long flags;
	u64 *page_list;
	size_t ps;

	spin_lock_irqsave(&rkt->lock, flags);
	if (pd->user || rkey == 0)
		goto bail;

	mr = rcu_dereference_protected(
		rkt->table[(rkey >> (32 - ib_qib_lkey_table_size))],
		lockdep_is_held(&rkt->lock));
	if (unlikely(mr == NULL || qp->ibqp.pd != mr->pd))
		goto bail;

	if (wr->wr.fast_reg.page_list_len > mr->max_segs)
		goto bail;

	ps = 1UL << wr->wr.fast_reg.page_shift;
	if (wr->wr.fast_reg.length > ps * wr->wr.fast_reg.page_list_len)
		goto bail;

	mr->user_base = wr->wr.fast_reg.iova_start;
	mr->iova = wr->wr.fast_reg.iova_start;
	mr->lkey = rkey;
	mr->length = wr->wr.fast_reg.length;
	mr->access_flags = wr->wr.fast_reg.access_flags;
	page_list = wr->wr.fast_reg.page_list->page_list;
	m = 0;
	n = 0;
	for (i = 0; i < wr->wr.fast_reg.page_list_len; i++) {
		mr->map[m]->segs[n].vaddr = (void *) page_list[i];
		mr->map[m]->segs[n].length = ps;
		if (++n == QIB_SEGSZ) {
			m++;
			n = 0;
		}
	}

	ret = 0;
bail:
	spin_unlock_irqrestore(&rkt->lock, flags);
	return ret;
}
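
/*
 * Illustrative sketch only (simplified, hypothetical caller): the fields
 * consumed by qib_fast_reg_mr() above would be filled by a kernel ULP
 * roughly like this before posting the work request:
 *
 *	struct ib_send_wr fr_wr = { 0 };
 *
 *	fr_wr.opcode = IB_WR_FAST_REG_MR;
 *	fr_wr.wr.fast_reg.rkey = rkey;
 *	fr_wr.wr.fast_reg.iova_start = iova;
 *	fr_wr.wr.fast_reg.length = nr_pages * PAGE_SIZE;
 *	fr_wr.wr.fast_reg.page_shift = PAGE_SHIFT;
 *	fr_wr.wr.fast_reg.page_list = page_list;
 *	fr_wr.wr.fast_reg.page_list_len = nr_pages;
 *	fr_wr.wr.fast_reg.access_flags = IB_ACCESS_LOCAL_WRITE |
 *					 IB_ACCESS_REMOTE_WRITE;
 *	ret = ib_post_send(qp, &fr_wr, &bad_wr);
 *
 * rkey, iova, nr_pages, page_list, qp and bad_wr stand in for values the
 * ULP already owns; the exact access flags depend on the intended RDMA
 * usage.
 */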