2 * Copyright (c) 2004 Topspin Communications. All rights reserved.
3 * Copyright (c) 2005 Mellanox Technologies. All rights reserved.
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34 #include <linux/slab.h>
35 #include <linux/errno.h>
37 #include "mthca_dev.h"
38 #include "mthca_cmd.h"
39 #include "mthca_memfree.h"
42 struct mthca_buddy
*buddy
;
48 * Must be packed because mtt_seg is 64 bits but only aligned to 32 bits.
50 struct mthca_mpt_entry
{
59 __be32 window_count_limit
;
61 __be32 mtt_sz
; /* Arbel only */
63 } __attribute__((packed
));
65 #define MTHCA_MPT_FLAG_SW_OWNS (0xfUL << 28)
66 #define MTHCA_MPT_FLAG_MIO (1 << 17)
67 #define MTHCA_MPT_FLAG_BIND_ENABLE (1 << 15)
68 #define MTHCA_MPT_FLAG_PHYSICAL (1 << 9)
69 #define MTHCA_MPT_FLAG_REGION (1 << 8)
71 #define MTHCA_MTT_FLAG_PRESENT 1
73 #define MTHCA_MPT_STATUS_SW 0xF0
74 #define MTHCA_MPT_STATUS_HW 0x00
76 #define SINAI_FMR_KEY_INC 0x1000000
79 * Buddy allocator for MTT segments (currently not very efficient
80 * since it doesn't keep a free list and just searches linearly
81 * through the bitmaps)
84 static u32
mthca_buddy_alloc(struct mthca_buddy
*buddy
, int order
)
90 spin_lock(&buddy
->lock
);
92 for (o
= order
; o
<= buddy
->max_order
; ++o
)
93 if (buddy
->num_free
[o
]) {
94 m
= 1 << (buddy
->max_order
- o
);
95 seg
= find_first_bit(buddy
->bits
[o
], m
);
100 spin_unlock(&buddy
->lock
);
104 clear_bit(seg
, buddy
->bits
[o
]);
105 --buddy
->num_free
[o
];
110 set_bit(seg
^ 1, buddy
->bits
[o
]);
111 ++buddy
->num_free
[o
];
114 spin_unlock(&buddy
->lock
);
121 static void mthca_buddy_free(struct mthca_buddy
*buddy
, u32 seg
, int order
)
125 spin_lock(&buddy
->lock
);
127 while (test_bit(seg
^ 1, buddy
->bits
[order
])) {
128 clear_bit(seg
^ 1, buddy
->bits
[order
]);
129 --buddy
->num_free
[order
];
134 set_bit(seg
, buddy
->bits
[order
]);
135 ++buddy
->num_free
[order
];
137 spin_unlock(&buddy
->lock
);
140 static int mthca_buddy_init(struct mthca_buddy
*buddy
, int max_order
)
144 buddy
->max_order
= max_order
;
145 spin_lock_init(&buddy
->lock
);
147 buddy
->bits
= kzalloc((buddy
->max_order
+ 1) * sizeof (long *),
149 buddy
->num_free
= kzalloc((buddy
->max_order
+ 1) * sizeof (int *),
151 if (!buddy
->bits
|| !buddy
->num_free
)
154 for (i
= 0; i
<= buddy
->max_order
; ++i
) {
155 s
= BITS_TO_LONGS(1 << (buddy
->max_order
- i
));
156 buddy
->bits
[i
] = kmalloc(s
* sizeof (long), GFP_KERNEL
);
159 bitmap_zero(buddy
->bits
[i
],
160 1 << (buddy
->max_order
- i
));
163 set_bit(0, buddy
->bits
[buddy
->max_order
]);
164 buddy
->num_free
[buddy
->max_order
] = 1;
169 for (i
= 0; i
<= buddy
->max_order
; ++i
)
170 kfree(buddy
->bits
[i
]);
174 kfree(buddy
->num_free
);
179 static void mthca_buddy_cleanup(struct mthca_buddy
*buddy
)
183 for (i
= 0; i
<= buddy
->max_order
; ++i
)
184 kfree(buddy
->bits
[i
]);
187 kfree(buddy
->num_free
);
190 static u32
mthca_alloc_mtt_range(struct mthca_dev
*dev
, int order
,
191 struct mthca_buddy
*buddy
)
193 u32 seg
= mthca_buddy_alloc(buddy
, order
);
198 if (mthca_is_memfree(dev
))
199 if (mthca_table_get_range(dev
, dev
->mr_table
.mtt_table
, seg
,
200 seg
+ (1 << order
) - 1)) {
201 mthca_buddy_free(buddy
, seg
, order
);
208 static struct mthca_mtt
*__mthca_alloc_mtt(struct mthca_dev
*dev
, int size
,
209 struct mthca_buddy
*buddy
)
211 struct mthca_mtt
*mtt
;
215 return ERR_PTR(-EINVAL
);
217 mtt
= kmalloc(sizeof *mtt
, GFP_KERNEL
);
219 return ERR_PTR(-ENOMEM
);
223 for (i
= MTHCA_MTT_SEG_SIZE
/ 8; i
< size
; i
<<= 1)
226 mtt
->first_seg
= mthca_alloc_mtt_range(dev
, mtt
->order
, buddy
);
227 if (mtt
->first_seg
== -1) {
229 return ERR_PTR(-ENOMEM
);
235 struct mthca_mtt
*mthca_alloc_mtt(struct mthca_dev
*dev
, int size
)
237 return __mthca_alloc_mtt(dev
, size
, &dev
->mr_table
.mtt_buddy
);
240 void mthca_free_mtt(struct mthca_dev
*dev
, struct mthca_mtt
*mtt
)
245 mthca_buddy_free(mtt
->buddy
, mtt
->first_seg
, mtt
->order
);
247 mthca_table_put_range(dev
, dev
->mr_table
.mtt_table
,
249 mtt
->first_seg
+ (1 << mtt
->order
) - 1);
254 static int __mthca_write_mtt(struct mthca_dev
*dev
, struct mthca_mtt
*mtt
,
255 int start_index
, u64
*buffer_list
, int list_len
)
257 struct mthca_mailbox
*mailbox
;
263 mailbox
= mthca_alloc_mailbox(dev
, GFP_KERNEL
);
265 return PTR_ERR(mailbox
);
266 mtt_entry
= mailbox
->buf
;
268 while (list_len
> 0) {
269 mtt_entry
[0] = cpu_to_be64(dev
->mr_table
.mtt_base
+
270 mtt
->first_seg
* MTHCA_MTT_SEG_SIZE
+
273 for (i
= 0; i
< list_len
&& i
< MTHCA_MAILBOX_SIZE
/ 8 - 2; ++i
)
274 mtt_entry
[i
+ 2] = cpu_to_be64(buffer_list
[i
] |
275 MTHCA_MTT_FLAG_PRESENT
);
278 * If we have an odd number of entries to write, add
279 * one more dummy entry for firmware efficiency.
282 mtt_entry
[i
+ 2] = 0;
284 err
= mthca_WRITE_MTT(dev
, mailbox
, (i
+ 1) & ~1, &status
);
286 mthca_warn(dev
, "WRITE_MTT failed (%d)\n", err
);
290 mthca_warn(dev
, "WRITE_MTT returned status 0x%02x\n",
302 mthca_free_mailbox(dev
, mailbox
);
306 int mthca_write_mtt_size(struct mthca_dev
*dev
)
308 if (dev
->mr_table
.fmr_mtt_buddy
!= &dev
->mr_table
.mtt_buddy
||
309 !(dev
->mthca_flags
& MTHCA_FLAG_FMR
))
311 * Be friendly to WRITE_MTT command
312 * and leave two empty slots for the
313 * index and reserved fields of the
316 return PAGE_SIZE
/ sizeof (u64
) - 2;
318 /* For Arbel, all MTTs must fit in the same page. */
319 return mthca_is_memfree(dev
) ? (PAGE_SIZE
/ sizeof (u64
)) : 0x7ffffff;
322 static void mthca_tavor_write_mtt_seg(struct mthca_dev
*dev
,
323 struct mthca_mtt
*mtt
, int start_index
,
324 u64
*buffer_list
, int list_len
)
329 mtts
= dev
->mr_table
.tavor_fmr
.mtt_base
+ mtt
->first_seg
* MTHCA_MTT_SEG_SIZE
+
330 start_index
* sizeof (u64
);
331 for (i
= 0; i
< list_len
; ++i
)
332 mthca_write64_raw(cpu_to_be64(buffer_list
[i
] | MTHCA_MTT_FLAG_PRESENT
),
336 static void mthca_arbel_write_mtt_seg(struct mthca_dev
*dev
,
337 struct mthca_mtt
*mtt
, int start_index
,
338 u64
*buffer_list
, int list_len
)
341 dma_addr_t dma_handle
;
343 int s
= start_index
* sizeof (u64
);
345 /* For Arbel, all MTTs must fit in the same page. */
346 BUG_ON(s
/ PAGE_SIZE
!= (s
+ list_len
* sizeof(u64
) - 1) / PAGE_SIZE
);
347 /* Require full segments */
348 BUG_ON(s
% MTHCA_MTT_SEG_SIZE
);
350 mtts
= mthca_table_find(dev
->mr_table
.mtt_table
, mtt
->first_seg
+
351 s
/ MTHCA_MTT_SEG_SIZE
, &dma_handle
);
355 for (i
= 0; i
< list_len
; ++i
)
356 mtts
[i
] = cpu_to_be64(buffer_list
[i
] | MTHCA_MTT_FLAG_PRESENT
);
358 dma_sync_single(&dev
->pdev
->dev
, dma_handle
, list_len
* sizeof (u64
), DMA_TO_DEVICE
);
361 int mthca_write_mtt(struct mthca_dev
*dev
, struct mthca_mtt
*mtt
,
362 int start_index
, u64
*buffer_list
, int list_len
)
364 int size
= mthca_write_mtt_size(dev
);
367 if (dev
->mr_table
.fmr_mtt_buddy
!= &dev
->mr_table
.mtt_buddy
||
368 !(dev
->mthca_flags
& MTHCA_FLAG_FMR
))
369 return __mthca_write_mtt(dev
, mtt
, start_index
, buffer_list
, list_len
);
371 while (list_len
> 0) {
372 chunk
= min(size
, list_len
);
373 if (mthca_is_memfree(dev
))
374 mthca_arbel_write_mtt_seg(dev
, mtt
, start_index
,
377 mthca_tavor_write_mtt_seg(dev
, mtt
, start_index
,
381 start_index
+= chunk
;
382 buffer_list
+= chunk
;
388 static inline u32
tavor_hw_index_to_key(u32 ind
)
393 static inline u32
tavor_key_to_hw_index(u32 key
)
398 static inline u32
arbel_hw_index_to_key(u32 ind
)
400 return (ind
>> 24) | (ind
<< 8);
403 static inline u32
arbel_key_to_hw_index(u32 key
)
405 return (key
<< 24) | (key
>> 8);
408 static inline u32
hw_index_to_key(struct mthca_dev
*dev
, u32 ind
)
410 if (mthca_is_memfree(dev
))
411 return arbel_hw_index_to_key(ind
);
413 return tavor_hw_index_to_key(ind
);
416 static inline u32
key_to_hw_index(struct mthca_dev
*dev
, u32 key
)
418 if (mthca_is_memfree(dev
))
419 return arbel_key_to_hw_index(key
);
421 return tavor_key_to_hw_index(key
);
424 static inline u32
adjust_key(struct mthca_dev
*dev
, u32 key
)
426 if (dev
->mthca_flags
& MTHCA_FLAG_SINAI_OPT
)
427 return ((key
<< 20) & 0x800000) | (key
& 0x7fffff);
432 int mthca_mr_alloc(struct mthca_dev
*dev
, u32 pd
, int buffer_size_shift
,
433 u64 iova
, u64 total_size
, u32 access
, struct mthca_mr
*mr
)
435 struct mthca_mailbox
*mailbox
;
436 struct mthca_mpt_entry
*mpt_entry
;
442 WARN_ON(buffer_size_shift
>= 32);
444 key
= mthca_alloc(&dev
->mr_table
.mpt_alloc
);
447 key
= adjust_key(dev
, key
);
448 mr
->ibmr
.rkey
= mr
->ibmr
.lkey
= hw_index_to_key(dev
, key
);
450 if (mthca_is_memfree(dev
)) {
451 err
= mthca_table_get(dev
, dev
->mr_table
.mpt_table
, key
);
453 goto err_out_mpt_free
;
456 mailbox
= mthca_alloc_mailbox(dev
, GFP_KERNEL
);
457 if (IS_ERR(mailbox
)) {
458 err
= PTR_ERR(mailbox
);
461 mpt_entry
= mailbox
->buf
;
463 mpt_entry
->flags
= cpu_to_be32(MTHCA_MPT_FLAG_SW_OWNS
|
465 MTHCA_MPT_FLAG_REGION
|
468 mpt_entry
->flags
|= cpu_to_be32(MTHCA_MPT_FLAG_PHYSICAL
);
470 mpt_entry
->page_size
= cpu_to_be32(buffer_size_shift
- 12);
471 mpt_entry
->key
= cpu_to_be32(key
);
472 mpt_entry
->pd
= cpu_to_be32(pd
);
473 mpt_entry
->start
= cpu_to_be64(iova
);
474 mpt_entry
->length
= cpu_to_be64(total_size
);
476 memset(&mpt_entry
->lkey
, 0,
477 sizeof *mpt_entry
- offsetof(struct mthca_mpt_entry
, lkey
));
481 cpu_to_be64(dev
->mr_table
.mtt_base
+
482 mr
->mtt
->first_seg
* MTHCA_MTT_SEG_SIZE
);
485 mthca_dbg(dev
, "Dumping MPT entry %08x:\n", mr
->ibmr
.lkey
);
486 for (i
= 0; i
< sizeof (struct mthca_mpt_entry
) / 4; ++i
) {
488 printk("[%02x] ", i
* 4);
489 printk(" %08x", be32_to_cpu(((__be32
*) mpt_entry
)[i
]));
490 if ((i
+ 1) % 4 == 0)
495 err
= mthca_SW2HW_MPT(dev
, mailbox
,
496 key
& (dev
->limits
.num_mpts
- 1),
499 mthca_warn(dev
, "SW2HW_MPT failed (%d)\n", err
);
500 goto err_out_mailbox
;
502 mthca_warn(dev
, "SW2HW_MPT returned status 0x%02x\n",
505 goto err_out_mailbox
;
508 mthca_free_mailbox(dev
, mailbox
);
512 mthca_free_mailbox(dev
, mailbox
);
515 mthca_table_put(dev
, dev
->mr_table
.mpt_table
, key
);
518 mthca_free(&dev
->mr_table
.mpt_alloc
, key
);
522 int mthca_mr_alloc_notrans(struct mthca_dev
*dev
, u32 pd
,
523 u32 access
, struct mthca_mr
*mr
)
526 return mthca_mr_alloc(dev
, pd
, 12, 0, ~0ULL, access
, mr
);
529 int mthca_mr_alloc_phys(struct mthca_dev
*dev
, u32 pd
,
530 u64
*buffer_list
, int buffer_size_shift
,
531 int list_len
, u64 iova
, u64 total_size
,
532 u32 access
, struct mthca_mr
*mr
)
536 mr
->mtt
= mthca_alloc_mtt(dev
, list_len
);
538 return PTR_ERR(mr
->mtt
);
540 err
= mthca_write_mtt(dev
, mr
->mtt
, 0, buffer_list
, list_len
);
542 mthca_free_mtt(dev
, mr
->mtt
);
546 err
= mthca_mr_alloc(dev
, pd
, buffer_size_shift
, iova
,
547 total_size
, access
, mr
);
549 mthca_free_mtt(dev
, mr
->mtt
);
555 static void mthca_free_region(struct mthca_dev
*dev
, u32 lkey
)
557 mthca_table_put(dev
, dev
->mr_table
.mpt_table
,
558 key_to_hw_index(dev
, lkey
));
560 mthca_free(&dev
->mr_table
.mpt_alloc
, key_to_hw_index(dev
, lkey
));
563 void mthca_free_mr(struct mthca_dev
*dev
, struct mthca_mr
*mr
)
568 err
= mthca_HW2SW_MPT(dev
, NULL
,
569 key_to_hw_index(dev
, mr
->ibmr
.lkey
) &
570 (dev
->limits
.num_mpts
- 1),
573 mthca_warn(dev
, "HW2SW_MPT failed (%d)\n", err
);
575 mthca_warn(dev
, "HW2SW_MPT returned status 0x%02x\n",
578 mthca_free_region(dev
, mr
->ibmr
.lkey
);
579 mthca_free_mtt(dev
, mr
->mtt
);
582 int mthca_fmr_alloc(struct mthca_dev
*dev
, u32 pd
,
583 u32 access
, struct mthca_fmr
*mr
)
585 struct mthca_mpt_entry
*mpt_entry
;
586 struct mthca_mailbox
*mailbox
;
590 int list_len
= mr
->attr
.max_pages
;
594 if (mr
->attr
.page_shift
< 12 || mr
->attr
.page_shift
>= 32)
597 /* For Arbel, all MTTs must fit in the same page. */
598 if (mthca_is_memfree(dev
) &&
599 mr
->attr
.max_pages
* sizeof *mr
->mem
.arbel
.mtts
> PAGE_SIZE
)
604 key
= mthca_alloc(&dev
->mr_table
.mpt_alloc
);
607 key
= adjust_key(dev
, key
);
609 idx
= key
& (dev
->limits
.num_mpts
- 1);
610 mr
->ibmr
.rkey
= mr
->ibmr
.lkey
= hw_index_to_key(dev
, key
);
612 if (mthca_is_memfree(dev
)) {
613 err
= mthca_table_get(dev
, dev
->mr_table
.mpt_table
, key
);
615 goto err_out_mpt_free
;
617 mr
->mem
.arbel
.mpt
= mthca_table_find(dev
->mr_table
.mpt_table
, key
, NULL
);
618 BUG_ON(!mr
->mem
.arbel
.mpt
);
620 mr
->mem
.tavor
.mpt
= dev
->mr_table
.tavor_fmr
.mpt_base
+
621 sizeof *(mr
->mem
.tavor
.mpt
) * idx
;
623 mr
->mtt
= __mthca_alloc_mtt(dev
, list_len
, dev
->mr_table
.fmr_mtt_buddy
);
624 if (IS_ERR(mr
->mtt
)) {
625 err
= PTR_ERR(mr
->mtt
);
629 mtt_seg
= mr
->mtt
->first_seg
* MTHCA_MTT_SEG_SIZE
;
631 if (mthca_is_memfree(dev
)) {
632 mr
->mem
.arbel
.mtts
= mthca_table_find(dev
->mr_table
.mtt_table
,
634 &mr
->mem
.arbel
.dma_handle
);
635 BUG_ON(!mr
->mem
.arbel
.mtts
);
637 mr
->mem
.tavor
.mtts
= dev
->mr_table
.tavor_fmr
.mtt_base
+ mtt_seg
;
639 mailbox
= mthca_alloc_mailbox(dev
, GFP_KERNEL
);
640 if (IS_ERR(mailbox
)) {
641 err
= PTR_ERR(mailbox
);
642 goto err_out_free_mtt
;
645 mpt_entry
= mailbox
->buf
;
647 mpt_entry
->flags
= cpu_to_be32(MTHCA_MPT_FLAG_SW_OWNS
|
649 MTHCA_MPT_FLAG_REGION
|
652 mpt_entry
->page_size
= cpu_to_be32(mr
->attr
.page_shift
- 12);
653 mpt_entry
->key
= cpu_to_be32(key
);
654 mpt_entry
->pd
= cpu_to_be32(pd
);
655 memset(&mpt_entry
->start
, 0,
656 sizeof *mpt_entry
- offsetof(struct mthca_mpt_entry
, start
));
657 mpt_entry
->mtt_seg
= cpu_to_be64(dev
->mr_table
.mtt_base
+ mtt_seg
);
660 mthca_dbg(dev
, "Dumping MPT entry %08x:\n", mr
->ibmr
.lkey
);
661 for (i
= 0; i
< sizeof (struct mthca_mpt_entry
) / 4; ++i
) {
663 printk("[%02x] ", i
* 4);
664 printk(" %08x", be32_to_cpu(((__be32
*) mpt_entry
)[i
]));
665 if ((i
+ 1) % 4 == 0)
670 err
= mthca_SW2HW_MPT(dev
, mailbox
,
671 key
& (dev
->limits
.num_mpts
- 1),
674 mthca_warn(dev
, "SW2HW_MPT failed (%d)\n", err
);
675 goto err_out_mailbox_free
;
678 mthca_warn(dev
, "SW2HW_MPT returned status 0x%02x\n",
681 goto err_out_mailbox_free
;
684 mthca_free_mailbox(dev
, mailbox
);
687 err_out_mailbox_free
:
688 mthca_free_mailbox(dev
, mailbox
);
691 mthca_free_mtt(dev
, mr
->mtt
);
694 mthca_table_put(dev
, dev
->mr_table
.mpt_table
, key
);
697 mthca_free(&dev
->mr_table
.mpt_alloc
, key
);
701 int mthca_free_fmr(struct mthca_dev
*dev
, struct mthca_fmr
*fmr
)
706 mthca_free_region(dev
, fmr
->ibmr
.lkey
);
707 mthca_free_mtt(dev
, fmr
->mtt
);
712 static inline int mthca_check_fmr(struct mthca_fmr
*fmr
, u64
*page_list
,
713 int list_len
, u64 iova
)
717 if (list_len
> fmr
->attr
.max_pages
)
720 page_mask
= (1 << fmr
->attr
.page_shift
) - 1;
722 /* We are getting page lists, so va must be page aligned. */
723 if (iova
& page_mask
)
726 /* Trust the user not to pass misaligned data in page_list */
728 for (i
= 0; i
< list_len
; ++i
) {
729 if (page_list
[i
] & ~page_mask
)
733 if (fmr
->maps
>= fmr
->attr
.max_maps
)
740 int mthca_tavor_map_phys_fmr(struct ib_fmr
*ibfmr
, u64
*page_list
,
741 int list_len
, u64 iova
)
743 struct mthca_fmr
*fmr
= to_mfmr(ibfmr
);
744 struct mthca_dev
*dev
= to_mdev(ibfmr
->device
);
745 struct mthca_mpt_entry mpt_entry
;
749 err
= mthca_check_fmr(fmr
, page_list
, list_len
, iova
);
755 key
= tavor_key_to_hw_index(fmr
->ibmr
.lkey
);
756 key
+= dev
->limits
.num_mpts
;
757 fmr
->ibmr
.lkey
= fmr
->ibmr
.rkey
= tavor_hw_index_to_key(key
);
759 writeb(MTHCA_MPT_STATUS_SW
, fmr
->mem
.tavor
.mpt
);
761 for (i
= 0; i
< list_len
; ++i
) {
762 __be64 mtt_entry
= cpu_to_be64(page_list
[i
] |
763 MTHCA_MTT_FLAG_PRESENT
);
764 mthca_write64_raw(mtt_entry
, fmr
->mem
.tavor
.mtts
+ i
);
767 mpt_entry
.lkey
= cpu_to_be32(key
);
768 mpt_entry
.length
= cpu_to_be64(list_len
* (1ull << fmr
->attr
.page_shift
));
769 mpt_entry
.start
= cpu_to_be64(iova
);
771 __raw_writel((__force u32
) mpt_entry
.lkey
, &fmr
->mem
.tavor
.mpt
->key
);
772 memcpy_toio(&fmr
->mem
.tavor
.mpt
->start
, &mpt_entry
.start
,
773 offsetof(struct mthca_mpt_entry
, window_count
) -
774 offsetof(struct mthca_mpt_entry
, start
));
776 writeb(MTHCA_MPT_STATUS_HW
, fmr
->mem
.tavor
.mpt
);
781 int mthca_arbel_map_phys_fmr(struct ib_fmr
*ibfmr
, u64
*page_list
,
782 int list_len
, u64 iova
)
784 struct mthca_fmr
*fmr
= to_mfmr(ibfmr
);
785 struct mthca_dev
*dev
= to_mdev(ibfmr
->device
);
789 err
= mthca_check_fmr(fmr
, page_list
, list_len
, iova
);
795 key
= arbel_key_to_hw_index(fmr
->ibmr
.lkey
);
796 if (dev
->mthca_flags
& MTHCA_FLAG_SINAI_OPT
)
797 key
+= SINAI_FMR_KEY_INC
;
799 key
+= dev
->limits
.num_mpts
;
800 fmr
->ibmr
.lkey
= fmr
->ibmr
.rkey
= arbel_hw_index_to_key(key
);
802 *(u8
*) fmr
->mem
.arbel
.mpt
= MTHCA_MPT_STATUS_SW
;
806 for (i
= 0; i
< list_len
; ++i
)
807 fmr
->mem
.arbel
.mtts
[i
] = cpu_to_be64(page_list
[i
] |
808 MTHCA_MTT_FLAG_PRESENT
);
810 dma_sync_single(&dev
->pdev
->dev
, fmr
->mem
.arbel
.dma_handle
,
811 list_len
* sizeof(u64
), DMA_TO_DEVICE
);
813 fmr
->mem
.arbel
.mpt
->key
= cpu_to_be32(key
);
814 fmr
->mem
.arbel
.mpt
->lkey
= cpu_to_be32(key
);
815 fmr
->mem
.arbel
.mpt
->length
= cpu_to_be64(list_len
* (1ull << fmr
->attr
.page_shift
));
816 fmr
->mem
.arbel
.mpt
->start
= cpu_to_be64(iova
);
820 *(u8
*) fmr
->mem
.arbel
.mpt
= MTHCA_MPT_STATUS_HW
;
827 void mthca_tavor_fmr_unmap(struct mthca_dev
*dev
, struct mthca_fmr
*fmr
)
834 writeb(MTHCA_MPT_STATUS_SW
, fmr
->mem
.tavor
.mpt
);
837 void mthca_arbel_fmr_unmap(struct mthca_dev
*dev
, struct mthca_fmr
*fmr
)
844 *(u8
*) fmr
->mem
.arbel
.mpt
= MTHCA_MPT_STATUS_SW
;
847 int mthca_init_mr_table(struct mthca_dev
*dev
)
850 int mpts
, mtts
, err
, i
;
852 err
= mthca_alloc_init(&dev
->mr_table
.mpt_alloc
,
853 dev
->limits
.num_mpts
,
854 ~0, dev
->limits
.reserved_mrws
);
858 if (!mthca_is_memfree(dev
) &&
859 (dev
->mthca_flags
& MTHCA_FLAG_DDR_HIDDEN
))
860 dev
->limits
.fmr_reserved_mtts
= 0;
862 dev
->mthca_flags
|= MTHCA_FLAG_FMR
;
864 if (dev
->mthca_flags
& MTHCA_FLAG_SINAI_OPT
)
865 mthca_dbg(dev
, "Memory key throughput optimization activated.\n");
867 err
= mthca_buddy_init(&dev
->mr_table
.mtt_buddy
,
868 fls(dev
->limits
.num_mtt_segs
- 1));
873 dev
->mr_table
.tavor_fmr
.mpt_base
= NULL
;
874 dev
->mr_table
.tavor_fmr
.mtt_base
= NULL
;
876 if (dev
->limits
.fmr_reserved_mtts
) {
877 i
= fls(dev
->limits
.fmr_reserved_mtts
- 1);
880 mthca_warn(dev
, "Unable to reserve 2^31 FMR MTTs.\n");
884 mpts
= mtts
= 1 << i
;
886 mtts
= dev
->limits
.num_mtt_segs
;
887 mpts
= dev
->limits
.num_mpts
;
890 if (!mthca_is_memfree(dev
) &&
891 (dev
->mthca_flags
& MTHCA_FLAG_FMR
)) {
893 addr
= pci_resource_start(dev
->pdev
, 4) +
894 ((pci_resource_len(dev
->pdev
, 4) - 1) &
895 dev
->mr_table
.mpt_base
);
897 dev
->mr_table
.tavor_fmr
.mpt_base
=
898 ioremap(addr
, mpts
* sizeof(struct mthca_mpt_entry
));
900 if (!dev
->mr_table
.tavor_fmr
.mpt_base
) {
901 mthca_warn(dev
, "MPT ioremap for FMR failed.\n");
906 addr
= pci_resource_start(dev
->pdev
, 4) +
907 ((pci_resource_len(dev
->pdev
, 4) - 1) &
908 dev
->mr_table
.mtt_base
);
910 dev
->mr_table
.tavor_fmr
.mtt_base
=
911 ioremap(addr
, mtts
* MTHCA_MTT_SEG_SIZE
);
912 if (!dev
->mr_table
.tavor_fmr
.mtt_base
) {
913 mthca_warn(dev
, "MTT ioremap for FMR failed.\n");
919 if (dev
->limits
.fmr_reserved_mtts
) {
920 err
= mthca_buddy_init(&dev
->mr_table
.tavor_fmr
.mtt_buddy
, fls(mtts
- 1));
922 goto err_fmr_mtt_buddy
;
924 /* Prevent regular MRs from using FMR keys */
925 err
= mthca_buddy_alloc(&dev
->mr_table
.mtt_buddy
, fls(mtts
- 1));
927 goto err_reserve_fmr
;
929 dev
->mr_table
.fmr_mtt_buddy
=
930 &dev
->mr_table
.tavor_fmr
.mtt_buddy
;
932 dev
->mr_table
.fmr_mtt_buddy
= &dev
->mr_table
.mtt_buddy
;
934 /* FMR table is always the first, take reserved MTTs out of there */
935 if (dev
->limits
.reserved_mtts
) {
936 i
= fls(dev
->limits
.reserved_mtts
- 1);
938 if (mthca_alloc_mtt_range(dev
, i
,
939 dev
->mr_table
.fmr_mtt_buddy
) == -1) {
940 mthca_warn(dev
, "MTT table of order %d is too small.\n",
941 dev
->mr_table
.fmr_mtt_buddy
->max_order
);
943 goto err_reserve_mtts
;
951 if (dev
->limits
.fmr_reserved_mtts
)
952 mthca_buddy_cleanup(&dev
->mr_table
.tavor_fmr
.mtt_buddy
);
955 if (dev
->mr_table
.tavor_fmr
.mtt_base
)
956 iounmap(dev
->mr_table
.tavor_fmr
.mtt_base
);
959 if (dev
->mr_table
.tavor_fmr
.mpt_base
)
960 iounmap(dev
->mr_table
.tavor_fmr
.mpt_base
);
963 mthca_buddy_cleanup(&dev
->mr_table
.mtt_buddy
);
966 mthca_alloc_cleanup(&dev
->mr_table
.mpt_alloc
);
971 void mthca_cleanup_mr_table(struct mthca_dev
*dev
)
973 /* XXX check if any MRs are still allocated? */
974 if (dev
->limits
.fmr_reserved_mtts
)
975 mthca_buddy_cleanup(&dev
->mr_table
.tavor_fmr
.mtt_buddy
);
977 mthca_buddy_cleanup(&dev
->mr_table
.mtt_buddy
);
979 if (dev
->mr_table
.tavor_fmr
.mtt_base
)
980 iounmap(dev
->mr_table
.tavor_fmr
.mtt_base
);
981 if (dev
->mr_table
.tavor_fmr
.mpt_base
)
982 iounmap(dev
->mr_table
.tavor_fmr
.mpt_base
);
984 mthca_alloc_cleanup(&dev
->mr_table
.mpt_alloc
);