2 * Copyright (c) 2004 Topspin Communications. All rights reserved.
3 * Copyright (c) 2005 Mellanox Technologies. All rights reserved.
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34 #include <linux/slab.h>
35 #include <linux/errno.h>
37 #include "mthca_dev.h"
38 #include "mthca_cmd.h"
39 #include "mthca_memfree.h"
42 struct mthca_buddy
*buddy
;
48 * Must be packed because mtt_seg is 64 bits but only aligned to 32 bits.
50 struct mthca_mpt_entry
{
59 __be32 window_count_limit
;
61 __be32 mtt_sz
; /* Arbel only */
63 } __attribute__((packed
));
65 #define MTHCA_MPT_FLAG_SW_OWNS (0xfUL << 28)
66 #define MTHCA_MPT_FLAG_MIO (1 << 17)
67 #define MTHCA_MPT_FLAG_BIND_ENABLE (1 << 15)
68 #define MTHCA_MPT_FLAG_PHYSICAL (1 << 9)
69 #define MTHCA_MPT_FLAG_REGION (1 << 8)
71 #define MTHCA_MTT_FLAG_PRESENT 1
73 #define MTHCA_MPT_STATUS_SW 0xF0
74 #define MTHCA_MPT_STATUS_HW 0x00
76 #define SINAI_FMR_KEY_INC 0x1000000
79 * Buddy allocator for MTT segments (currently not very efficient
80 * since it doesn't keep a free list and just searches linearly
81 * through the bitmaps)
84 static u32
mthca_buddy_alloc(struct mthca_buddy
*buddy
, int order
)
90 spin_lock(&buddy
->lock
);
92 for (o
= order
; o
<= buddy
->max_order
; ++o
)
93 if (buddy
->num_free
[o
]) {
94 m
= 1 << (buddy
->max_order
- o
);
95 seg
= find_first_bit(buddy
->bits
[o
], m
);
100 spin_unlock(&buddy
->lock
);
104 clear_bit(seg
, buddy
->bits
[o
]);
105 --buddy
->num_free
[o
];
110 set_bit(seg
^ 1, buddy
->bits
[o
]);
111 ++buddy
->num_free
[o
];
114 spin_unlock(&buddy
->lock
);
121 static void mthca_buddy_free(struct mthca_buddy
*buddy
, u32 seg
, int order
)
125 spin_lock(&buddy
->lock
);
127 while (test_bit(seg
^ 1, buddy
->bits
[order
])) {
128 clear_bit(seg
^ 1, buddy
->bits
[order
]);
129 --buddy
->num_free
[order
];
134 set_bit(seg
, buddy
->bits
[order
]);
135 ++buddy
->num_free
[order
];
137 spin_unlock(&buddy
->lock
);
140 static int mthca_buddy_init(struct mthca_buddy
*buddy
, int max_order
)
144 buddy
->max_order
= max_order
;
145 spin_lock_init(&buddy
->lock
);
147 buddy
->bits
= kzalloc((buddy
->max_order
+ 1) * sizeof (long *),
149 buddy
->num_free
= kzalloc((buddy
->max_order
+ 1) * sizeof (int *),
151 if (!buddy
->bits
|| !buddy
->num_free
)
154 for (i
= 0; i
<= buddy
->max_order
; ++i
) {
155 s
= BITS_TO_LONGS(1 << (buddy
->max_order
- i
));
156 buddy
->bits
[i
] = kmalloc(s
* sizeof (long), GFP_KERNEL
);
159 bitmap_zero(buddy
->bits
[i
],
160 1 << (buddy
->max_order
- i
));
163 set_bit(0, buddy
->bits
[buddy
->max_order
]);
164 buddy
->num_free
[buddy
->max_order
] = 1;
169 for (i
= 0; i
<= buddy
->max_order
; ++i
)
170 kfree(buddy
->bits
[i
]);
174 kfree(buddy
->num_free
);
179 static void mthca_buddy_cleanup(struct mthca_buddy
*buddy
)
183 for (i
= 0; i
<= buddy
->max_order
; ++i
)
184 kfree(buddy
->bits
[i
]);
187 kfree(buddy
->num_free
);
190 static u32
mthca_alloc_mtt_range(struct mthca_dev
*dev
, int order
,
191 struct mthca_buddy
*buddy
)
193 u32 seg
= mthca_buddy_alloc(buddy
, order
);
198 if (mthca_is_memfree(dev
))
199 if (mthca_table_get_range(dev
, dev
->mr_table
.mtt_table
, seg
,
200 seg
+ (1 << order
) - 1)) {
201 mthca_buddy_free(buddy
, seg
, order
);
208 static struct mthca_mtt
*__mthca_alloc_mtt(struct mthca_dev
*dev
, int size
,
209 struct mthca_buddy
*buddy
)
211 struct mthca_mtt
*mtt
;
215 return ERR_PTR(-EINVAL
);
217 mtt
= kmalloc(sizeof *mtt
, GFP_KERNEL
);
219 return ERR_PTR(-ENOMEM
);
223 for (i
= dev
->limits
.mtt_seg_size
/ 8; i
< size
; i
<<= 1)
226 mtt
->first_seg
= mthca_alloc_mtt_range(dev
, mtt
->order
, buddy
);
227 if (mtt
->first_seg
== -1) {
229 return ERR_PTR(-ENOMEM
);
235 struct mthca_mtt
*mthca_alloc_mtt(struct mthca_dev
*dev
, int size
)
237 return __mthca_alloc_mtt(dev
, size
, &dev
->mr_table
.mtt_buddy
);
240 void mthca_free_mtt(struct mthca_dev
*dev
, struct mthca_mtt
*mtt
)
245 mthca_buddy_free(mtt
->buddy
, mtt
->first_seg
, mtt
->order
);
247 mthca_table_put_range(dev
, dev
->mr_table
.mtt_table
,
249 mtt
->first_seg
+ (1 << mtt
->order
) - 1);
254 static int __mthca_write_mtt(struct mthca_dev
*dev
, struct mthca_mtt
*mtt
,
255 int start_index
, u64
*buffer_list
, int list_len
)
257 struct mthca_mailbox
*mailbox
;
263 mailbox
= mthca_alloc_mailbox(dev
, GFP_KERNEL
);
265 return PTR_ERR(mailbox
);
266 mtt_entry
= mailbox
->buf
;
268 while (list_len
> 0) {
269 mtt_entry
[0] = cpu_to_be64(dev
->mr_table
.mtt_base
+
270 mtt
->first_seg
* dev
->limits
.mtt_seg_size
+
273 for (i
= 0; i
< list_len
&& i
< MTHCA_MAILBOX_SIZE
/ 8 - 2; ++i
)
274 mtt_entry
[i
+ 2] = cpu_to_be64(buffer_list
[i
] |
275 MTHCA_MTT_FLAG_PRESENT
);
278 * If we have an odd number of entries to write, add
279 * one more dummy entry for firmware efficiency.
282 mtt_entry
[i
+ 2] = 0;
284 err
= mthca_WRITE_MTT(dev
, mailbox
, (i
+ 1) & ~1, &status
);
286 mthca_warn(dev
, "WRITE_MTT failed (%d)\n", err
);
290 mthca_warn(dev
, "WRITE_MTT returned status 0x%02x\n",
302 mthca_free_mailbox(dev
, mailbox
);
306 int mthca_write_mtt_size(struct mthca_dev
*dev
)
308 if (dev
->mr_table
.fmr_mtt_buddy
!= &dev
->mr_table
.mtt_buddy
||
309 !(dev
->mthca_flags
& MTHCA_FLAG_FMR
))
311 * Be friendly to WRITE_MTT command
312 * and leave two empty slots for the
313 * index and reserved fields of the
316 return PAGE_SIZE
/ sizeof (u64
) - 2;
318 /* For Arbel, all MTTs must fit in the same page. */
319 return mthca_is_memfree(dev
) ? (PAGE_SIZE
/ sizeof (u64
)) : 0x7ffffff;
322 static void mthca_tavor_write_mtt_seg(struct mthca_dev
*dev
,
323 struct mthca_mtt
*mtt
, int start_index
,
324 u64
*buffer_list
, int list_len
)
329 mtts
= dev
->mr_table
.tavor_fmr
.mtt_base
+ mtt
->first_seg
* dev
->limits
.mtt_seg_size
+
330 start_index
* sizeof (u64
);
331 for (i
= 0; i
< list_len
; ++i
)
332 mthca_write64_raw(cpu_to_be64(buffer_list
[i
] | MTHCA_MTT_FLAG_PRESENT
),
336 static void mthca_arbel_write_mtt_seg(struct mthca_dev
*dev
,
337 struct mthca_mtt
*mtt
, int start_index
,
338 u64
*buffer_list
, int list_len
)
341 dma_addr_t dma_handle
;
343 int s
= start_index
* sizeof (u64
);
345 /* For Arbel, all MTTs must fit in the same page. */
346 BUG_ON(s
/ PAGE_SIZE
!= (s
+ list_len
* sizeof(u64
) - 1) / PAGE_SIZE
);
347 /* Require full segments */
348 BUG_ON(s
% dev
->limits
.mtt_seg_size
);
350 mtts
= mthca_table_find(dev
->mr_table
.mtt_table
, mtt
->first_seg
+
351 s
/ dev
->limits
.mtt_seg_size
, &dma_handle
);
355 dma_sync_single_for_cpu(&dev
->pdev
->dev
, dma_handle
,
356 list_len
* sizeof (u64
), DMA_TO_DEVICE
);
358 for (i
= 0; i
< list_len
; ++i
)
359 mtts
[i
] = cpu_to_be64(buffer_list
[i
] | MTHCA_MTT_FLAG_PRESENT
);
361 dma_sync_single_for_device(&dev
->pdev
->dev
, dma_handle
,
362 list_len
* sizeof (u64
), DMA_TO_DEVICE
);
365 int mthca_write_mtt(struct mthca_dev
*dev
, struct mthca_mtt
*mtt
,
366 int start_index
, u64
*buffer_list
, int list_len
)
368 int size
= mthca_write_mtt_size(dev
);
371 if (dev
->mr_table
.fmr_mtt_buddy
!= &dev
->mr_table
.mtt_buddy
||
372 !(dev
->mthca_flags
& MTHCA_FLAG_FMR
))
373 return __mthca_write_mtt(dev
, mtt
, start_index
, buffer_list
, list_len
);
375 while (list_len
> 0) {
376 chunk
= min(size
, list_len
);
377 if (mthca_is_memfree(dev
))
378 mthca_arbel_write_mtt_seg(dev
, mtt
, start_index
,
381 mthca_tavor_write_mtt_seg(dev
, mtt
, start_index
,
385 start_index
+= chunk
;
386 buffer_list
+= chunk
;
392 static inline u32
tavor_hw_index_to_key(u32 ind
)
397 static inline u32
tavor_key_to_hw_index(u32 key
)
402 static inline u32
arbel_hw_index_to_key(u32 ind
)
404 return (ind
>> 24) | (ind
<< 8);
407 static inline u32
arbel_key_to_hw_index(u32 key
)
409 return (key
<< 24) | (key
>> 8);
412 static inline u32
hw_index_to_key(struct mthca_dev
*dev
, u32 ind
)
414 if (mthca_is_memfree(dev
))
415 return arbel_hw_index_to_key(ind
);
417 return tavor_hw_index_to_key(ind
);
420 static inline u32
key_to_hw_index(struct mthca_dev
*dev
, u32 key
)
422 if (mthca_is_memfree(dev
))
423 return arbel_key_to_hw_index(key
);
425 return tavor_key_to_hw_index(key
);
428 static inline u32
adjust_key(struct mthca_dev
*dev
, u32 key
)
430 if (dev
->mthca_flags
& MTHCA_FLAG_SINAI_OPT
)
431 return ((key
<< 20) & 0x800000) | (key
& 0x7fffff);
436 int mthca_mr_alloc(struct mthca_dev
*dev
, u32 pd
, int buffer_size_shift
,
437 u64 iova
, u64 total_size
, u32 access
, struct mthca_mr
*mr
)
439 struct mthca_mailbox
*mailbox
;
440 struct mthca_mpt_entry
*mpt_entry
;
446 WARN_ON(buffer_size_shift
>= 32);
448 key
= mthca_alloc(&dev
->mr_table
.mpt_alloc
);
451 key
= adjust_key(dev
, key
);
452 mr
->ibmr
.rkey
= mr
->ibmr
.lkey
= hw_index_to_key(dev
, key
);
454 if (mthca_is_memfree(dev
)) {
455 err
= mthca_table_get(dev
, dev
->mr_table
.mpt_table
, key
);
457 goto err_out_mpt_free
;
460 mailbox
= mthca_alloc_mailbox(dev
, GFP_KERNEL
);
461 if (IS_ERR(mailbox
)) {
462 err
= PTR_ERR(mailbox
);
465 mpt_entry
= mailbox
->buf
;
467 mpt_entry
->flags
= cpu_to_be32(MTHCA_MPT_FLAG_SW_OWNS
|
469 MTHCA_MPT_FLAG_REGION
|
472 mpt_entry
->flags
|= cpu_to_be32(MTHCA_MPT_FLAG_PHYSICAL
);
474 mpt_entry
->page_size
= cpu_to_be32(buffer_size_shift
- 12);
475 mpt_entry
->key
= cpu_to_be32(key
);
476 mpt_entry
->pd
= cpu_to_be32(pd
);
477 mpt_entry
->start
= cpu_to_be64(iova
);
478 mpt_entry
->length
= cpu_to_be64(total_size
);
480 memset(&mpt_entry
->lkey
, 0,
481 sizeof *mpt_entry
- offsetof(struct mthca_mpt_entry
, lkey
));
485 cpu_to_be64(dev
->mr_table
.mtt_base
+
486 mr
->mtt
->first_seg
* dev
->limits
.mtt_seg_size
);
489 mthca_dbg(dev
, "Dumping MPT entry %08x:\n", mr
->ibmr
.lkey
);
490 for (i
= 0; i
< sizeof (struct mthca_mpt_entry
) / 4; ++i
) {
492 printk("[%02x] ", i
* 4);
493 printk(" %08x", be32_to_cpu(((__be32
*) mpt_entry
)[i
]));
494 if ((i
+ 1) % 4 == 0)
499 err
= mthca_SW2HW_MPT(dev
, mailbox
,
500 key
& (dev
->limits
.num_mpts
- 1),
503 mthca_warn(dev
, "SW2HW_MPT failed (%d)\n", err
);
504 goto err_out_mailbox
;
506 mthca_warn(dev
, "SW2HW_MPT returned status 0x%02x\n",
509 goto err_out_mailbox
;
512 mthca_free_mailbox(dev
, mailbox
);
516 mthca_free_mailbox(dev
, mailbox
);
519 mthca_table_put(dev
, dev
->mr_table
.mpt_table
, key
);
522 mthca_free(&dev
->mr_table
.mpt_alloc
, key
);
526 int mthca_mr_alloc_notrans(struct mthca_dev
*dev
, u32 pd
,
527 u32 access
, struct mthca_mr
*mr
)
530 return mthca_mr_alloc(dev
, pd
, 12, 0, ~0ULL, access
, mr
);
533 int mthca_mr_alloc_phys(struct mthca_dev
*dev
, u32 pd
,
534 u64
*buffer_list
, int buffer_size_shift
,
535 int list_len
, u64 iova
, u64 total_size
,
536 u32 access
, struct mthca_mr
*mr
)
540 mr
->mtt
= mthca_alloc_mtt(dev
, list_len
);
542 return PTR_ERR(mr
->mtt
);
544 err
= mthca_write_mtt(dev
, mr
->mtt
, 0, buffer_list
, list_len
);
546 mthca_free_mtt(dev
, mr
->mtt
);
550 err
= mthca_mr_alloc(dev
, pd
, buffer_size_shift
, iova
,
551 total_size
, access
, mr
);
553 mthca_free_mtt(dev
, mr
->mtt
);
559 static void mthca_free_region(struct mthca_dev
*dev
, u32 lkey
)
561 mthca_table_put(dev
, dev
->mr_table
.mpt_table
,
562 key_to_hw_index(dev
, lkey
));
564 mthca_free(&dev
->mr_table
.mpt_alloc
, key_to_hw_index(dev
, lkey
));
567 void mthca_free_mr(struct mthca_dev
*dev
, struct mthca_mr
*mr
)
572 err
= mthca_HW2SW_MPT(dev
, NULL
,
573 key_to_hw_index(dev
, mr
->ibmr
.lkey
) &
574 (dev
->limits
.num_mpts
- 1),
577 mthca_warn(dev
, "HW2SW_MPT failed (%d)\n", err
);
579 mthca_warn(dev
, "HW2SW_MPT returned status 0x%02x\n",
582 mthca_free_region(dev
, mr
->ibmr
.lkey
);
583 mthca_free_mtt(dev
, mr
->mtt
);
586 int mthca_fmr_alloc(struct mthca_dev
*dev
, u32 pd
,
587 u32 access
, struct mthca_fmr
*mr
)
589 struct mthca_mpt_entry
*mpt_entry
;
590 struct mthca_mailbox
*mailbox
;
594 int list_len
= mr
->attr
.max_pages
;
598 if (mr
->attr
.page_shift
< 12 || mr
->attr
.page_shift
>= 32)
601 /* For Arbel, all MTTs must fit in the same page. */
602 if (mthca_is_memfree(dev
) &&
603 mr
->attr
.max_pages
* sizeof *mr
->mem
.arbel
.mtts
> PAGE_SIZE
)
608 key
= mthca_alloc(&dev
->mr_table
.mpt_alloc
);
611 key
= adjust_key(dev
, key
);
613 idx
= key
& (dev
->limits
.num_mpts
- 1);
614 mr
->ibmr
.rkey
= mr
->ibmr
.lkey
= hw_index_to_key(dev
, key
);
616 if (mthca_is_memfree(dev
)) {
617 err
= mthca_table_get(dev
, dev
->mr_table
.mpt_table
, key
);
619 goto err_out_mpt_free
;
621 mr
->mem
.arbel
.mpt
= mthca_table_find(dev
->mr_table
.mpt_table
, key
, NULL
);
622 BUG_ON(!mr
->mem
.arbel
.mpt
);
624 mr
->mem
.tavor
.mpt
= dev
->mr_table
.tavor_fmr
.mpt_base
+
625 sizeof *(mr
->mem
.tavor
.mpt
) * idx
;
627 mr
->mtt
= __mthca_alloc_mtt(dev
, list_len
, dev
->mr_table
.fmr_mtt_buddy
);
628 if (IS_ERR(mr
->mtt
)) {
629 err
= PTR_ERR(mr
->mtt
);
633 mtt_seg
= mr
->mtt
->first_seg
* dev
->limits
.mtt_seg_size
;
635 if (mthca_is_memfree(dev
)) {
636 mr
->mem
.arbel
.mtts
= mthca_table_find(dev
->mr_table
.mtt_table
,
638 &mr
->mem
.arbel
.dma_handle
);
639 BUG_ON(!mr
->mem
.arbel
.mtts
);
641 mr
->mem
.tavor
.mtts
= dev
->mr_table
.tavor_fmr
.mtt_base
+ mtt_seg
;
643 mailbox
= mthca_alloc_mailbox(dev
, GFP_KERNEL
);
644 if (IS_ERR(mailbox
)) {
645 err
= PTR_ERR(mailbox
);
646 goto err_out_free_mtt
;
649 mpt_entry
= mailbox
->buf
;
651 mpt_entry
->flags
= cpu_to_be32(MTHCA_MPT_FLAG_SW_OWNS
|
653 MTHCA_MPT_FLAG_REGION
|
656 mpt_entry
->page_size
= cpu_to_be32(mr
->attr
.page_shift
- 12);
657 mpt_entry
->key
= cpu_to_be32(key
);
658 mpt_entry
->pd
= cpu_to_be32(pd
);
659 memset(&mpt_entry
->start
, 0,
660 sizeof *mpt_entry
- offsetof(struct mthca_mpt_entry
, start
));
661 mpt_entry
->mtt_seg
= cpu_to_be64(dev
->mr_table
.mtt_base
+ mtt_seg
);
664 mthca_dbg(dev
, "Dumping MPT entry %08x:\n", mr
->ibmr
.lkey
);
665 for (i
= 0; i
< sizeof (struct mthca_mpt_entry
) / 4; ++i
) {
667 printk("[%02x] ", i
* 4);
668 printk(" %08x", be32_to_cpu(((__be32
*) mpt_entry
)[i
]));
669 if ((i
+ 1) % 4 == 0)
674 err
= mthca_SW2HW_MPT(dev
, mailbox
,
675 key
& (dev
->limits
.num_mpts
- 1),
678 mthca_warn(dev
, "SW2HW_MPT failed (%d)\n", err
);
679 goto err_out_mailbox_free
;
682 mthca_warn(dev
, "SW2HW_MPT returned status 0x%02x\n",
685 goto err_out_mailbox_free
;
688 mthca_free_mailbox(dev
, mailbox
);
691 err_out_mailbox_free
:
692 mthca_free_mailbox(dev
, mailbox
);
695 mthca_free_mtt(dev
, mr
->mtt
);
698 mthca_table_put(dev
, dev
->mr_table
.mpt_table
, key
);
701 mthca_free(&dev
->mr_table
.mpt_alloc
, key
);
705 int mthca_free_fmr(struct mthca_dev
*dev
, struct mthca_fmr
*fmr
)
710 mthca_free_region(dev
, fmr
->ibmr
.lkey
);
711 mthca_free_mtt(dev
, fmr
->mtt
);
716 static inline int mthca_check_fmr(struct mthca_fmr
*fmr
, u64
*page_list
,
717 int list_len
, u64 iova
)
721 if (list_len
> fmr
->attr
.max_pages
)
724 page_mask
= (1 << fmr
->attr
.page_shift
) - 1;
726 /* We are getting page lists, so va must be page aligned. */
727 if (iova
& page_mask
)
730 /* Trust the user not to pass misaligned data in page_list */
732 for (i
= 0; i
< list_len
; ++i
) {
733 if (page_list
[i
] & ~page_mask
)
737 if (fmr
->maps
>= fmr
->attr
.max_maps
)
744 int mthca_tavor_map_phys_fmr(struct ib_fmr
*ibfmr
, u64
*page_list
,
745 int list_len
, u64 iova
)
747 struct mthca_fmr
*fmr
= to_mfmr(ibfmr
);
748 struct mthca_dev
*dev
= to_mdev(ibfmr
->device
);
749 struct mthca_mpt_entry mpt_entry
;
753 err
= mthca_check_fmr(fmr
, page_list
, list_len
, iova
);
759 key
= tavor_key_to_hw_index(fmr
->ibmr
.lkey
);
760 key
+= dev
->limits
.num_mpts
;
761 fmr
->ibmr
.lkey
= fmr
->ibmr
.rkey
= tavor_hw_index_to_key(key
);
763 writeb(MTHCA_MPT_STATUS_SW
, fmr
->mem
.tavor
.mpt
);
765 for (i
= 0; i
< list_len
; ++i
) {
766 __be64 mtt_entry
= cpu_to_be64(page_list
[i
] |
767 MTHCA_MTT_FLAG_PRESENT
);
768 mthca_write64_raw(mtt_entry
, fmr
->mem
.tavor
.mtts
+ i
);
771 mpt_entry
.lkey
= cpu_to_be32(key
);
772 mpt_entry
.length
= cpu_to_be64(list_len
* (1ull << fmr
->attr
.page_shift
));
773 mpt_entry
.start
= cpu_to_be64(iova
);
775 __raw_writel((__force u32
) mpt_entry
.lkey
, &fmr
->mem
.tavor
.mpt
->key
);
776 memcpy_toio(&fmr
->mem
.tavor
.mpt
->start
, &mpt_entry
.start
,
777 offsetof(struct mthca_mpt_entry
, window_count
) -
778 offsetof(struct mthca_mpt_entry
, start
));
780 writeb(MTHCA_MPT_STATUS_HW
, fmr
->mem
.tavor
.mpt
);
785 int mthca_arbel_map_phys_fmr(struct ib_fmr
*ibfmr
, u64
*page_list
,
786 int list_len
, u64 iova
)
788 struct mthca_fmr
*fmr
= to_mfmr(ibfmr
);
789 struct mthca_dev
*dev
= to_mdev(ibfmr
->device
);
793 err
= mthca_check_fmr(fmr
, page_list
, list_len
, iova
);
799 key
= arbel_key_to_hw_index(fmr
->ibmr
.lkey
);
800 if (dev
->mthca_flags
& MTHCA_FLAG_SINAI_OPT
)
801 key
+= SINAI_FMR_KEY_INC
;
803 key
+= dev
->limits
.num_mpts
;
804 fmr
->ibmr
.lkey
= fmr
->ibmr
.rkey
= arbel_hw_index_to_key(key
);
806 *(u8
*) fmr
->mem
.arbel
.mpt
= MTHCA_MPT_STATUS_SW
;
810 dma_sync_single_for_cpu(&dev
->pdev
->dev
, fmr
->mem
.arbel
.dma_handle
,
811 list_len
* sizeof(u64
), DMA_TO_DEVICE
);
813 for (i
= 0; i
< list_len
; ++i
)
814 fmr
->mem
.arbel
.mtts
[i
] = cpu_to_be64(page_list
[i
] |
815 MTHCA_MTT_FLAG_PRESENT
);
817 dma_sync_single_for_device(&dev
->pdev
->dev
, fmr
->mem
.arbel
.dma_handle
,
818 list_len
* sizeof(u64
), DMA_TO_DEVICE
);
820 fmr
->mem
.arbel
.mpt
->key
= cpu_to_be32(key
);
821 fmr
->mem
.arbel
.mpt
->lkey
= cpu_to_be32(key
);
822 fmr
->mem
.arbel
.mpt
->length
= cpu_to_be64(list_len
* (1ull << fmr
->attr
.page_shift
));
823 fmr
->mem
.arbel
.mpt
->start
= cpu_to_be64(iova
);
827 *(u8
*) fmr
->mem
.arbel
.mpt
= MTHCA_MPT_STATUS_HW
;
834 void mthca_tavor_fmr_unmap(struct mthca_dev
*dev
, struct mthca_fmr
*fmr
)
841 writeb(MTHCA_MPT_STATUS_SW
, fmr
->mem
.tavor
.mpt
);
844 void mthca_arbel_fmr_unmap(struct mthca_dev
*dev
, struct mthca_fmr
*fmr
)
851 *(u8
*) fmr
->mem
.arbel
.mpt
= MTHCA_MPT_STATUS_SW
;
854 int mthca_init_mr_table(struct mthca_dev
*dev
)
857 int mpts
, mtts
, err
, i
;
859 err
= mthca_alloc_init(&dev
->mr_table
.mpt_alloc
,
860 dev
->limits
.num_mpts
,
861 ~0, dev
->limits
.reserved_mrws
);
865 if (!mthca_is_memfree(dev
) &&
866 (dev
->mthca_flags
& MTHCA_FLAG_DDR_HIDDEN
))
867 dev
->limits
.fmr_reserved_mtts
= 0;
869 dev
->mthca_flags
|= MTHCA_FLAG_FMR
;
871 if (dev
->mthca_flags
& MTHCA_FLAG_SINAI_OPT
)
872 mthca_dbg(dev
, "Memory key throughput optimization activated.\n");
874 err
= mthca_buddy_init(&dev
->mr_table
.mtt_buddy
,
875 fls(dev
->limits
.num_mtt_segs
- 1));
880 dev
->mr_table
.tavor_fmr
.mpt_base
= NULL
;
881 dev
->mr_table
.tavor_fmr
.mtt_base
= NULL
;
883 if (dev
->limits
.fmr_reserved_mtts
) {
884 i
= fls(dev
->limits
.fmr_reserved_mtts
- 1);
887 mthca_warn(dev
, "Unable to reserve 2^31 FMR MTTs.\n");
891 mpts
= mtts
= 1 << i
;
893 mtts
= dev
->limits
.num_mtt_segs
;
894 mpts
= dev
->limits
.num_mpts
;
897 if (!mthca_is_memfree(dev
) &&
898 (dev
->mthca_flags
& MTHCA_FLAG_FMR
)) {
900 addr
= pci_resource_start(dev
->pdev
, 4) +
901 ((pci_resource_len(dev
->pdev
, 4) - 1) &
902 dev
->mr_table
.mpt_base
);
904 dev
->mr_table
.tavor_fmr
.mpt_base
=
905 ioremap(addr
, mpts
* sizeof(struct mthca_mpt_entry
));
907 if (!dev
->mr_table
.tavor_fmr
.mpt_base
) {
908 mthca_warn(dev
, "MPT ioremap for FMR failed.\n");
913 addr
= pci_resource_start(dev
->pdev
, 4) +
914 ((pci_resource_len(dev
->pdev
, 4) - 1) &
915 dev
->mr_table
.mtt_base
);
917 dev
->mr_table
.tavor_fmr
.mtt_base
=
918 ioremap(addr
, mtts
* dev
->limits
.mtt_seg_size
);
919 if (!dev
->mr_table
.tavor_fmr
.mtt_base
) {
920 mthca_warn(dev
, "MTT ioremap for FMR failed.\n");
926 if (dev
->limits
.fmr_reserved_mtts
) {
927 err
= mthca_buddy_init(&dev
->mr_table
.tavor_fmr
.mtt_buddy
, fls(mtts
- 1));
929 goto err_fmr_mtt_buddy
;
931 /* Prevent regular MRs from using FMR keys */
932 err
= mthca_buddy_alloc(&dev
->mr_table
.mtt_buddy
, fls(mtts
- 1));
934 goto err_reserve_fmr
;
936 dev
->mr_table
.fmr_mtt_buddy
=
937 &dev
->mr_table
.tavor_fmr
.mtt_buddy
;
939 dev
->mr_table
.fmr_mtt_buddy
= &dev
->mr_table
.mtt_buddy
;
941 /* FMR table is always the first, take reserved MTTs out of there */
942 if (dev
->limits
.reserved_mtts
) {
943 i
= fls(dev
->limits
.reserved_mtts
- 1);
945 if (mthca_alloc_mtt_range(dev
, i
,
946 dev
->mr_table
.fmr_mtt_buddy
) == -1) {
947 mthca_warn(dev
, "MTT table of order %d is too small.\n",
948 dev
->mr_table
.fmr_mtt_buddy
->max_order
);
950 goto err_reserve_mtts
;
958 if (dev
->limits
.fmr_reserved_mtts
)
959 mthca_buddy_cleanup(&dev
->mr_table
.tavor_fmr
.mtt_buddy
);
962 if (dev
->mr_table
.tavor_fmr
.mtt_base
)
963 iounmap(dev
->mr_table
.tavor_fmr
.mtt_base
);
966 if (dev
->mr_table
.tavor_fmr
.mpt_base
)
967 iounmap(dev
->mr_table
.tavor_fmr
.mpt_base
);
970 mthca_buddy_cleanup(&dev
->mr_table
.mtt_buddy
);
973 mthca_alloc_cleanup(&dev
->mr_table
.mpt_alloc
);
978 void mthca_cleanup_mr_table(struct mthca_dev
*dev
)
980 /* XXX check if any MRs are still allocated? */
981 if (dev
->limits
.fmr_reserved_mtts
)
982 mthca_buddy_cleanup(&dev
->mr_table
.tavor_fmr
.mtt_buddy
);
984 mthca_buddy_cleanup(&dev
->mr_table
.mtt_buddy
);
986 if (dev
->mr_table
.tavor_fmr
.mtt_base
)
987 iounmap(dev
->mr_table
.tavor_fmr
.mtt_base
);
988 if (dev
->mr_table
.tavor_fmr
.mpt_base
)
989 iounmap(dev
->mr_table
.tavor_fmr
.mpt_base
);
991 mthca_alloc_cleanup(&dev
->mr_table
.mpt_alloc
);