2 * Linux MegaRAID driver for SAS based RAID controllers
4 * Copyright (c) 2009-2011 LSI Corporation.
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version 2
9 * of the License, or (at your option) any later version.
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 * FILE: megaraid_sas_fp.c
22 * Authors: LSI Corporation
27 * Send feedback to: <megaraidlinux@lsi.com>
29 * Mail to: LSI Corporation, 1621 Barber Lane, Milpitas, CA 95035
33 #include <linux/kernel.h>
34 #include <linux/types.h>
35 #include <linux/pci.h>
36 #include <linux/list.h>
37 #include <linux/moduleparam.h>
38 #include <linux/module.h>
39 #include <linux/spinlock.h>
40 #include <linux/interrupt.h>
41 #include <linux/delay.h>
42 #include <linux/uio.h>
43 #include <linux/uaccess.h>
45 #include <linux/compat.h>
46 #include <linux/blkdev.h>
47 #include <linux/poll.h>
49 #include <scsi/scsi.h>
50 #include <scsi/scsi_cmnd.h>
51 #include <scsi/scsi_device.h>
52 #include <scsi/scsi_host.h>
54 #include "megaraid_sas_fusion.h"
55 #include "megaraid_sas.h"
56 #include <asm/div64.h>
58 #define ABS_DIFF(a, b) (((a) > (b)) ? ((a) - (b)) : ((b) - (a)))
59 #define MR_LD_STATE_OPTIMAL 3
65 mr_update_load_balance_params(struct MR_FW_RAID_MAP_ALL
*map
,
66 struct LD_LOAD_BALANCE_INFO
*lbInfo
);
68 u32
mega_mod64(u64 dividend
, u32 divisor
)
74 printk(KERN_ERR
"megasas : DIVISOR is zero, in div fn\n");
76 remainder
= do_div(d
, divisor
);
81 * @param dividend : Dividend
82 * @param divisor : Divisor
86 u64
mega_div64_32(uint64_t dividend
, uint32_t divisor
)
92 printk(KERN_ERR
"megasas : DIVISOR is zero in mod fn\n");
95 remainder
= do_div(d
, divisor
);
100 struct MR_LD_RAID
*MR_LdRaidGet(u32 ld
, struct MR_FW_RAID_MAP_ALL
*map
)
102 return &map
->raidMap
.ldSpanMap
[ld
].ldRaid
;
105 static struct MR_SPAN_BLOCK_INFO
*MR_LdSpanInfoGet(u32 ld
,
106 struct MR_FW_RAID_MAP_ALL
109 return &map
->raidMap
.ldSpanMap
[ld
].spanBlock
[0];
112 static u8
MR_LdDataArmGet(u32 ld
, u32 armIdx
, struct MR_FW_RAID_MAP_ALL
*map
)
114 return map
->raidMap
.ldSpanMap
[ld
].dataArmMap
[armIdx
];
117 static u16
MR_ArPdGet(u32 ar
, u32 arm
, struct MR_FW_RAID_MAP_ALL
*map
)
119 return map
->raidMap
.arMapInfo
[ar
].pd
[arm
];
122 static u16
MR_LdSpanArrayGet(u32 ld
, u32 span
, struct MR_FW_RAID_MAP_ALL
*map
)
124 return map
->raidMap
.ldSpanMap
[ld
].spanBlock
[span
].span
.arrayRef
;
127 static u16
MR_PdDevHandleGet(u32 pd
, struct MR_FW_RAID_MAP_ALL
*map
)
129 return map
->raidMap
.devHndlInfo
[pd
].curDevHdl
;
132 u16
MR_GetLDTgtId(u32 ld
, struct MR_FW_RAID_MAP_ALL
*map
)
134 return map
->raidMap
.ldSpanMap
[ld
].ldRaid
.targetId
;
137 u16
MR_TargetIdToLdGet(u32 ldTgtId
, struct MR_FW_RAID_MAP_ALL
*map
)
139 return map
->raidMap
.ldTgtIdToLd
[ldTgtId
];
142 static struct MR_LD_SPAN
*MR_LdSpanPtrGet(u32 ld
, u32 span
,
143 struct MR_FW_RAID_MAP_ALL
*map
)
145 return &map
->raidMap
.ldSpanMap
[ld
].spanBlock
[span
].span
;
149 * This function will validate Map info data provided by FW
/*
 * MR_ValidateMapInfo() - check the size field of the firmware RAID map.
 *
 * pFwRaidMap->totalSize is compared with
 *   sizeof(struct MR_FW_RAID_MAP) - sizeof(struct MR_LD_SPAN_MAP) +
 *   sizeof(struct MR_LD_SPAN_MAP) * pFwRaidMap->ldCount
 * When the two differ, the computed size, sizeof(struct MR_LD_SPAN_MAP) and
 * totalSize are logged at KERN_ERR level.
 *
 * mr_update_load_balance_params(map, lbInfo) is called further down.
 *
 * NOTE(review): the closing brace of the mismatch branch and the return
 * statements are not present in this listing; confirm against the complete
 * file which u8 values are returned and that the load-balance update only
 * runs when the size check passes.
 */
151 u8
MR_ValidateMapInfo(struct MR_FW_RAID_MAP_ALL
*map
,
152 struct LD_LOAD_BALANCE_INFO
*lbInfo
)
154 struct MR_FW_RAID_MAP
*pFwRaidMap
= &map
->raidMap
;
156 if (pFwRaidMap
->totalSize
!=
157 (sizeof(struct MR_FW_RAID_MAP
) -sizeof(struct MR_LD_SPAN_MAP
) +
158 (sizeof(struct MR_LD_SPAN_MAP
) *pFwRaidMap
->ldCount
))) {
159 printk(KERN_ERR
"megasas: map info structure size 0x%x is not matching with ld count\n",
160 (unsigned int)((sizeof(struct MR_FW_RAID_MAP
) -
161 sizeof(struct MR_LD_SPAN_MAP
)) +
162 (sizeof(struct MR_LD_SPAN_MAP
) *
163 pFwRaidMap
->ldCount
)));
164 printk(KERN_ERR
"megasas: span map %x, pFwRaidMap->totalSize "
165 ": %x\n", (unsigned int)sizeof(struct MR_LD_SPAN_MAP
),
166 pFwRaidMap
->totalSize
);
170 mr_update_load_balance_params(map
, lbInfo
);
/*
 * MR_GetSpanBlock() - search the spans of logical drive @ld for @row.
 *
 * Walks raid->spanDepth span-block entries, starting at the one returned by
 * MR_LdSpanInfoGet(ld, map), and for each of them the first
 * block_span_info.noElements quad entries.
 *
 * A quad with diff == 0 is tested for separately before the range check
 * (the statement under that test is not visible here). A quad matches when
 *   quad->logStart <= row <= quad->logEnd
 * and (row - quad->logStart) is a multiple of quad->diff. On a match with a
 * non-NULL @span_blk, a block value is derived from (row - quad->logStart)
 * and quad->offsetInSpan.
 *
 * NOTE(review): many lines of this function are absent from this listing:
 * local declarations, the diff == 0 handling, the full block computation,
 * every use of @div_error and all return statements. Confirm those details
 * against the complete file before relying on this summary.
 */
175 u32
MR_GetSpanBlock(u32 ld
, u64 row
, u64
*span_blk
,
176 struct MR_FW_RAID_MAP_ALL
*map
, int *div_error
)
178 struct MR_SPAN_BLOCK_INFO
*pSpanBlock
= MR_LdSpanInfoGet(ld
, map
);
179 struct MR_QUAD_ELEMENT
*quad
;
180 struct MR_LD_RAID
*raid
= MR_LdRaidGet(ld
, map
);
183 for (span
= 0; span
< raid
->spanDepth
; span
++, pSpanBlock
++) {
185 for (j
= 0; j
< pSpanBlock
->block_span_info
.noElements
; j
++) {
186 quad
= &pSpanBlock
->block_span_info
.quad
[j
];
188 if (quad
->diff
== 0) {
192 if (quad
->logStart
<= row
&& row
<= quad
->logEnd
&&
193 (mega_mod64(row
-quad
->logStart
, quad
->diff
)) == 0) {
194 if (span_blk
!= NULL
) {
198 (row
-quad
->logStart
),
202 blk
= (blk
+ quad
->offsetInSpan
) <<
214 ******************************************************************************
216 * This routine calculates the arm, span and block for the specified stripe and
217 * reference in stripe.
221 * ld - Logical drive number
222 * stripRow - Stripe number
223 * stripRef - Reference in stripe
228 * block - Absolute Block number in the physical disk
/*
 * MR_GetPhyParams() - resolve one strip of logical drive @ld to a device
 * handle and a block number, as far as the statements visible here show.
 *
 *  - row is stripRow / raid->rowDataSize (mega_div64_32()).
 *  - For raid->level == 6 the arm is derived from the Q drive position:
 *    logArm = stripRow % rowDataSize, rowMod = row % rowSize,
 *    armQ = rowSize - 1 - rowMod, arm = armQ + 1 + logArm, and rowSize is
 *    subtracted once when arm >= rowSize. rowSize is tested for zero before
 *    the modulo.
 *  - On the other visible path raid->modFactor is tested for zero and the
 *    physical arm comes from MR_LdDataArmGet().
 *  - With raid->spanDepth == 1, *pdBlock starts as row << stripeShift;
 *    MR_GetSpanBlock() is also called to obtain the span, passing @pdBlock.
 *  - The pd is found through MR_LdSpanArrayGet() and MR_ArPdGet(). A pd
 *    other than MR_PD_INVALID yields *pDevHandle = MR_PdDevHandleGet(pd).
 *    The handle is also set to MR_PD_INVALID; for level >= 5 (subject to the
 *    PCI_DEVICE_ID_LSI_INVADER / regTypeReqOnRead test) regLockFlags becomes
 *    REGION_TYPE_EXCLUSIVE, and for level 1 the pd at physArm + 1 is tried.
 *  - stripRef and the span's startBlk are then added to *pdBlock and
 *    pRAID_Context->spanArm is written.
 *
 * NOTE(review): braces, else keywords, local declarations and return
 * statements are absent from this listing, so the nesting of the branches
 * above and the u8 return values must be confirmed against the complete
 * file.
 */
230 u8
MR_GetPhyParams(struct megasas_instance
*instance
, u32 ld
, u64 stripRow
,
231 u16 stripRef
, u64
*pdBlock
, u16
*pDevHandle
,
232 struct RAID_CONTEXT
*pRAID_Context
,
233 struct MR_FW_RAID_MAP_ALL
*map
)
235 struct MR_LD_RAID
*raid
= MR_LdRaidGet(ld
, map
);
242 row
= mega_div64_32(stripRow
, raid
->rowDataSize
);
244 if (raid
->level
== 6) {
245 /* logical arm within row */
246 u32 logArm
= mega_mod64(stripRow
, raid
->rowDataSize
);
247 u32 rowMod
, armQ
, arm
;
249 if (raid
->rowSize
== 0)
251 /* get logical row mod */
252 rowMod
= mega_mod64(row
, raid
->rowSize
);
253 armQ
= raid
->rowSize
-1-rowMod
; /* index of Q drive */
254 arm
= armQ
+1+logArm
; /* data always logically follows Q */
255 if (arm
>= raid
->rowSize
) /* handle wrap condition */
256 arm
-= raid
->rowSize
;
259 if (raid
->modFactor
== 0)
261 physArm
= MR_LdDataArmGet(ld
, mega_mod64(stripRow
,
266 if (raid
->spanDepth
== 1) {
268 *pdBlock
= row
<< raid
->stripeShift
;
270 span
= (u8
)MR_GetSpanBlock(ld
, row
, pdBlock
, map
, &error_code
);
275 /* Get the array on which this span is present */
276 arRef
= MR_LdSpanArrayGet(ld
, span
, map
);
277 pd
= MR_ArPdGet(arRef
, physArm
, map
); /* Get the pd */
279 if (pd
!= MR_PD_INVALID
)
280 /* Get dev handle from Pd. */
281 *pDevHandle
= MR_PdDevHandleGet(pd
, map
);
283 *pDevHandle
= MR_PD_INVALID
; /* set dev handle as invalid. */
284 if ((raid
->level
>= 5) &&
285 ((instance
->pdev
->device
!= PCI_DEVICE_ID_LSI_INVADER
) ||
286 (instance
->pdev
->device
== PCI_DEVICE_ID_LSI_INVADER
&&
287 raid
->regTypeReqOnRead
!= REGION_TYPE_UNUSED
)))
288 pRAID_Context
->regLockFlags
= REGION_TYPE_EXCLUSIVE
;
289 else if (raid
->level
== 1) {
290 /* Get alternate Pd. */
291 pd
= MR_ArPdGet(arRef
, physArm
+ 1, map
);
292 if (pd
!= MR_PD_INVALID
)
293 /* Get dev handle from Pd */
294 *pDevHandle
= MR_PdDevHandleGet(pd
, map
);
298 *pdBlock
+= stripRef
+ MR_LdSpanPtrGet(ld
, span
, map
)->startBlk
;
299 pRAID_Context
->spanArm
= (span
<< RAID_CTX_SPANARM_SPAN_SHIFT
) |
305 ******************************************************************************
307 * MR_BuildRaidContext function
309 * This function will initiate command processing. The start/end row and strip
310 * information is calculated then the lock is acquired.
311 * This function will return 0 if region lock was acquired OR return num strips
/*
 * MR_BuildRaidContext() - fill in the RAID context for one I/O request.
 *
 * Steps visible in this listing:
 *  - ldStartBlock, numBlocks, ldTgtId and isRead are read from @io_info;
 *    the logical drive and its MR_LD_RAID come from MR_TargetIdToLdGet()
 *    and MR_LdRaidGet().
 *  - Start/end strip, the offsets inside those strips, and start/end row
 *    are derived from raid->stripeShift and raid->rowDataSize.
 *    rowDataSize is tested for zero before the divisions.
 *  - io_info->fpOkForIo is decided from raid->capability (fpCapable, then
 *    fpReadCapable / fpWriteCapable and the "across stripe" flags when more
 *    than one strip is involved), or set to FALSE.
 *  - regStart / regSize describe the region to lock; they are narrowed for
 *    single-strip I/O and built up per row for multi-strip I/O.
 *  - timeoutValue, regLockFlags, VirtualDiskTgtId, regLockRowLBA,
 *    regLockLength and configSeqNum are stored in @pRAID_Context.
 *  - When fpOkForIo is set, MR_GetPhyParams() is called for the start strip
 *    and fpOkForIo is cleared if the device handle is MR_PD_INVALID.
 *    MR_GetPhyParams() is also called in a loop over all strips.
 *
 * NOTE(review): num_strips and numRows are stored through (u8) casts, so
 * larger counts are truncated here; confirm callers bound the I/O size.
 * NOTE(review): the return type line, local declarations, else keywords,
 * braces and return statements are absent from this listing; confirm branch
 * nesting and return values against the complete file.
 */
314 MR_BuildRaidContext(struct megasas_instance
*instance
,
315 struct IO_REQUEST_INFO
*io_info
,
316 struct RAID_CONTEXT
*pRAID_Context
,
317 struct MR_FW_RAID_MAP_ALL
*map
)
319 struct MR_LD_RAID
*raid
;
320 u32 ld
, stripSize
, stripe_mask
;
321 u64 endLba
, endStrip
, endRow
, start_row
, start_strip
;
324 u8 num_strips
, numRows
;
325 u16 ref_in_start_stripe
, ref_in_end_stripe
;
327 u32 numBlocks
, ldTgtId
;
331 ldStartBlock
= io_info
->ldStartBlock
;
332 numBlocks
= io_info
->numBlocks
;
333 ldTgtId
= io_info
->ldTgtId
;
334 isRead
= io_info
->isRead
;
336 ld
= MR_TargetIdToLdGet(ldTgtId
, map
);
337 raid
= MR_LdRaidGet(ld
, map
);
339 stripSize
= 1 << raid
->stripeShift
;
340 stripe_mask
= stripSize
-1;
342 * calculate starting row and stripe, and number of strips and rows
344 start_strip
= ldStartBlock
>> raid
->stripeShift
;
345 ref_in_start_stripe
= (u16
)(ldStartBlock
& stripe_mask
);
346 endLba
= ldStartBlock
+ numBlocks
- 1;
347 ref_in_end_stripe
= (u16
)(endLba
& stripe_mask
);
348 endStrip
= endLba
>> raid
->stripeShift
;
349 num_strips
= (u8
)(endStrip
- start_strip
+ 1); /* End strip */
350 if (raid
->rowDataSize
== 0)
352 start_row
= mega_div64_32(start_strip
, raid
->rowDataSize
);
353 endRow
= mega_div64_32(endStrip
, raid
->rowDataSize
);
354 numRows
= (u8
)(endRow
- start_row
+ 1);
357 * calculate region info.
360 /* assume region is at the start of the first row */
361 regStart
= start_row
<< raid
->stripeShift
;
362 /* assume this IO needs the full row - we'll adjust if not true */
365 /* Check if we can send this I/O via FastPath */
366 if (raid
->capability
.fpCapable
) {
368 io_info
->fpOkForIo
= (raid
->capability
.fpReadCapable
&&
369 ((num_strips
== 1) ||
371 fpReadAcrossStripe
));
373 io_info
->fpOkForIo
= (raid
->capability
.fpWriteCapable
&&
374 ((num_strips
== 1) ||
376 fpWriteAcrossStripe
));
378 io_info
->fpOkForIo
= FALSE
;
381 /* single-strip IOs can always lock only the data needed */
382 if (num_strips
== 1) {
383 regStart
+= ref_in_start_stripe
;
386 /* multi-strip IOs always need the full stripe locked */
388 if (start_strip
== (start_row
+ 1) * raid
->rowDataSize
- 1) {
389 /* If the start strip is the last in the start row */
390 regStart
+= ref_in_start_stripe
;
391 regSize
= stripSize
- ref_in_start_stripe
;
392 /* initialize count to sectors from startref to end
397 /* Add complete rows in the middle of the transfer */
398 regSize
+= (numRows
-2) << raid
->stripeShift
;
400 /* if IO ends within first strip of last row */
401 if (endStrip
== endRow
*raid
->rowDataSize
)
402 regSize
+= ref_in_end_stripe
+1;
404 regSize
+= stripSize
;
407 pRAID_Context
->timeoutValue
= map
->raidMap
.fpPdIoTimeoutSec
;
408 if (instance
->pdev
->device
== PCI_DEVICE_ID_LSI_INVADER
)
409 pRAID_Context
->regLockFlags
= (isRead
) ?
410 raid
->regTypeReqOnRead
: raid
->regTypeReqOnWrite
;
412 pRAID_Context
->regLockFlags
= (isRead
) ?
413 REGION_TYPE_SHARED_READ
: raid
->regTypeReqOnWrite
;
414 pRAID_Context
->VirtualDiskTgtId
= raid
->targetId
;
415 pRAID_Context
->regLockRowLBA
= regStart
;
416 pRAID_Context
->regLockLength
= regSize
;
417 pRAID_Context
->configSeqNum
= raid
->seqNum
;
419 /*Get Phy Params only if FP capable, or else leave it to MR firmware
420 to do the calculation.*/
421 if (io_info
->fpOkForIo
) {
422 retval
= MR_GetPhyParams(instance
, ld
, start_strip
,
425 &io_info
->devHandle
, pRAID_Context
,
427 /* If IO on an invalid Pd, then FP is not possible */
428 if (io_info
->devHandle
== MR_PD_INVALID
)
429 io_info
->fpOkForIo
= FALSE
;
433 for (stripIdx
= 0; stripIdx
< num_strips
; stripIdx
++) {
434 if (!MR_GetPhyParams(instance
, ld
,
435 start_strip
+ stripIdx
,
/*
 * mr_update_load_balance_params() - refresh the per-target load-balance
 * entries in @lbInfo from the firmware RAID map.
 *
 * For every target id below MAX_LOGICAL_DRIVES:
 *  - the id is translated with MR_TargetIdToLdGet(); a result that is
 *    >= MAX_LOGICAL_DRIVES clears lbInfo[id].loadBalanceFlag;
 *  - a logical drive with level == 1, rowSize == 2, spanDepth == 1 and
 *    ldState == MR_LD_STATE_OPTIMAL gets loadBalanceFlag = 1, and the device
 *    handles of arms 0 and 1 of its span-0 array are stored in
 *    raid1DevHandle[0] and raid1DevHandle[1];
 *  - loadBalanceFlag is also cleared at the end of the loop body
 *    (presumably the else branch of the test above - confirm).
 *
 * NOTE(review): the return type line, local declarations, braces and the
 * else / continue keywords are absent from this listing.
 */
447 mr_update_load_balance_params(struct MR_FW_RAID_MAP_ALL
*map
,
448 struct LD_LOAD_BALANCE_INFO
*lbInfo
)
452 struct MR_LD_RAID
*raid
;
454 for (ldCount
= 0; ldCount
< MAX_LOGICAL_DRIVES
; ldCount
++) {
455 ld
= MR_TargetIdToLdGet(ldCount
, map
);
456 if (ld
>= MAX_LOGICAL_DRIVES
) {
457 lbInfo
[ldCount
].loadBalanceFlag
= 0;
461 raid
= MR_LdRaidGet(ld
, map
);
463 /* Two drive Optimal RAID 1 */
464 if ((raid
->level
== 1) && (raid
->rowSize
== 2) &&
465 (raid
->spanDepth
== 1) && raid
->ldState
==
466 MR_LD_STATE_OPTIMAL
) {
469 lbInfo
[ldCount
].loadBalanceFlag
= 1;
471 /* Get the array on which this span is present */
472 arRef
= MR_LdSpanArrayGet(ld
, 0, map
);
475 pd
= MR_ArPdGet(arRef
, 0, map
);
476 /* Get dev handle from Pd */
477 lbInfo
[ldCount
].raid1DevHandle
[0] =
478 MR_PdDevHandleGet(pd
, map
);
480 pd
= MR_ArPdGet(arRef
, 1, map
);
482 /* Get the dev handle from Pd */
483 lbInfo
[ldCount
].raid1DevHandle
[1] =
484 MR_PdDevHandleGet(pd
, map
);
486 lbInfo
[ldCount
].loadBalanceFlag
= 0;
/*
 * megasas_get_best_arm() - choose between arm 0 and arm 1 for an I/O that
 * starts at @block.
 *
 *  - pend0 / pend1 are the current scsi_pending_cmds[] counters of the two
 *    arms (atomic_read()).
 *  - diff0 / diff1 are the absolute distances between @block and each arm's
 *    last_accessed_block[]; the arm with the smaller distance is preferred,
 *    arm 0 winning ties.
 *  - That preference is re-examined when the preferred arm has more than 16
 *    pending commands over the other one, taking @arm into account; the
 *    statement executed in that case is not visible in this listing.
 *  - last_accessed_block[bestArm] is then set to block + count - 1.
 *
 * NOTE(review): the parameter line declaring count, the local declarations,
 * the statement under the pending-count test and the return statement are
 * absent from this listing; confirm them against the complete file.
 */
490 u8
megasas_get_best_arm(struct LD_LOAD_BALANCE_INFO
*lbInfo
, u8 arm
, u64 block
,
497 /* get the pending cmds for the data and mirror arms */
498 pend0
= atomic_read(&lbInfo
->scsi_pending_cmds
[0]);
499 pend1
= atomic_read(&lbInfo
->scsi_pending_cmds
[1]);
501 /* Determine the disk whose head is nearer to the req. block */
502 diff0
= ABS_DIFF(block
, lbInfo
->last_accessed_block
[0]);
503 diff1
= ABS_DIFF(block
, lbInfo
->last_accessed_block
[1]);
504 bestArm
= (diff0
<= diff1
? 0 : 1);
506 if ((bestArm
== arm
&& pend0
> pend1
+ 16) ||
507 (bestArm
!= arm
&& pend1
> pend0
+ 16))
510 /* Update the last accessed block on the correct pd */
511 lbInfo
->last_accessed_block
[bestArm
] = block
+ count
- 1;
516 u16
get_updated_dev_handle(struct LD_LOAD_BALANCE_INFO
*lbInfo
,
517 struct IO_REQUEST_INFO
*io_info
)
522 old_arm
= lbInfo
->raid1DevHandle
[0] == io_info
->devHandle
? 0 : 1;
524 /* get best new arm */
525 arm
= megasas_get_best_arm(lbInfo
, old_arm
, io_info
->ldStartBlock
,
527 devHandle
= lbInfo
->raid1DevHandle
[arm
];
528 atomic_inc(&lbInfo
->scsi_pending_cmds
[arm
]);