1 // SPDX-License-Identifier: GPL-2.0-only
3 * Copyright (C) 2003 Russell King, All Rights Reserved.
4 * Copyright 2006-2007 Pierre Ossman
6 #include <linux/slab.h>
7 #include <linux/module.h>
8 #include <linux/blkdev.h>
9 #include <linux/freezer.h>
10 #include <linux/scatterlist.h>
11 #include <linux/dma-mapping.h>
12 #include <linux/backing-dev.h>
14 #include <linux/mmc/card.h>
15 #include <linux/mmc/host.h>
24 #define MMC_DMA_MAP_MERGE_SEGMENTS 512
26 static inline bool mmc_cqe_dcmd_busy(struct mmc_queue
*mq
)
28 /* Allow only 1 DCMD at a time */
29 return mq
->in_flight
[MMC_ISSUE_DCMD
];
32 void mmc_cqe_check_busy(struct mmc_queue
*mq
)
34 if ((mq
->cqe_busy
& MMC_CQE_DCMD_BUSY
) && !mmc_cqe_dcmd_busy(mq
))
35 mq
->cqe_busy
&= ~MMC_CQE_DCMD_BUSY
;
38 static inline bool mmc_cqe_can_dcmd(struct mmc_host
*host
)
40 return host
->caps2
& MMC_CAP2_CQE_DCMD
;
43 static enum mmc_issue_type
mmc_cqe_issue_type(struct mmc_host
*host
,
46 switch (req_op(req
)) {
50 case REQ_OP_SECURE_ERASE
:
51 case REQ_OP_WRITE_ZEROES
:
52 return MMC_ISSUE_SYNC
;
54 return mmc_cqe_can_dcmd(host
) ? MMC_ISSUE_DCMD
: MMC_ISSUE_SYNC
;
56 return MMC_ISSUE_ASYNC
;
60 enum mmc_issue_type
mmc_issue_type(struct mmc_queue
*mq
, struct request
*req
)
62 struct mmc_host
*host
= mq
->card
->host
;
64 if (host
->cqe_enabled
&& !host
->hsq_enabled
)
65 return mmc_cqe_issue_type(host
, req
);
67 if (req_op(req
) == REQ_OP_READ
|| req_op(req
) == REQ_OP_WRITE
)
68 return MMC_ISSUE_ASYNC
;
70 return MMC_ISSUE_SYNC
;
73 static void __mmc_cqe_recovery_notifier(struct mmc_queue
*mq
)
75 if (!mq
->recovery_needed
) {
76 mq
->recovery_needed
= true;
77 schedule_work(&mq
->recovery_work
);
81 void mmc_cqe_recovery_notifier(struct mmc_request
*mrq
)
83 struct mmc_queue_req
*mqrq
= container_of(mrq
, struct mmc_queue_req
,
85 struct request
*req
= mmc_queue_req_to_req(mqrq
);
86 struct request_queue
*q
= req
->q
;
87 struct mmc_queue
*mq
= q
->queuedata
;
90 spin_lock_irqsave(&mq
->lock
, flags
);
91 __mmc_cqe_recovery_notifier(mq
);
92 spin_unlock_irqrestore(&mq
->lock
, flags
);
95 static enum blk_eh_timer_return
mmc_cqe_timed_out(struct request
*req
)
97 struct mmc_queue_req
*mqrq
= req_to_mmc_queue_req(req
);
98 struct mmc_request
*mrq
= &mqrq
->brq
.mrq
;
99 struct mmc_queue
*mq
= req
->q
->queuedata
;
100 struct mmc_host
*host
= mq
->card
->host
;
101 enum mmc_issue_type issue_type
= mmc_issue_type(mq
, req
);
102 bool recovery_needed
= false;
104 switch (issue_type
) {
105 case MMC_ISSUE_ASYNC
:
107 if (host
->cqe_ops
->cqe_timeout(host
, mrq
, &recovery_needed
)) {
109 mmc_cqe_recovery_notifier(mrq
);
110 return BLK_EH_RESET_TIMER
;
112 /* The request has gone already */
115 /* Timeout is handled by mmc core */
116 return BLK_EH_RESET_TIMER
;
120 static enum blk_eh_timer_return
mmc_mq_timed_out(struct request
*req
)
122 struct request_queue
*q
= req
->q
;
123 struct mmc_queue
*mq
= q
->queuedata
;
124 struct mmc_card
*card
= mq
->card
;
125 struct mmc_host
*host
= card
->host
;
129 spin_lock_irqsave(&mq
->lock
, flags
);
130 ignore_tout
= mq
->recovery_needed
|| !host
->cqe_enabled
|| host
->hsq_enabled
;
131 spin_unlock_irqrestore(&mq
->lock
, flags
);
133 return ignore_tout
? BLK_EH_RESET_TIMER
: mmc_cqe_timed_out(req
);
136 static void mmc_mq_recovery_handler(struct work_struct
*work
)
138 struct mmc_queue
*mq
= container_of(work
, struct mmc_queue
,
140 struct request_queue
*q
= mq
->queue
;
141 struct mmc_host
*host
= mq
->card
->host
;
143 mmc_get_card(mq
->card
, &mq
->ctx
);
145 mq
->in_recovery
= true;
147 if (host
->cqe_enabled
&& !host
->hsq_enabled
)
148 mmc_blk_cqe_recovery(mq
);
150 mmc_blk_mq_recovery(mq
);
152 mq
->in_recovery
= false;
154 spin_lock_irq(&mq
->lock
);
155 mq
->recovery_needed
= false;
156 spin_unlock_irq(&mq
->lock
);
158 if (host
->hsq_enabled
)
159 host
->cqe_ops
->cqe_recovery_finish(host
);
161 mmc_put_card(mq
->card
, &mq
->ctx
);
163 blk_mq_run_hw_queues(q
, true);
166 static struct scatterlist
*mmc_alloc_sg(unsigned short sg_len
, gfp_t gfp
)
168 struct scatterlist
*sg
;
170 sg
= kmalloc_array(sg_len
, sizeof(*sg
), gfp
);
172 sg_init_table(sg
, sg_len
);
177 static void mmc_queue_setup_discard(struct mmc_card
*card
,
178 struct queue_limits
*lim
)
180 unsigned max_discard
;
182 max_discard
= mmc_calc_max_discard(card
);
186 lim
->max_hw_discard_sectors
= max_discard
;
187 if (mmc_can_secure_erase_trim(card
))
188 lim
->max_secure_erase_sectors
= max_discard
;
189 if (mmc_can_trim(card
) && card
->erased_byte
== 0)
190 lim
->max_write_zeroes_sectors
= max_discard
;
192 /* granularity must not be greater than max. discard */
193 if (card
->pref_erase
> max_discard
)
194 lim
->discard_granularity
= SECTOR_SIZE
;
196 lim
->discard_granularity
= card
->pref_erase
<< 9;
199 static unsigned short mmc_get_max_segments(struct mmc_host
*host
)
201 return host
->can_dma_map_merge
? MMC_DMA_MAP_MERGE_SEGMENTS
:
205 static int mmc_mq_init_request(struct blk_mq_tag_set
*set
, struct request
*req
,
206 unsigned int hctx_idx
, unsigned int numa_node
)
208 struct mmc_queue_req
*mq_rq
= req_to_mmc_queue_req(req
);
209 struct mmc_queue
*mq
= set
->driver_data
;
210 struct mmc_card
*card
= mq
->card
;
211 struct mmc_host
*host
= card
->host
;
213 mq_rq
->sg
= mmc_alloc_sg(mmc_get_max_segments(host
), GFP_KERNEL
);
220 static void mmc_mq_exit_request(struct blk_mq_tag_set
*set
, struct request
*req
,
221 unsigned int hctx_idx
)
223 struct mmc_queue_req
*mq_rq
= req_to_mmc_queue_req(req
);
229 static blk_status_t
mmc_mq_queue_rq(struct blk_mq_hw_ctx
*hctx
,
230 const struct blk_mq_queue_data
*bd
)
232 struct request
*req
= bd
->rq
;
233 struct request_queue
*q
= req
->q
;
234 struct mmc_queue
*mq
= q
->queuedata
;
235 struct mmc_card
*card
= mq
->card
;
236 struct mmc_host
*host
= card
->host
;
237 enum mmc_issue_type issue_type
;
238 enum mmc_issued issued
;
239 bool get_card
, cqe_retune_ok
;
242 if (mmc_card_removed(mq
->card
)) {
243 req
->rq_flags
|= RQF_QUIET
;
244 return BLK_STS_IOERR
;
247 issue_type
= mmc_issue_type(mq
, req
);
249 spin_lock_irq(&mq
->lock
);
251 if (mq
->recovery_needed
|| mq
->busy
) {
252 spin_unlock_irq(&mq
->lock
);
253 return BLK_STS_RESOURCE
;
256 switch (issue_type
) {
258 if (mmc_cqe_dcmd_busy(mq
)) {
259 mq
->cqe_busy
|= MMC_CQE_DCMD_BUSY
;
260 spin_unlock_irq(&mq
->lock
);
261 return BLK_STS_RESOURCE
;
264 case MMC_ISSUE_ASYNC
:
265 if (host
->hsq_enabled
&& mq
->in_flight
[issue_type
] > host
->hsq_depth
) {
266 spin_unlock_irq(&mq
->lock
);
267 return BLK_STS_RESOURCE
;
272 * Timeouts are handled by mmc core, and we don't have a host
273 * API to abort requests, so we can't handle the timeout anyway.
274 * However, when the timeout happens, blk_mq_complete_request()
275 * no longer works (to stop the request disappearing under us).
276 * To avoid racing with that, set a large timeout.
278 req
->timeout
= 600 * HZ
;
282 /* Parallel dispatch of requests is not supported at the moment */
285 mq
->in_flight
[issue_type
] += 1;
286 get_card
= (mmc_tot_in_flight(mq
) == 1);
287 cqe_retune_ok
= (mmc_cqe_qcnt(mq
) == 1);
289 spin_unlock_irq(&mq
->lock
);
291 if (!(req
->rq_flags
& RQF_DONTPREP
)) {
292 req_to_mmc_queue_req(req
)->retries
= 0;
293 req
->rq_flags
|= RQF_DONTPREP
;
297 mmc_get_card(card
, &mq
->ctx
);
299 if (host
->cqe_enabled
) {
300 host
->retune_now
= host
->need_retune
&& cqe_retune_ok
&&
304 blk_mq_start_request(req
);
306 issued
= mmc_blk_mq_issue_rq(mq
, req
);
310 ret
= BLK_STS_RESOURCE
;
312 case MMC_REQ_FAILED_TO_START
:
320 if (issued
!= MMC_REQ_STARTED
) {
321 bool put_card
= false;
323 spin_lock_irq(&mq
->lock
);
324 mq
->in_flight
[issue_type
] -= 1;
325 if (mmc_tot_in_flight(mq
) == 0)
328 spin_unlock_irq(&mq
->lock
);
330 mmc_put_card(card
, &mq
->ctx
);
332 WRITE_ONCE(mq
->busy
, false);
338 static const struct blk_mq_ops mmc_mq_ops
= {
339 .queue_rq
= mmc_mq_queue_rq
,
340 .init_request
= mmc_mq_init_request
,
341 .exit_request
= mmc_mq_exit_request
,
342 .complete
= mmc_blk_mq_complete
,
343 .timeout
= mmc_mq_timed_out
,
346 static struct gendisk
*mmc_alloc_disk(struct mmc_queue
*mq
,
347 struct mmc_card
*card
, unsigned int features
)
349 struct mmc_host
*host
= card
->host
;
350 struct queue_limits lim
= {
351 .features
= features
,
353 struct gendisk
*disk
;
355 if (mmc_can_erase(card
))
356 mmc_queue_setup_discard(card
, &lim
);
358 lim
.max_hw_sectors
= min(host
->max_blk_count
, host
->max_req_size
/ 512);
360 if (mmc_card_mmc(card
) && card
->ext_csd
.data_sector_size
)
361 lim
.logical_block_size
= card
->ext_csd
.data_sector_size
;
363 lim
.logical_block_size
= 512;
365 WARN_ON_ONCE(lim
.logical_block_size
!= 512 &&
366 lim
.logical_block_size
!= 4096);
369 * Setting a virt_boundary implicity sets a max_segment_size, so try
370 * to set the hardware one here.
372 if (host
->can_dma_map_merge
) {
373 lim
.virt_boundary_mask
= dma_get_merge_boundary(mmc_dev(host
));
374 lim
.max_segments
= MMC_DMA_MAP_MERGE_SEGMENTS
;
376 lim
.max_segment_size
=
377 round_down(host
->max_seg_size
, lim
.logical_block_size
);
378 lim
.max_segments
= host
->max_segs
;
381 if (mmc_host_is_spi(host
) && host
->use_spi_crc
)
382 lim
.features
|= BLK_FEAT_STABLE_WRITES
;
384 disk
= blk_mq_alloc_disk(&mq
->tag_set
, &lim
, mq
);
387 mq
->queue
= disk
->queue
;
389 blk_queue_rq_timeout(mq
->queue
, 60 * HZ
);
391 if (mmc_dev(host
)->dma_parms
)
392 dma_set_max_seg_size(mmc_dev(host
), queue_max_segment_size(mq
->queue
));
394 INIT_WORK(&mq
->recovery_work
, mmc_mq_recovery_handler
);
395 INIT_WORK(&mq
->complete_work
, mmc_blk_mq_complete_work
);
397 mutex_init(&mq
->complete_lock
);
399 init_waitqueue_head(&mq
->wait
);
401 mmc_crypto_setup_queue(mq
->queue
, host
);
405 static inline bool mmc_merge_capable(struct mmc_host
*host
)
407 return host
->caps2
& MMC_CAP2_MERGE_CAPABLE
;
410 /* Set queue depth to get a reasonable value for q->nr_requests */
411 #define MMC_QUEUE_DEPTH 64
414 * mmc_init_queue - initialise a queue structure.
416 * @card: mmc card to attach this queue
417 * @features: block layer features (BLK_FEAT_*)
419 * Initialise a MMC card request queue.
421 struct gendisk
*mmc_init_queue(struct mmc_queue
*mq
, struct mmc_card
*card
,
422 unsigned int features
)
424 struct mmc_host
*host
= card
->host
;
425 struct gendisk
*disk
;
430 spin_lock_init(&mq
->lock
);
432 memset(&mq
->tag_set
, 0, sizeof(mq
->tag_set
));
433 mq
->tag_set
.ops
= &mmc_mq_ops
;
435 * The queue depth for CQE must match the hardware because the request
436 * tag is used to index the hardware queue.
438 if (host
->cqe_enabled
&& !host
->hsq_enabled
)
439 mq
->tag_set
.queue_depth
=
440 min_t(int, card
->ext_csd
.cmdq_depth
, host
->cqe_qdepth
);
442 mq
->tag_set
.queue_depth
= MMC_QUEUE_DEPTH
;
443 mq
->tag_set
.numa_node
= NUMA_NO_NODE
;
444 mq
->tag_set
.flags
= BLK_MQ_F_SHOULD_MERGE
| BLK_MQ_F_BLOCKING
;
445 mq
->tag_set
.nr_hw_queues
= 1;
446 mq
->tag_set
.cmd_size
= sizeof(struct mmc_queue_req
);
447 mq
->tag_set
.driver_data
= mq
;
450 * Since blk_mq_alloc_tag_set() calls .init_request() of mmc_mq_ops,
451 * the host->can_dma_map_merge should be set before to get max_segs
452 * from mmc_get_max_segments().
454 if (mmc_merge_capable(host
) &&
455 host
->max_segs
< MMC_DMA_MAP_MERGE_SEGMENTS
&&
456 dma_get_merge_boundary(mmc_dev(host
)))
457 host
->can_dma_map_merge
= 1;
459 host
->can_dma_map_merge
= 0;
461 ret
= blk_mq_alloc_tag_set(&mq
->tag_set
);
466 disk
= mmc_alloc_disk(mq
, card
, features
);
468 blk_mq_free_tag_set(&mq
->tag_set
);
472 void mmc_queue_suspend(struct mmc_queue
*mq
)
474 blk_mq_quiesce_queue(mq
->queue
);
477 * The host remains claimed while there are outstanding requests, so
478 * simply claiming and releasing here ensures there are none.
480 mmc_claim_host(mq
->card
->host
);
481 mmc_release_host(mq
->card
->host
);
484 void mmc_queue_resume(struct mmc_queue
*mq
)
486 blk_mq_unquiesce_queue(mq
->queue
);
489 void mmc_cleanup_queue(struct mmc_queue
*mq
)
491 struct request_queue
*q
= mq
->queue
;
494 * The legacy code handled the possibility of being suspended,
495 * so do that here too.
497 if (blk_queue_quiesced(q
))
498 blk_mq_unquiesce_queue(q
);
501 * If the recovery completes the last (and only remaining) request in
502 * the queue, and the card has been removed, we could end up here with
503 * the recovery not quite finished yet, so cancel it.
505 cancel_work_sync(&mq
->recovery_work
);
507 blk_mq_free_tag_set(&mq
->tag_set
);
510 * A request can be completed before the next request, potentially
511 * leaving a complete_work with nothing to do. Such a work item might
512 * still be queued at this point. Flush it.
514 flush_work(&mq
->complete_work
);
520 * Prepare the sg list(s) to be handed of to the host driver
522 unsigned int mmc_queue_map_sg(struct mmc_queue
*mq
, struct mmc_queue_req
*mqrq
)
524 struct request
*req
= mmc_queue_req_to_req(mqrq
);
526 return blk_rq_map_sg(mq
->queue
, req
, mqrq
->sg
);