1 // SPDX-License-Identifier: GPL-2.0-only
3 * SCSI Zoned Block commands
5 * Copyright (C) 2014-2015 SUSE Linux GmbH
6 * Written by: Hannes Reinecke <hare@suse.de>
7 * Modified by: Damien Le Moal <damien.lemoal@hgst.com>
8 * Modified by: Shaun Tancheff <shaun.tancheff@seagate.com>
11 #include <linux/blkdev.h>
12 #include <linux/vmalloc.h>
13 #include <linux/sched/mm.h>
15 #include <asm/unaligned.h>
17 #include <scsi/scsi.h>
18 #include <scsi/scsi_cmnd.h>
/*
 * sd_zbc_parse_report - Turn one zone descriptor of a REPORT ZONES reply
 * into a struct blk_zone and pass it to the report callback.
 * @sdkp: The target disk
 * @buf: Start of the zone descriptor to decode
 * @idx: Zone index, passed unchanged to @cb
 * @cb: Callback receiving the decoded zone
 * @data: Caller context, passed unchanged to @cb
 *
 * Returns whatever @cb returns.
 */
22 static int sd_zbc_parse_report(struct scsi_disk
*sdkp
, u8
*buf
,
23 unsigned int idx
, report_zones_cb cb
, void *data
)
25 struct scsi_device
*sdp
= sdkp
->device
;
26 struct blk_zone zone
= { 0 };
/* Zone type: low 4 bits of byte 0. Zone condition: high 4 bits of byte 1. */
28 zone
.type
= buf
[0] & 0x0f;
29 zone
.cond
= (buf
[1] >> 4) & 0xf;
/*
 * Length, start and write pointer are big-endian 64-bit values at byte
 * offsets 8, 16 and 24, each run through logical_to_sectors().
 */
35 zone
.len
= logical_to_sectors(sdp
, get_unaligned_be64(&buf
[8]));
36 zone
.start
= logical_to_sectors(sdp
, get_unaligned_be64(&buf
[16]));
37 zone
.wp
= logical_to_sectors(sdp
, get_unaligned_be64(&buf
[24]));
/*
 * For a non-conventional zone in the FULL condition, override the write
 * pointer so that it sits at the end of the zone.
 */
38 if (zone
.type
!= ZBC_ZONE_TYPE_CONV
&&
39 zone
.cond
== ZBC_ZONE_COND_FULL
)
40 zone
.wp
= zone
.start
+ zone
.len
;
42 return cb(&zone
, idx
, data
);
46 * sd_zbc_do_report_zones - Issue a REPORT ZONES scsi command.
47 * @sdkp: The target disk
48 * @buf: vmalloc-ed buffer to use for the reply
49 * @buflen: the buffer size
50 * @lba: Start LBA of the report
51 * @partial: Do partial report
53 * For internal use during device validation.
54 * Using partial=true can significantly speed up execution of a report zones
55 * command because the disk does not have to count all possible report matching
56 * zones and will only report the count of zones fitting in the command reply
59 static int sd_zbc_do_report_zones(struct scsi_disk
*sdkp
, unsigned char *buf
,
60 unsigned int buflen
, sector_t lba
,
63 struct scsi_device
*sdp
= sdkp
->device
;
/* Use the request queue timeout for the command */
64 const int timeout
= sdp
->request_queue
->rq_timeout
;
65 struct scsi_sense_hdr sshdr
;
66 unsigned char cmd
[16];
/*
 * CDB layout as filled in here: ZI_REPORT_ZONES in byte 1, the start LBA
 * as a big-endian 64-bit value at bytes 2-9 and the reply buffer length
 * as a big-endian 32-bit value at bytes 10-13.
 */
72 cmd
[1] = ZI_REPORT_ZONES
;
73 put_unaligned_be64(lba
, &cmd
[2]);
74 put_unaligned_be32(buflen
, &cmd
[10]);
/*
 * Byte 14 carries the partial report flag.
 * NOTE(review): presumably only set when a partial report was requested;
 * the guarding condition is not visible here - confirm.
 */
76 cmd
[14] = ZBC_REPORT_ZONE_PARTIAL
;
78 result
= scsi_execute_req(sdp
, cmd
, DMA_FROM_DEVICE
,
80 timeout
, SD_MAX_RETRIES
, NULL
);
/*
 * Failure reporting: log the start LBA and the command result, plus the
 * sense header when the driver byte says sense data is present and the
 * header is valid.
 */
82 sd_printk(KERN_ERR
, sdkp
,
83 "REPORT ZONES start lba %llu failed\n", lba
);
84 sd_print_result(sdkp
, "REPORT ZONES", result
);
85 if (driver_byte(result
) == DRIVER_SENSE
&&
86 scsi_sense_valid(&sshdr
))
87 sd_print_sense_hdr(sdkp
, &sshdr
);
/* The reply starts with a big-endian 32-bit length field */
91 rep_len
= get_unaligned_be32(&buf
[0]);
93 sd_printk(KERN_ERR
, sdkp
,
94 "REPORT ZONES report invalid length %u\n",
103 * Allocate a buffer for report zones reply.
104 * @sdkp: The target disk
105 * @nr_zones: Maximum number of zones to report
106 * @buflen: Size of the buffer allocated
108 * Try to allocate a reply buffer for the number of requested zones.
109 * The size of the buffer allocated may be smaller than requested to
110 * satisfy the device constraint (max_hw_sectors, max_segments, etc).
112 * Return the address of the allocated buffer and update @buflen with
113 * the size of the allocated buffer.
115 static void *sd_zbc_alloc_report_buffer(struct scsi_disk
*sdkp
,
116 unsigned int nr_zones
, size_t *buflen
)
118 struct request_queue
*q
= sdkp
->disk
->queue
;
123 * Report zone buffer size should be at most 64B times the number of
124 * zones requested plus the 64B reply header, but should be at least
125 * SECTOR_SIZE for ATA devices.
126 * Make sure that this size does not exceed the hardware capabilities.
127 * Furthermore, since the report zone command cannot be split, make
128 * sure that the allocated buffer can always be mapped by limiting the
129 * number of pages allocated to the HBA max segments limit.
/* Never size the buffer for more zones than the disk has */
131 nr_zones
= min(nr_zones
, sdkp
->nr_zones
);
/* 64 bytes per zone plus 64 bytes of header, rounded up to SECTOR_SIZE */
132 bufsize
= roundup((nr_zones
+ 1) * 64, SECTOR_SIZE
);
/* Clamp to the queue limits: max_hw_sectors in bytes, then max_segments pages */
133 bufsize
= min_t(size_t, bufsize
,
134 queue_max_hw_sectors(q
) << SECTOR_SHIFT
);
135 bufsize
= min_t(size_t, bufsize
, queue_max_segments(q
) << PAGE_SHIFT
);
/*
 * Attempt a zeroed, no-retry vmalloc allocation as long as the size is at
 * least SECTOR_SIZE.
 * NOTE(review): how bufsize changes between attempts is not visible here.
 */
137 while (bufsize
>= SECTOR_SIZE
) {
138 buf
= __vmalloc(bufsize
,
139 GFP_KERNEL
| __GFP_ZERO
| __GFP_NORETRY
,
152 * sd_zbc_zone_sectors - Get the device zone size in number of 512B sectors.
153 * @sdkp: The target disk
155 static inline sector_t
sd_zbc_zone_sectors(struct scsi_disk
*sdkp
)
/* sdkp->zone_blocks is converted to sectors for the disk's device */
157 return logical_to_sectors(sdkp
->device
, sdkp
->zone_blocks
);
/*
 * sd_zbc_report_zones - Report the zones of a zoned disk.
 * @disk: The disk to report on
 * @sector: Sector to start the report from
 * @nr_zones: Maximum number of zones to report
 * @cb: Report callback
 * @data: Caller context for @cb
 *
 * Issues partial REPORT ZONES commands starting at @sector and hands the
 * returned zone descriptors to sd_zbc_parse_report(), looping until
 * @nr_zones zones were processed or the disk capacity is reached.
 * NOTE(review): the error paths, the forwarding of @cb/@data and the return
 * value are not visible here - confirm against the complete function.
 */
160 int sd_zbc_report_zones(struct gendisk
*disk
, sector_t sector
,
161 unsigned int nr_zones
, report_zones_cb cb
, void *data
)
163 struct scsi_disk
*sdkp
= scsi_disk(disk
);
/* Disk capacity converted from logical blocks to sectors */
164 sector_t capacity
= logical_to_sectors(sdkp
->device
, sdkp
->capacity
);
167 size_t offset
, buflen
= 0;
171 if (!sd_is_zoned(sdkp
))
172 /* Not a zoned device */
176 /* Device gone or invalid */
/* buflen is updated with the size actually allocated */
179 buf
= sd_zbc_alloc_report_buffer(sdkp
, nr_zones
, &buflen
);
183 while (zone_idx
< nr_zones
&& sector
< capacity
) {
/* Partial report starting at the LBA matching the current sector */
184 ret
= sd_zbc_do_report_zones(sdkp
, buf
, buflen
,
185 sectors_to_logical(sdkp
->device
, sector
), true);
/*
 * The first 4 reply bytes give the zone list length; dividing by 64
 * yields the number of descriptors, capped at nr_zones.
 */
190 nr
= min(nr_zones
, get_unaligned_be32(&buf
[0]) / 64);
194 for (i
= 0; i
< nr
&& zone_idx
< nr_zones
; i
++) {
196 ret
= sd_zbc_parse_report(sdkp
, buf
+ offset
, zone_idx
,
/* Move the start sector forward by i zones */
203 sector
+= sd_zbc_zone_sectors(sdkp
) * i
;
213 * sd_zbc_setup_zone_mgmt_cmnd - Prepare a zone ZBC_OUT command. The operations
214 * can be RESET WRITE POINTER, OPEN, CLOSE or FINISH.
215 * @cmd: the command to setup
216 * @op: Operation to be performed
217 * @all: All zones control
219 * Called from sd_init_command() for REQ_OP_ZONE_RESET, REQ_OP_ZONE_RESET_ALL,
220 * REQ_OP_ZONE_OPEN, REQ_OP_ZONE_CLOSE or REQ_OP_ZONE_FINISH requests.
222 blk_status_t
sd_zbc_setup_zone_mgmt_cmnd(struct scsi_cmnd
*cmd
,
223 unsigned char op
, bool all
)
225 struct request
*rq
= cmd
->request
;
226 struct scsi_disk
*sdkp
= scsi_disk(rq
->rq_disk
);
/* Request start position, in sectors and in device logical blocks */
227 sector_t sector
= blk_rq_pos(rq
);
228 sector_t block
= sectors_to_logical(sdkp
->device
, sector
);
230 if (!sd_is_zoned(sdkp
))
231 /* Not a zoned device */
232 return BLK_STS_IOERR
;
/* Fail the request while the device is flagged as changed */
234 if (sdkp
->device
->changed
)
235 return BLK_STS_IOERR
;
/*
 * The request must start on a zone boundary. The mask test only works
 * for a power of 2 zone size, which sd_zbc_check_zones() enforces.
 */
237 if (sector
& (sd_zbc_zone_sectors(sdkp
) - 1))
238 /* Unaligned request */
239 return BLK_STS_IOERR
;
/* Start from a zeroed CDB with the ZBC_OUT opcode in byte 0 */
242 memset(cmd
->cmnd
, 0, cmd
->cmd_len
);
243 cmd
->cmnd
[0] = ZBC_OUT
;
/* Start block of the request as a big-endian 64-bit value at bytes 2-9 */
248 put_unaligned_be64(block
, &cmd
->cmnd
[2]);
250 rq
->timeout
= SD_TIMEOUT
;
/* No data phase: direction is DMA_NONE and the transfer size is zero */
251 cmd
->sc_data_direction
= DMA_NONE
;
252 cmd
->transfersize
= 0;
259 * sd_zbc_complete - ZBC command post processing.
260 * @cmd: Completed command
261 * @good_bytes: Command reply bytes
262 * @sshdr: command sense header
264 * Called from sd_done(). Process report zones reply and handle reset zone
265 * and write commands errors.
267 void sd_zbc_complete(struct scsi_cmnd
*cmd
, unsigned int good_bytes
,
268 struct scsi_sense_hdr
*sshdr
)
270 int result
= cmd
->result
;
271 struct request
*rq
= cmd
->request
;
/*
 * Match zone management requests whose sense data reports ILLEGAL REQUEST
 * with additional sense code 0x24.
 * NOTE(review): one term of this condition is not visible here.
 */
273 if (op_is_zone_mgmt(req_op(rq
)) &&
275 sshdr
->sense_key
== ILLEGAL_REQUEST
&&
276 sshdr
->asc
== 0x24) {
278 * INVALID FIELD IN CDB error: a zone management command was
279 * attempted on a conventional zone. Nothing to worry about,
280 * so be quiet about the error.
/* Mark the request with RQF_QUIET */
282 rq
->rq_flags
|= RQF_QUIET
;
287 * sd_zbc_check_zoned_characteristics - Check zoned block device characteristics
289 * @buf: Buffer where to store the VPD page data
291 * Read VPD page B6, get information and check that reads are unconstrained.
293 static int sd_zbc_check_zoned_characteristics(struct scsi_disk
*sdkp
,
/* Fetch 64 bytes of VPD page 0xB6 into buf; log a notice on failure */
297 if (scsi_get_vpd_page(sdkp
->device
, 0xb6, buf
, 64)) {
298 sd_printk(KERN_NOTICE
, sdkp
,
299 "Read zoned characteristics VPD page failed\n");
/*
 * Device type other than TYPE_ZBC: the optimal open and optimal
 * non-sequential zone counts are the big-endian 32-bit values at bytes 8
 * and 12, and the maximum open zones count is set to 0.
 */
303 if (sdkp
->device
->type
!= TYPE_ZBC
) {
306 sdkp
->zones_optimal_open
= get_unaligned_be32(&buf
[8]);
307 sdkp
->zones_optimal_nonseq
= get_unaligned_be32(&buf
[12]);
308 sdkp
->zones_max_open
= 0;
/*
 * NOTE(review): presumably the TYPE_ZBC branch - the line separating the
 * two branches is not visible here. urswrz is bit 0 of byte 4, the
 * optimal counts are zeroed and the maximum open zones count is the
 * big-endian 32-bit value at byte 16.
 */
311 sdkp
->urswrz
= buf
[4] & 1;
312 sdkp
->zones_optimal_open
= 0;
313 sdkp
->zones_optimal_nonseq
= 0;
314 sdkp
->zones_max_open
= get_unaligned_be32(&buf
[16]);
318 * Check for unconstrained reads: host-managed devices with
319 * constrained reads (drives failing read after write pointer)
/* The notice is only printed on the first scan of the disk */
323 if (sdkp
->first_scan
)
324 sd_printk(KERN_NOTICE
, sdkp
,
325 "constrained reads devices are not supported\n");
333 * sd_zbc_check_zones - Check the device capacity and zone sizes
336 * Check that the device capacity as reported by READ CAPACITY matches the
337 * max_lba value (plus one) of the report zones command reply. Also check that
338 * all zones of the device have an equal size, only allowing the last zone of
339 * the disk to have a smaller size (runt zone). The zone size must also be a
342 * Returns the zone size in number of blocks upon success or an error code
345 static int sd_zbc_check_zones(struct scsi_disk
*sdkp
, unsigned char *buf
,
353 /* Do a report zone to get max_lba and the size of the first zone */
354 ret
= sd_zbc_do_report_zones(sdkp
, buf
, SD_BUF_SIZE
, 0, false);
358 if (sdkp
->rc_basis
== 0) {
359 /* The max_lba field is the capacity of this device */
360 max_lba
= get_unaligned_be64(&buf
[8]);
/*
 * The recorded capacity differs from max_lba + 1: warn on the first
 * scan only, then adopt max_lba + 1 as the capacity.
 */
361 if (sdkp
->capacity
!= max_lba
+ 1) {
362 if (sdkp
->first_scan
)
363 sd_printk(KERN_WARNING
, sdkp
,
364 "Changing capacity from %llu to max LBA+1 %llu\n",
365 (unsigned long long)sdkp
->capacity
,
366 (unsigned long long)max_lba
+ 1);
367 sdkp
->capacity
= max_lba
+ 1;
371 /* Parse REPORT ZONES header */
/*
 * Zone length: big-endian 64-bit value at byte 8 of the record at rec.
 * NOTE(review): where rec is set is not visible here - presumably the
 * first zone descriptor of the reply; confirm.
 */
373 zone_blocks
= get_unaligned_be64(&rec
[8]);
/* Reject a zero or non power of 2 zone size */
374 if (!zone_blocks
|| !is_power_of_2(zone_blocks
)) {
375 if (sdkp
->first_scan
)
376 sd_printk(KERN_NOTICE
, sdkp
,
377 "Devices with non power of 2 zone "
378 "size are not supported\n");
/* The zone size converted to sectors must not exceed UINT_MAX */
382 if (logical_to_sectors(sdkp
->device
, zone_blocks
) > UINT_MAX
) {
383 if (sdkp
->first_scan
)
384 sd_printk(KERN_NOTICE
, sdkp
,
385 "Zone size too large\n");
/* Pass the validated zone size back through *zblocks */
389 *zblocks
= zone_blocks
;
/*
 * sd_zbc_read_zones - Validate a zoned disk and record its zone geometry.
 * @sdkp: The target disk
 * @buf: Buffer handed to the characteristics and zone check helpers
 *
 * Runs sd_zbc_check_zoned_characteristics() and sd_zbc_check_zones(), then
 * sets up the request queue for zoned operation, computes the number of
 * zones and stores the zone size and zone count in @sdkp. Outside of the
 * first scan, blk_revalidate_disk_zones() is called when the geometry
 * changed.
 * NOTE(review): the error paths and the return value are not visible here -
 * confirm against the complete function.
 */
394 int sd_zbc_read_zones(struct scsi_disk
*sdkp
, unsigned char *buf
)
396 struct gendisk
*disk
= sdkp
->disk
;
397 unsigned int nr_zones
;
401 if (!sd_is_zoned(sdkp
))
403 * Device managed or normal SCSI disk,
404 * no special handling required
408 /* Check zoned block device characteristics (unconstrained reads) */
409 ret
= sd_zbc_check_zoned_characteristics(sdkp
, buf
);
414 * Check zone size: only devices with a constant zone size (except
415 * an eventual last runt zone) that is a power of 2 are supported.
417 ret
= sd_zbc_check_zones(sdkp
, buf
, &zone_blocks
);
421 /* The drive satisfies the kernel restrictions: set it up */
422 blk_queue_flag_set(QUEUE_FLAG_ZONE_RESETALL
, sdkp
->disk
->queue
);
423 blk_queue_required_elevator_features(sdkp
->disk
->queue
,
424 ELEVATOR_F_ZBD_SEQ_WRITE
);
/*
 * Zone count: the capacity rounded up to a multiple of the zone size,
 * divided by the (power of 2) zone size with a shift. A smaller last
 * zone is therefore counted as one zone.
 */
425 nr_zones
= round_up(sdkp
->capacity
, zone_blocks
) >> ilog2(zone_blocks
);
427 /* READ16/WRITE16 is mandatory for ZBC disks */
428 sdkp
->device
->use_16_for_rw
= 1;
429 sdkp
->device
->use_10_for_rw
= 0;
432 * Revalidate the disk zone bitmaps once the block device capacity is
433 * set on the second revalidate execution during disk scan and if
434 * something changed when executing a normal revalidate.
436 if (sdkp
->first_scan
) {
/* First scan: record the zone size and the zone count */
437 sdkp
->zone_blocks
= zone_blocks
;
438 sdkp
->nr_zones
= nr_zones
;
/*
 * Revalidate the disk zones when the stored zone size, the stored zone
 * count or the queue's zone count differs from the new values.
 */
442 if (sdkp
->zone_blocks
!= zone_blocks
||
443 sdkp
->nr_zones
!= nr_zones
||
444 disk
->queue
->nr_zones
!= nr_zones
) {
445 ret
= blk_revalidate_disk_zones(disk
);
/* Store the new zone size and zone count */
448 sdkp
->zone_blocks
= zone_blocks
;
449 sdkp
->nr_zones
= nr_zones
;
460 void sd_zbc_print_zones(struct scsi_disk
*sdkp
)
462 if (!sd_is_zoned(sdkp
) || !sdkp
->capacity
)
465 if (sdkp
->capacity
& (sdkp
->zone_blocks
- 1))
466 sd_printk(KERN_NOTICE
, sdkp
,
467 "%u zones of %u logical blocks + 1 runt zone\n",
471 sd_printk(KERN_NOTICE
, sdkp
,
472 "%u zones of %u logical blocks\n",