// SPDX-License-Identifier: GPL-2.0-only
/*
 * SCSI Zoned Block commands
 *
 * Copyright (C) 2014-2015 SUSE Linux GmbH
 * Written by: Hannes Reinecke <hare@suse.de>
 * Modified by: Damien Le Moal <damien.lemoal@hgst.com>
 * Modified by: Shaun Tancheff <shaun.tancheff@seagate.com>
 */
11 #include <linux/blkdev.h>
12 #include <linux/vmalloc.h>
13 #include <linux/sched/mm.h>
15 #include <asm/unaligned.h>
17 #include <scsi/scsi.h>
18 #include <scsi/scsi_cmnd.h>
22 static int sd_zbc_parse_report(struct scsi_disk
*sdkp
, u8
*buf
,
23 unsigned int idx
, report_zones_cb cb
, void *data
)
25 struct scsi_device
*sdp
= sdkp
->device
;
26 struct blk_zone zone
= { 0 };
28 zone
.type
= buf
[0] & 0x0f;
29 zone
.cond
= (buf
[1] >> 4) & 0xf;
35 zone
.len
= logical_to_sectors(sdp
, get_unaligned_be64(&buf
[8]));
36 zone
.start
= logical_to_sectors(sdp
, get_unaligned_be64(&buf
[16]));
37 zone
.wp
= logical_to_sectors(sdp
, get_unaligned_be64(&buf
[24]));
38 if (zone
.type
!= ZBC_ZONE_TYPE_CONV
&&
39 zone
.cond
== ZBC_ZONE_COND_FULL
)
40 zone
.wp
= zone
.start
+ zone
.len
;
42 return cb(&zone
, idx
, data
);
/**
 * sd_zbc_do_report_zones - Issue a REPORT ZONES scsi command.
 * @sdkp: The target disk
 * @buf: vmalloc-ed buffer to use for the reply
 * @buflen: the buffer size
 * @lba: Start LBA of the report
 * @partial: Do partial report
 *
 * For internal use during device validation.
 * Using partial=true can significantly speed up execution of a report zones
 * command because the disk does not have to count all possible report matching
 * zones and will only report the count of zones fitting in the command reply
 * buffer.
 */
59 static int sd_zbc_do_report_zones(struct scsi_disk
*sdkp
, unsigned char *buf
,
60 unsigned int buflen
, sector_t lba
,
63 struct scsi_device
*sdp
= sdkp
->device
;
64 const int timeout
= sdp
->request_queue
->rq_timeout
;
65 struct scsi_sense_hdr sshdr
;
66 unsigned char cmd
[16];
72 cmd
[1] = ZI_REPORT_ZONES
;
73 put_unaligned_be64(lba
, &cmd
[2]);
74 put_unaligned_be32(buflen
, &cmd
[10]);
76 cmd
[14] = ZBC_REPORT_ZONE_PARTIAL
;
78 result
= scsi_execute_req(sdp
, cmd
, DMA_FROM_DEVICE
,
80 timeout
, SD_MAX_RETRIES
, NULL
);
82 sd_printk(KERN_ERR
, sdkp
,
83 "REPORT ZONES start lba %llu failed\n", lba
);
84 sd_print_result(sdkp
, "REPORT ZONES", result
);
85 if (driver_byte(result
) == DRIVER_SENSE
&&
86 scsi_sense_valid(&sshdr
))
87 sd_print_sense_hdr(sdkp
, &sshdr
);
91 rep_len
= get_unaligned_be32(&buf
[0]);
93 sd_printk(KERN_ERR
, sdkp
,
94 "REPORT ZONES report invalid length %u\n",
/**
 * sd_zbc_alloc_report_buffer - Allocate a buffer for report zones reply.
 * @sdkp: The target disk
 * @nr_zones: Maximum number of zones to report
 * @buflen: Size of the buffer allocated
 *
 * Try to allocate a reply buffer for the number of requested zones.
 * The size of the buffer allocated may be smaller than requested to
 * satisfy the device constraints (max_hw_sectors, max_segments, etc).
 *
 * Return the address of the allocated buffer and update @buflen with
 * the size of the allocated buffer.
 */
115 static void *sd_zbc_alloc_report_buffer(struct scsi_disk
*sdkp
,
116 unsigned int nr_zones
, size_t *buflen
)
118 struct request_queue
*q
= sdkp
->disk
->queue
;
123 * Report zone buffer size should be at most 64B times the number of
124 * zones requested plus the 64B reply header, but should be at least
125 * SECTOR_SIZE for ATA devices.
126 * Make sure that this size does not exceed the hardware capabilities.
127 * Furthermore, since the report zone command cannot be split, make
128 * sure that the allocated buffer can always be mapped by limiting the
129 * number of pages allocated to the HBA max segments limit.
131 nr_zones
= min(nr_zones
, sdkp
->nr_zones
);
132 bufsize
= roundup((nr_zones
+ 1) * 64, SECTOR_SIZE
);
133 bufsize
= min_t(size_t, bufsize
,
134 queue_max_hw_sectors(q
) << SECTOR_SHIFT
);
135 bufsize
= min_t(size_t, bufsize
, queue_max_segments(q
) << PAGE_SHIFT
);
137 while (bufsize
>= SECTOR_SIZE
) {
138 buf
= __vmalloc(bufsize
,
139 GFP_KERNEL
| __GFP_ZERO
| __GFP_NORETRY
,
152 * sd_zbc_zone_sectors - Get the device zone size in number of 512B sectors.
153 * @sdkp: The target disk
155 static inline sector_t
sd_zbc_zone_sectors(struct scsi_disk
*sdkp
)
157 return logical_to_sectors(sdkp
->device
, sdkp
->zone_blocks
);
160 int sd_zbc_report_zones(struct gendisk
*disk
, sector_t sector
,
161 unsigned int nr_zones
, report_zones_cb cb
, void *data
)
163 struct scsi_disk
*sdkp
= scsi_disk(disk
);
166 size_t offset
, buflen
= 0;
170 if (!sd_is_zoned(sdkp
))
171 /* Not a zoned device */
174 buf
= sd_zbc_alloc_report_buffer(sdkp
, nr_zones
, &buflen
);
178 while (zone_idx
< nr_zones
&& sector
< get_capacity(disk
)) {
179 ret
= sd_zbc_do_report_zones(sdkp
, buf
, buflen
,
180 sectors_to_logical(sdkp
->device
, sector
), true);
185 nr
= min(nr_zones
, get_unaligned_be32(&buf
[0]) / 64);
189 for (i
= 0; i
< nr
&& zone_idx
< nr_zones
; i
++) {
191 ret
= sd_zbc_parse_report(sdkp
, buf
+ offset
, zone_idx
,
198 sector
+= sd_zbc_zone_sectors(sdkp
) * i
;
/**
 * sd_zbc_setup_zone_mgmt_cmnd - Prepare a zone ZBC_OUT command. The operations
 *			can be RESET WRITE POINTER, OPEN, CLOSE or FINISH.
 * @cmd: the command to setup
 * @op: Operation to be performed
 * @all: All zones control
 *
 * Called from sd_init_command() for REQ_OP_ZONE_RESET, REQ_OP_ZONE_RESET_ALL,
 * REQ_OP_ZONE_OPEN, REQ_OP_ZONE_CLOSE or REQ_OP_ZONE_FINISH requests.
 */
217 blk_status_t
sd_zbc_setup_zone_mgmt_cmnd(struct scsi_cmnd
*cmd
,
218 unsigned char op
, bool all
)
220 struct request
*rq
= cmd
->request
;
221 struct scsi_disk
*sdkp
= scsi_disk(rq
->rq_disk
);
222 sector_t sector
= blk_rq_pos(rq
);
223 sector_t block
= sectors_to_logical(sdkp
->device
, sector
);
225 if (!sd_is_zoned(sdkp
))
226 /* Not a zoned device */
227 return BLK_STS_IOERR
;
229 if (sdkp
->device
->changed
)
230 return BLK_STS_IOERR
;
232 if (sector
& (sd_zbc_zone_sectors(sdkp
) - 1))
233 /* Unaligned request */
234 return BLK_STS_IOERR
;
237 memset(cmd
->cmnd
, 0, cmd
->cmd_len
);
238 cmd
->cmnd
[0] = ZBC_OUT
;
243 put_unaligned_be64(block
, &cmd
->cmnd
[2]);
245 rq
->timeout
= SD_TIMEOUT
;
246 cmd
->sc_data_direction
= DMA_NONE
;
247 cmd
->transfersize
= 0;
/**
 * sd_zbc_complete - ZBC command post processing.
 * @cmd: Completed command
 * @good_bytes: Command reply bytes
 * @sshdr: command sense header
 *
 * Called from sd_done(). Process report zones reply and handle reset zone
 * and write command errors.
 */
262 void sd_zbc_complete(struct scsi_cmnd
*cmd
, unsigned int good_bytes
,
263 struct scsi_sense_hdr
*sshdr
)
265 int result
= cmd
->result
;
266 struct request
*rq
= cmd
->request
;
268 if (op_is_zone_mgmt(req_op(rq
)) &&
270 sshdr
->sense_key
== ILLEGAL_REQUEST
&&
271 sshdr
->asc
== 0x24) {
273 * INVALID FIELD IN CDB error: a zone management command was
274 * attempted on a conventional zone. Nothing to worry about,
275 * so be quiet about the error.
277 rq
->rq_flags
|= RQF_QUIET
;
/**
 * sd_zbc_check_zoned_characteristics - Check zoned block device characteristics
 * @sdkp: The target disk
 * @buf: Buffer where to store the VPD page data
 *
 * Read VPD page B6, get information and check that reads are unconstrained.
 */
288 static int sd_zbc_check_zoned_characteristics(struct scsi_disk
*sdkp
,
292 if (scsi_get_vpd_page(sdkp
->device
, 0xb6, buf
, 64)) {
293 sd_printk(KERN_NOTICE
, sdkp
,
294 "Read zoned characteristics VPD page failed\n");
298 if (sdkp
->device
->type
!= TYPE_ZBC
) {
301 sdkp
->zones_optimal_open
= get_unaligned_be32(&buf
[8]);
302 sdkp
->zones_optimal_nonseq
= get_unaligned_be32(&buf
[12]);
303 sdkp
->zones_max_open
= 0;
306 sdkp
->urswrz
= buf
[4] & 1;
307 sdkp
->zones_optimal_open
= 0;
308 sdkp
->zones_optimal_nonseq
= 0;
309 sdkp
->zones_max_open
= get_unaligned_be32(&buf
[16]);
313 * Check for unconstrained reads: host-managed devices with
314 * constrained reads (drives failing read after write pointer)
318 if (sdkp
->first_scan
)
319 sd_printk(KERN_NOTICE
, sdkp
,
320 "constrained reads devices are not supported\n");
/**
 * sd_zbc_check_capacity - Check the device capacity
 * @sdkp: The target disk
 * @buf: command buffer
 * @zblocks: zone size in number of blocks
 *
 * Get the device zone size and check that the device capacity as reported
 * by READ CAPACITY matches the max_lba value (plus one) of the report zones
 * command reply for devices with RC_BASIS == 0.
 *
 * Returns 0 upon success or an error code upon failure.
 */
339 static int sd_zbc_check_capacity(struct scsi_disk
*sdkp
, unsigned char *buf
,
347 /* Do a report zone to get max_lba and the size of the first zone */
348 ret
= sd_zbc_do_report_zones(sdkp
, buf
, SD_BUF_SIZE
, 0, false);
352 if (sdkp
->rc_basis
== 0) {
353 /* The max_lba field is the capacity of this device */
354 max_lba
= get_unaligned_be64(&buf
[8]);
355 if (sdkp
->capacity
!= max_lba
+ 1) {
356 if (sdkp
->first_scan
)
357 sd_printk(KERN_WARNING
, sdkp
,
358 "Changing capacity from %llu to max LBA+1 %llu\n",
359 (unsigned long long)sdkp
->capacity
,
360 (unsigned long long)max_lba
+ 1);
361 sdkp
->capacity
= max_lba
+ 1;
365 /* Get the size of the first reported zone */
367 zone_blocks
= get_unaligned_be64(&rec
[8]);
368 if (logical_to_sectors(sdkp
->device
, zone_blocks
) > UINT_MAX
) {
369 if (sdkp
->first_scan
)
370 sd_printk(KERN_NOTICE
, sdkp
,
371 "Zone size too large\n");
375 *zblocks
= zone_blocks
;
380 int sd_zbc_read_zones(struct scsi_disk
*sdkp
, unsigned char *buf
)
382 struct gendisk
*disk
= sdkp
->disk
;
383 unsigned int nr_zones
;
387 if (!sd_is_zoned(sdkp
))
389 * Device managed or normal SCSI disk,
390 * no special handling required
394 /* Check zoned block device characteristics (unconstrained reads) */
395 ret
= sd_zbc_check_zoned_characteristics(sdkp
, buf
);
399 /* Check the device capacity reported by report zones */
400 ret
= sd_zbc_check_capacity(sdkp
, buf
, &zone_blocks
);
404 /* The drive satisfies the kernel restrictions: set it up */
405 blk_queue_flag_set(QUEUE_FLAG_ZONE_RESETALL
, sdkp
->disk
->queue
);
406 blk_queue_required_elevator_features(sdkp
->disk
->queue
,
407 ELEVATOR_F_ZBD_SEQ_WRITE
);
408 nr_zones
= round_up(sdkp
->capacity
, zone_blocks
) >> ilog2(zone_blocks
);
410 /* READ16/WRITE16 is mandatory for ZBC disks */
411 sdkp
->device
->use_16_for_rw
= 1;
412 sdkp
->device
->use_10_for_rw
= 0;
415 * Revalidate the disk zone bitmaps once the block device capacity is
416 * set on the second revalidate execution during disk scan and if
417 * something changed when executing a normal revalidate.
419 if (sdkp
->first_scan
) {
420 sdkp
->zone_blocks
= zone_blocks
;
421 sdkp
->nr_zones
= nr_zones
;
425 if (sdkp
->zone_blocks
!= zone_blocks
||
426 sdkp
->nr_zones
!= nr_zones
||
427 disk
->queue
->nr_zones
!= nr_zones
) {
428 ret
= blk_revalidate_disk_zones(disk
);
431 sdkp
->zone_blocks
= zone_blocks
;
432 sdkp
->nr_zones
= nr_zones
;
443 void sd_zbc_print_zones(struct scsi_disk
*sdkp
)
445 if (!sd_is_zoned(sdkp
) || !sdkp
->capacity
)
448 if (sdkp
->capacity
& (sdkp
->zone_blocks
- 1))
449 sd_printk(KERN_NOTICE
, sdkp
,
450 "%u zones of %u logical blocks + 1 runt zone\n",
454 sd_printk(KERN_NOTICE
, sdkp
,
455 "%u zones of %u logical blocks\n",