2 * Threaded data processing for Qcow2: compression, encryption
4 * Copyright (c) 2004-2006 Fabrice Bellard
5 * Copyright (c) 2018 Virtuozzo International GmbH. All rights reserved.
7 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 * of this software and associated documentation files (the "Software"), to deal
9 * in the Software without restriction, including without limitation the rights
10 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 * copies of the Software, and to permit persons to whom the Software is
12 * furnished to do so, subject to the following conditions:
14 * The above copyright notice and this permission notice shall be included in
15 * all copies or substantial portions of the Software.
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
26 #include "qemu/osdep.h"
33 #include <zstd_errors.h>
37 #include "block/block-io.h"
38 #include "block/thread-pool.h"
41 static int coroutine_fn
42 qcow2_co_process(BlockDriverState
*bs
, ThreadPoolFunc
*func
, void *arg
)
45 BDRVQcow2State
*s
= bs
->opaque
;
46 ThreadPool
*pool
= aio_get_thread_pool(bdrv_get_aio_context(bs
));
48 qemu_co_mutex_lock(&s
->lock
);
49 while (s
->nb_threads
>= QCOW2_MAX_THREADS
) {
50 qemu_co_queue_wait(&s
->thread_task_queue
, &s
->lock
);
53 qemu_co_mutex_unlock(&s
->lock
);
55 ret
= thread_pool_submit_co(pool
, func
, arg
);
57 qemu_co_mutex_lock(&s
->lock
);
59 qemu_co_queue_next(&s
->thread_task_queue
);
60 qemu_co_mutex_unlock(&s
->lock
);
70 typedef ssize_t (*Qcow2CompressFunc
)(void *dest
, size_t dest_size
,
71 const void *src
, size_t src_size
);
72 typedef struct Qcow2CompressData
{
79 Qcow2CompressFunc func
;
83 * qcow2_zlib_compress()
85 * Compress @src_size bytes of data using zlib compression method
87 * @dest - destination buffer, @dest_size bytes
88 * @src - source buffer, @src_size bytes
90 * Returns: compressed size on success
91 * -ENOMEM destination buffer is not enough to store compressed data
92 * -EIO on any other error
94 static ssize_t
qcow2_zlib_compress(void *dest
, size_t dest_size
,
95 const void *src
, size_t src_size
)
100 /* best compression, small window, no zlib header */
101 memset(&strm
, 0, sizeof(strm
));
102 ret
= deflateInit2(&strm
, Z_DEFAULT_COMPRESSION
, Z_DEFLATED
,
103 -12, 9, Z_DEFAULT_STRATEGY
);
109 * strm.next_in is not const in old zlib versions, such as those used on
110 * OpenBSD/NetBSD, so cast the const away
112 strm
.avail_in
= src_size
;
113 strm
.next_in
= (void *) src
;
114 strm
.avail_out
= dest_size
;
115 strm
.next_out
= dest
;
117 ret
= deflate(&strm
, Z_FINISH
);
118 if (ret
== Z_STREAM_END
) {
119 ret
= dest_size
- strm
.avail_out
;
121 ret
= (ret
== Z_OK
? -ENOMEM
: -EIO
);
130 * qcow2_zlib_decompress()
132 * Decompress some data (not more than @src_size bytes) to produce exactly
133 * @dest_size bytes using zlib compression method
135 * @dest - destination buffer, @dest_size bytes
136 * @src - source buffer, @src_size bytes
138 * Returns: 0 on success
141 static ssize_t
qcow2_zlib_decompress(void *dest
, size_t dest_size
,
142 const void *src
, size_t src_size
)
147 memset(&strm
, 0, sizeof(strm
));
148 strm
.avail_in
= src_size
;
149 strm
.next_in
= (void *) src
;
150 strm
.avail_out
= dest_size
;
151 strm
.next_out
= dest
;
153 ret
= inflateInit2(&strm
, -12);
158 ret
= inflate(&strm
, Z_FINISH
);
159 if ((ret
== Z_STREAM_END
|| ret
== Z_BUF_ERROR
) && strm
.avail_out
== 0) {
161 * We approve Z_BUF_ERROR because we need @dest buffer to be filled, but
162 * @src buffer may be processed partly (because in qcow2 we know size of
163 * compressed data with precision of one sector)
178 * qcow2_zstd_compress()
180 * Compress @src_size bytes of data using zstd compression method
182 * @dest - destination buffer, @dest_size bytes
183 * @src - source buffer, @src_size bytes
185 * Returns: compressed size on success
186 * -ENOMEM destination buffer is not enough to store compressed data
187 * -EIO on any other error
189 static ssize_t
qcow2_zstd_compress(void *dest
, size_t dest_size
,
190 const void *src
, size_t src_size
)
194 ZSTD_outBuffer output
= {
199 ZSTD_inBuffer input
= {
204 ZSTD_CCtx
*cctx
= ZSTD_createCCtx();
210 * Use the zstd streamed interface for symmetry with decompression,
211 * where streaming is essential since we don't record the exact
214 * ZSTD_compressStream2() tries to compress everything it could
215 * with a single call. Although, ZSTD docs says that:
216 * "You must continue calling ZSTD_compressStream2() with ZSTD_e_end
217 * until it returns 0, at which point you are free to start a new frame",
218 * in out tests we saw the only case when it returned with >0 -
219 * when the output buffer was too small. In that case,
220 * ZSTD_compressStream2() expects a bigger buffer on the next call.
221 * We can't provide a bigger buffer because we are limited with dest_size
222 * which we pass to the ZSTD_compressStream2() at once.
223 * So, we don't need any loops and just abort the compression when we
224 * don't get 0 result on the first call.
226 zstd_ret
= ZSTD_compressStream2(cctx
, &output
, &input
, ZSTD_e_end
);
229 if (zstd_ret
> output
.size
- output
.pos
) {
237 /* make sure that zstd didn't overflow the dest buffer */
238 assert(output
.pos
<= dest_size
);
246 * qcow2_zstd_decompress()
248 * Decompress some data (not more than @src_size bytes) to produce exactly
249 * @dest_size bytes using zstd compression method
251 * @dest - destination buffer, @dest_size bytes
252 * @src - source buffer, @src_size bytes
254 * Returns: 0 on success
257 static ssize_t
qcow2_zstd_decompress(void *dest
, size_t dest_size
,
258 const void *src
, size_t src_size
)
262 ZSTD_outBuffer output
= {
267 ZSTD_inBuffer input
= {
272 ZSTD_DCtx
*dctx
= ZSTD_createDCtx();
279 * The compressed stream from the input buffer may consist of more
280 * than one zstd frame. So we iterate until we get a fully
281 * uncompressed cluster.
282 * From zstd docs related to ZSTD_decompressStream:
283 * "return : 0 when a frame is completely decoded and fully flushed"
284 * We suppose that this means: each time ZSTD_decompressStream reads
285 * only ONE full frame and returns 0 if and only if that frame
286 * is completely decoded and flushed. Only after returning 0,
287 * ZSTD_decompressStream reads another ONE full frame.
289 while (output
.pos
< output
.size
) {
290 size_t last_in_pos
= input
.pos
;
291 size_t last_out_pos
= output
.pos
;
292 zstd_ret
= ZSTD_decompressStream(dctx
, &output
, &input
);
294 if (ZSTD_isError(zstd_ret
)) {
300 * The ZSTD manual is vague about what to do if it reads
301 * the buffer partially, and we don't want to get stuck
302 * in an infinite loop where ZSTD_decompressStream
303 * returns > 0 waiting for another input chunk. So, we add
304 * a check which ensures that the loop makes some progress
307 if (last_in_pos
>= input
.pos
&&
308 last_out_pos
>= output
.pos
) {
314 * Make sure that we have the frame fully flushed here
315 * if not, we somehow managed to get uncompressed cluster
316 * greater then the cluster size, possibly because of its
324 assert(ret
== 0 || ret
== -EIO
);
329 static int qcow2_compress_pool_func(void *opaque
)
331 Qcow2CompressData
*data
= opaque
;
333 data
->ret
= data
->func(data
->dest
, data
->dest_size
,
334 data
->src
, data
->src_size
);
339 static ssize_t coroutine_fn
340 qcow2_co_do_compress(BlockDriverState
*bs
, void *dest
, size_t dest_size
,
341 const void *src
, size_t src_size
, Qcow2CompressFunc func
)
343 Qcow2CompressData arg
= {
345 .dest_size
= dest_size
,
347 .src_size
= src_size
,
351 qcow2_co_process(bs
, qcow2_compress_pool_func
, &arg
);
357 * qcow2_co_compress()
359 * Compress @src_size bytes of data using the compression
360 * method defined by the image compression type
362 * @dest - destination buffer, @dest_size bytes
363 * @src - source buffer, @src_size bytes
365 * Returns: compressed size on success
366 * a negative error code on failure
369 qcow2_co_compress(BlockDriverState
*bs
, void *dest
, size_t dest_size
,
370 const void *src
, size_t src_size
)
372 BDRVQcow2State
*s
= bs
->opaque
;
373 Qcow2CompressFunc fn
;
375 switch (s
->compression_type
) {
376 case QCOW2_COMPRESSION_TYPE_ZLIB
:
377 fn
= qcow2_zlib_compress
;
381 case QCOW2_COMPRESSION_TYPE_ZSTD
:
382 fn
= qcow2_zstd_compress
;
389 return qcow2_co_do_compress(bs
, dest
, dest_size
, src
, src_size
, fn
);
393 * qcow2_co_decompress()
395 * Decompress some data (not more than @src_size bytes) to produce exactly
396 * @dest_size bytes using the compression method defined by the image
399 * @dest - destination buffer, @dest_size bytes
400 * @src - source buffer, @src_size bytes
402 * Returns: 0 on success
403 * a negative error code on failure
406 qcow2_co_decompress(BlockDriverState
*bs
, void *dest
, size_t dest_size
,
407 const void *src
, size_t src_size
)
409 BDRVQcow2State
*s
= bs
->opaque
;
410 Qcow2CompressFunc fn
;
412 switch (s
->compression_type
) {
413 case QCOW2_COMPRESSION_TYPE_ZLIB
:
414 fn
= qcow2_zlib_decompress
;
418 case QCOW2_COMPRESSION_TYPE_ZSTD
:
419 fn
= qcow2_zstd_decompress
;
426 return qcow2_co_do_compress(bs
, dest
, dest_size
, src
, src_size
, fn
);
435 * Qcow2EncDecFunc: common prototype of qcrypto_block_encrypt() and
436 * qcrypto_block_decrypt() functions.
438 typedef int (*Qcow2EncDecFunc
)(QCryptoBlock
*block
, uint64_t offset
,
439 uint8_t *buf
, size_t len
, Error
**errp
);
441 typedef struct Qcow2EncDecData
{
447 Qcow2EncDecFunc func
;
450 static int qcow2_encdec_pool_func(void *opaque
)
452 Qcow2EncDecData
*data
= opaque
;
454 return data
->func(data
->block
, data
->offset
, data
->buf
, data
->len
, NULL
);
457 static int coroutine_fn
458 qcow2_co_encdec(BlockDriverState
*bs
, uint64_t host_offset
,
459 uint64_t guest_offset
, void *buf
, size_t len
,
460 Qcow2EncDecFunc func
)
462 BDRVQcow2State
*s
= bs
->opaque
;
463 Qcow2EncDecData arg
= {
465 .offset
= s
->crypt_physical_offset
? host_offset
: guest_offset
,
470 uint64_t sector_size
;
474 sector_size
= qcrypto_block_get_sector_size(s
->crypto
);
475 assert(QEMU_IS_ALIGNED(guest_offset
, sector_size
));
476 assert(QEMU_IS_ALIGNED(host_offset
, sector_size
));
477 assert(QEMU_IS_ALIGNED(len
, sector_size
));
479 return len
== 0 ? 0 : qcow2_co_process(bs
, qcow2_encdec_pool_func
, &arg
);
485 * Encrypts one or more contiguous aligned sectors
487 * @host_offset - underlying storage offset of the first sector of the
488 * data to be encrypted
490 * @guest_offset - guest (virtual) offset of the first sector of the
491 * data to be encrypted
493 * @buf - buffer with the data to encrypt, that after encryption
494 * will be written to the underlying storage device at
497 * @len - length of the buffer (must be a multiple of the encryption
500 * Depending on the encryption method, @host_offset and/or @guest_offset
501 * may be used for generating the initialization vector for
504 * Note that while the whole range must be aligned on sectors, it
505 * does not have to be aligned on clusters and can also cross cluster
509 qcow2_co_encrypt(BlockDriverState
*bs
, uint64_t host_offset
,
510 uint64_t guest_offset
, void *buf
, size_t len
)
512 return qcow2_co_encdec(bs
, host_offset
, guest_offset
, buf
, len
,
513 qcrypto_block_encrypt
);
519 * Decrypts one or more contiguous aligned sectors
520 * Similar to qcow2_co_encrypt
523 qcow2_co_decrypt(BlockDriverState
*bs
, uint64_t host_offset
,
524 uint64_t guest_offset
, void *buf
, size_t len
)
526 return qcow2_co_encdec(bs
, host_offset
, guest_offset
, buf
, len
,
527 qcrypto_block_decrypt
);