ZAP: Add by_dnode variants to lookup/prefetch_uint64
[zfs.git] / include / sys / arc.h
blob883c07b4ff3d27e1f1a600016dcd1392bc0dc977
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or https://opensource.org/licenses/CDDL-1.0.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
 * Copyright (c) 2012, 2016 by Delphix. All rights reserved.
 * Copyright (c) 2013 by Saso Kiselkov. All rights reserved.
 * Copyright (c) 2019, Allan Jude
 * Copyright (c) 2019, Klara Inc.
 */
29 #ifndef _SYS_ARC_H
30 #define _SYS_ARC_H
32 #include <sys/zfs_context.h>
34 #ifdef __cplusplus
35 extern "C" {
36 #endif
38 #include <sys/zio.h>
39 #include <sys/dmu.h>
40 #include <sys/spa.h>
41 #include <sys/zfs_refcount.h>
/*
 * Used by arc_flush() to inform arc_evict_state() that it should evict
 * all available buffers from the arc state being passed in.
 */
#define ARC_EVICT_ALL UINT64_MAX
/*
 * ZFS gets very unhappy when the maximum ARC size is smaller than the maximum
 * block size and a larger block is written. To leave some safety margin, we
 * limit the minimum for zfs_arc_max to the maximum transaction size.
 */
#define MIN_ARC_MAX DMU_MAX_ACCESS
/*
 * Record a logical size of x bytes in (hdr)->b_lsize. The value is stored
 * in units of (1 << SPA_MINBLOCKSHIFT) bytes; x is asserted to be aligned
 * to that unit, so the right shift drops no set bits.
 *
 * x appears in both the ASSERT and the store, so it may be evaluated more
 * than once: pass an expression without side effects.
 */
#define HDR_SET_LSIZE(hdr, x) do { \
	ASSERT(IS_P2ALIGNED((x), 1U << SPA_MINBLOCKSHIFT)); \
	(hdr)->b_lsize = ((x) >> SPA_MINBLOCKSHIFT); \
} while (0)
/*
 * Record a size of x bytes in (hdr)->b_psize. The value is stored in units
 * of (1 << SPA_MINBLOCKSHIFT) bytes; x is asserted to be aligned to that
 * unit, so the right shift drops no set bits.
 *
 * x appears in both the ASSERT and the store, so it may be evaluated more
 * than once: pass an expression without side effects.
 */
#define HDR_SET_PSIZE(hdr, x) do { \
	ASSERT(IS_P2ALIGNED((x), 1U << SPA_MINBLOCKSHIFT)); \
	(hdr)->b_psize = ((x) >> SPA_MINBLOCKSHIFT); \
} while (0)
/*
 * Read back b_lsize / b_psize as a byte count by scaling the stored value
 * up by (1 << SPA_MINBLOCKSHIFT). The shift is performed in the promoted
 * type of the field itself.
 */
#define HDR_GET_LSIZE(hdr) ((hdr)->b_lsize << SPA_MINBLOCKSHIFT)
#define HDR_GET_PSIZE(hdr) ((hdr)->b_psize << SPA_MINBLOCKSHIFT)
/*
 * Short names for the ARC structures. struct arc_buf_hdr is only named
 * here, not defined in this header.
 */
typedef struct arc_buf_hdr arc_buf_hdr_t;
typedef struct arc_buf arc_buf_t;
typedef struct arc_prune arc_prune_t;
74 * Because the ARC can store encrypted data, errors (not due to bugs) may arise
75 * while transforming data into its desired format - specifically, when
76 * decrypting, the key may not be present, or the HMAC may not be correct
77 * which signifies deliberate tampering with the on-disk state
78 * (assuming that the checksum was correct). If any error occurs, the "buf"
79 * parameter will be NULL.
81 typedef void arc_read_done_func_t(zio_t *zio, const zbookmark_phys_t *zb,
82 const blkptr_t *bp, arc_buf_t *buf, void *priv);
83 typedef void arc_write_done_func_t(zio_t *zio, arc_buf_t *buf, void *priv);
84 typedef void arc_prune_func_t(uint64_t bytes, void *priv);
86 /* Shared module parameters */
87 extern uint_t zfs_arc_average_blocksize;
88 extern int l2arc_exclude_special;
90 /* generic arc_done_func_t's which you can use */
91 arc_read_done_func_t arc_bcopy_func;
92 arc_read_done_func_t arc_getbuf_func;
94 /* generic arc_prune_func_t wrapper for callbacks */
95 struct arc_prune {
96 arc_prune_func_t *p_pfunc;
97 void *p_private;
98 uint64_t p_adjust;
99 list_node_t p_node;
100 zfs_refcount_t p_refcnt;
/* Eviction strategy selector; the numeric values are fixed explicitly. */
typedef enum arc_strategy {
	ARC_STRATEGY_META_ONLY = 0, /* Evict only meta data buffers */
	ARC_STRATEGY_META_BALANCED = 1, /* Evict data buffers if needed */
} arc_strategy_t;
/*
 * ARC flag bits. Every enumerator is a distinct single bit, covering
 * bits 0 through 30.
 */
typedef enum arc_flags
{
	/*
	 * Public flags that can be passed into the ARC by external consumers.
	 */
	ARC_FLAG_WAIT = 1 << 0, /* perform sync I/O */
	ARC_FLAG_NOWAIT = 1 << 1, /* perform async I/O */
	ARC_FLAG_PREFETCH = 1 << 2, /* I/O is a prefetch */
	ARC_FLAG_CACHED = 1 << 3, /* I/O was in cache */
	ARC_FLAG_L2CACHE = 1 << 4, /* cache in L2ARC */
	ARC_FLAG_UNCACHED = 1 << 5, /* evict after use */
	ARC_FLAG_PRESCIENT_PREFETCH = 1 << 6, /* long min lifespan */

	/*
	 * Private ARC flags. These flags are private ARC only flags that
	 * will show up in b_flags in the arc_buf_hdr_t. These flags should
	 * only be set by ARC code.
	 */
	ARC_FLAG_IN_HASH_TABLE = 1 << 7, /* buffer is hashed */
	ARC_FLAG_IO_IN_PROGRESS = 1 << 8, /* I/O in progress */
	ARC_FLAG_IO_ERROR = 1 << 9, /* I/O failed for buf */
	ARC_FLAG_INDIRECT = 1 << 10, /* indirect block */
	/* Indicates that block was read with ASYNC priority. */
	ARC_FLAG_PRIO_ASYNC_READ = 1 << 11,
	ARC_FLAG_L2_WRITING = 1 << 12, /* write in progress */
	ARC_FLAG_L2_EVICTED = 1 << 13, /* evicted during I/O */
	ARC_FLAG_L2_WRITE_HEAD = 1 << 14, /* head of write list */
	/*
	 * Encrypted or authenticated on disk (may be plaintext in memory).
	 * This header has b_crypt_hdr allocated. Does not include indirect
	 * blocks with checksums of MACs which will also have their X
	 * (encrypted) bit set in the bp.
	 */
	ARC_FLAG_PROTECTED = 1 << 15,
	/* data has not been authenticated yet */
	ARC_FLAG_NOAUTH = 1 << 16,
	/* indicates that the buffer contains metadata (otherwise, data) */
	ARC_FLAG_BUFC_METADATA = 1 << 17,

	/* Flags specifying whether optional hdr struct fields are defined */
	ARC_FLAG_HAS_L1HDR = 1 << 18,
	ARC_FLAG_HAS_L2HDR = 1 << 19,

	/*
	 * Indicates the arc_buf_hdr_t's b_pdata matches the on-disk data.
	 * This allows the l2arc to use the blkptr's checksum to verify
	 * the data without having to store the checksum in the hdr.
	 */
	ARC_FLAG_COMPRESSED_ARC = 1 << 20,
	ARC_FLAG_SHARED_DATA = 1 << 21,

	/*
	 * Fail this arc_read() (with ENOENT) if the data is not already present
	 * in cache.
	 */
	ARC_FLAG_CACHED_ONLY = 1 << 22,

	/*
	 * Don't instantiate an arc_buf_t for arc_read_done.
	 */
	ARC_FLAG_NO_BUF = 1 << 23,

	/*
	 * The arc buffer's compression mode is stored in the top 7 bits of the
	 * flags field, so these dummy flags are included so that MDB can
	 * interpret the enum properly.
	 */
	ARC_FLAG_COMPRESS_0 = 1 << 24,
	ARC_FLAG_COMPRESS_1 = 1 << 25,
	ARC_FLAG_COMPRESS_2 = 1 << 26,
	ARC_FLAG_COMPRESS_3 = 1 << 27,
	ARC_FLAG_COMPRESS_4 = 1 << 28,
	ARC_FLAG_COMPRESS_5 = 1 << 29,
	ARC_FLAG_COMPRESS_6 = 1 << 30
} arc_flags_t;
/* Per-arc_buf_t flag bits; these are the values kept in arc_buf_t.b_flags. */
typedef enum arc_buf_flags {
	ARC_BUF_FLAG_SHARED = 1 << 0,
	ARC_BUF_FLAG_COMPRESSED = 1 << 1,
	/*
	 * indicates whether this arc_buf_t is encrypted, regardless of
	 * state on-disk
	 */
	ARC_BUF_FLAG_ENCRYPTED = 1 << 2
} arc_buf_flags_t;
194 struct arc_buf {
195 arc_buf_hdr_t *b_hdr;
196 arc_buf_t *b_next;
197 void *b_data;
198 arc_buf_flags_t b_flags;
/*
 * What a buffer holds. ARC_BUFC_NUMTYPES is the count of real values
 * and must stay last.
 */
typedef enum arc_buf_contents {
	ARC_BUFC_DATA, /* buffer contains data */
	ARC_BUFC_METADATA, /* buffer contains metadata */
	ARC_BUFC_NUMTYPES
} arc_buf_contents_t;
/*
 * The following breakdowns of arc_size exist for kstat only.
 * ARC_SPACE_NUMTYPES is the count of real values and must stay last.
 */
typedef enum arc_space_type {
	ARC_SPACE_DATA,
	ARC_SPACE_META,
	ARC_SPACE_HDRS,
	ARC_SPACE_L2HDRS,
	ARC_SPACE_DBUF,
	ARC_SPACE_DNODE,
	ARC_SPACE_BONUS,
	ARC_SPACE_ABD_CHUNK_WASTE,
	ARC_SPACE_NUMTYPES
} arc_space_type_t;
/*
 * Identifiers for the ARC states. ARC_STATE_NUMTYPES is the count of
 * real values and must stay last.
 */
typedef enum arc_state_type {
	ARC_STATE_ANON,
	ARC_STATE_MRU,
	ARC_STATE_MRU_GHOST,
	ARC_STATE_MFU,
	ARC_STATE_MFU_GHOST,
	ARC_STATE_L2C_ONLY,
	ARC_STATE_UNCACHED,
	ARC_STATE_NUMTYPES
} arc_state_type_t;
233 typedef struct arc_buf_info {
234 arc_state_type_t abi_state_type;
235 arc_buf_contents_t abi_state_contents;
236 uint32_t abi_flags;
237 uint32_t abi_bufcnt;
238 uint64_t abi_size;
239 uint64_t abi_spa;
240 uint64_t abi_access;
241 uint32_t abi_mru_hits;
242 uint32_t abi_mru_ghost_hits;
243 uint32_t abi_mfu_hits;
244 uint32_t abi_mfu_ghost_hits;
245 uint32_t abi_l2arc_hits;
246 uint32_t abi_holds;
247 uint64_t abi_l2arc_dattr;
248 uint64_t abi_l2arc_asize;
249 enum zio_compress abi_l2arc_compress;
250 } arc_buf_info_t;
/*
 * Flags returned by arc_cached; describes which part of the arc
 * the block is cached in. Each flag is a distinct bit, so several can be
 * combined in one value.
 */
#define ARC_CACHED_EMBEDDED (1U << 0)
#define ARC_CACHED_IN_L1 (1U << 1)
#define ARC_CACHED_IN_MRU (1U << 2)
#define ARC_CACHED_IN_MFU (1U << 3)
#define ARC_CACHED_IN_L2 (1U << 4)
262 void arc_space_consume(uint64_t space, arc_space_type_t type);
263 void arc_space_return(uint64_t space, arc_space_type_t type);
264 boolean_t arc_is_metadata(arc_buf_t *buf);
265 boolean_t arc_is_encrypted(arc_buf_t *buf);
266 boolean_t arc_is_unauthenticated(arc_buf_t *buf);
267 enum zio_compress arc_get_compression(arc_buf_t *buf);
268 void arc_get_raw_params(arc_buf_t *buf, boolean_t *byteorder, uint8_t *salt,
269 uint8_t *iv, uint8_t *mac);
270 int arc_untransform(arc_buf_t *buf, spa_t *spa, const zbookmark_phys_t *zb,
271 boolean_t in_place);
272 void arc_convert_to_raw(arc_buf_t *buf, uint64_t dsobj, boolean_t byteorder,
273 dmu_object_type_t ot, const uint8_t *salt, const uint8_t *iv,
274 const uint8_t *mac);
275 arc_buf_t *arc_alloc_buf(spa_t *spa, const void *tag, arc_buf_contents_t type,
276 int32_t size);
277 arc_buf_t *arc_alloc_compressed_buf(spa_t *spa, const void *tag,
278 uint64_t psize, uint64_t lsize, enum zio_compress compression_type,
279 uint8_t complevel);
280 arc_buf_t *arc_alloc_raw_buf(spa_t *spa, const void *tag, uint64_t dsobj,
281 boolean_t byteorder, const uint8_t *salt, const uint8_t *iv,
282 const uint8_t *mac, dmu_object_type_t ot, uint64_t psize, uint64_t lsize,
283 enum zio_compress compression_type, uint8_t complevel);
284 uint8_t arc_get_complevel(arc_buf_t *buf);
285 arc_buf_t *arc_loan_buf(spa_t *spa, boolean_t is_metadata, int size);
286 arc_buf_t *arc_loan_compressed_buf(spa_t *spa, uint64_t psize, uint64_t lsize,
287 enum zio_compress compression_type, uint8_t complevel);
288 arc_buf_t *arc_loan_raw_buf(spa_t *spa, uint64_t dsobj, boolean_t byteorder,
289 const uint8_t *salt, const uint8_t *iv, const uint8_t *mac,
290 dmu_object_type_t ot, uint64_t psize, uint64_t lsize,
291 enum zio_compress compression_type, uint8_t complevel);
292 void arc_return_buf(arc_buf_t *buf, const void *tag);
293 void arc_loan_inuse_buf(arc_buf_t *buf, const void *tag);
294 void arc_buf_destroy(arc_buf_t *buf, const void *tag);
295 void arc_buf_info(arc_buf_t *buf, arc_buf_info_t *abi, int state_index);
296 uint64_t arc_buf_size(arc_buf_t *buf);
297 uint64_t arc_buf_lsize(arc_buf_t *buf);
298 void arc_buf_access(arc_buf_t *buf);
299 void arc_release(arc_buf_t *buf, const void *tag);
300 int arc_released(arc_buf_t *buf);
301 void arc_buf_sigsegv(int sig, siginfo_t *si, void *unused);
302 void arc_buf_freeze(arc_buf_t *buf);
303 void arc_buf_thaw(arc_buf_t *buf);
/*
 * arc_referenced() is a real function only when ZFS_DEBUG is defined.
 * Otherwise it is a macro that always yields 0; its argument sits inside
 * sizeof, so it is type-checked but never evaluated.
 */
#ifdef ZFS_DEBUG
int arc_referenced(arc_buf_t *buf);
#else
#define arc_referenced(buf) ((void) sizeof (buf), 0)
#endif
310 int arc_read(zio_t *pio, spa_t *spa, const blkptr_t *bp,
311 arc_read_done_func_t *done, void *priv, zio_priority_t priority,
312 int flags, arc_flags_t *arc_flags, const zbookmark_phys_t *zb);
313 zio_t *arc_write(zio_t *pio, spa_t *spa, uint64_t txg, blkptr_t *bp,
314 arc_buf_t *buf, boolean_t uncached, boolean_t l2arc, const zio_prop_t *zp,
315 arc_write_done_func_t *ready, arc_write_done_func_t *child_ready,
316 arc_write_done_func_t *done, void *priv, zio_priority_t priority,
317 int zio_flags, const zbookmark_phys_t *zb);
319 arc_prune_t *arc_add_prune_callback(arc_prune_func_t *func, void *priv);
320 void arc_remove_prune_callback(arc_prune_t *p);
321 void arc_freed(spa_t *spa, const blkptr_t *bp);
322 int arc_cached(spa_t *spa, const blkptr_t *bp);
324 void arc_flush(spa_t *spa, boolean_t retry);
325 void arc_tempreserve_clear(uint64_t reserve);
326 int arc_tempreserve_space(spa_t *spa, uint64_t reserve, uint64_t txg);
328 uint64_t arc_all_memory(void);
329 uint64_t arc_default_max(uint64_t min, uint64_t allmem);
330 uint64_t arc_target_bytes(void);
331 void arc_set_limits(uint64_t);
332 void arc_init(void);
333 void arc_fini(void);
336 * Level 2 ARC
339 void l2arc_add_vdev(spa_t *spa, vdev_t *vd);
340 void l2arc_remove_vdev(vdev_t *vd);
341 boolean_t l2arc_vdev_present(vdev_t *vd);
342 void l2arc_rebuild_vdev(vdev_t *vd, boolean_t reopen);
343 boolean_t l2arc_range_check_overlap(uint64_t bottom, uint64_t top,
344 uint64_t check);
345 void l2arc_init(void);
346 void l2arc_fini(void);
347 void l2arc_start(void);
348 void l2arc_stop(void);
349 void l2arc_spa_rebuild_start(spa_t *spa);
351 #ifndef _KERNEL
352 extern boolean_t arc_watch;
353 #endif
355 #ifdef __cplusplus
357 #endif
359 #endif /* _SYS_ARC_H */