buf.h
1 /* 2 * Copyright (c) 2000-2016 Apple Computer, Inc. All rights reserved. 3 * 4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ 5 * 6 * This file contains Original Code and/or Modifications of Original Code 7 * as defined in and that are subject to the Apple Public Source License 8 * Version 2.0 (the 'License'). You may not use this file except in 9 * compliance with the License. The rights granted to you under the License 10 * may not be used to create, or enable the creation or redistribution of, 11 * unlawful or unlicensed copies of an Apple operating system, or to 12 * circumvent, violate, or enable the circumvention or violation of, any 13 * terms of an Apple operating system software license agreement. 14 * 15 * Please obtain a copy of the License at 16 * http://www.opensource.apple.com/apsl/ and read it before using this file. 17 * 18 * The Original Code and all software distributed under the License are 19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER 20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, 21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, 22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. 23 * Please see the License for the specific language governing rights and 24 * limitations under the License. 25 * 26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ 27 */ 28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */ 29 /* 30 * Copyright (c) 1982, 1986, 1989, 1993 31 * The Regents of the University of California. All rights reserved. 32 * (c) UNIX System Laboratories, Inc. 33 * All or some portions of this file are derived from material licensed 34 * to the University of California by American Telephone and Telegraph 35 * Co. or Unix System Laboratories, Inc. and are reproduced herein with 36 * the permission of UNIX System Laboratories, Inc. 37 * 38 * Redistribution and use in source and binary forms, with or without 39 * modification, are permitted provided that the following conditions 40 * are met: 41 * 1. Redistributions of source code must retain the above copyright 42 * notice, this list of conditions and the following disclaimer. 43 * 2. Redistributions in binary form must reproduce the above copyright 44 * notice, this list of conditions and the following disclaimer in the 45 * documentation and/or other materials provided with the distribution. 46 * 3. All advertising materials mentioning features or use of this software 47 * must display the following acknowledgement: 48 * This product includes software developed by the University of 49 * California, Berkeley and its contributors. 50 * 4. Neither the name of the University nor the names of its contributors 51 * may be used to endorse or promote products derived from this software 52 * without specific prior written permission. 53 * 54 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 55 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 56 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 57 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 58 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 59 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 60 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 61 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 62 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 63 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 64 * SUCH DAMAGE. 65 * 66 * @(#)buf.h 8.9 (Berkeley) 3/30/95 67 */ 68 69 #ifndef _SYS_BUF_H_ 70 #define _SYS_BUF_H_ 71 72 #include <sys/cdefs.h> 73 #include <sys/kernel_types.h> 74 #include <sys/ucred.h> 75 #include <mach/memory_object_types.h> 76 77 78 #define B_WRITE 0x00000000 /* Write buffer (pseudo flag). */ 79 #define B_READ 0x00000001 /* Read buffer. */ 80 #define B_ASYNC 0x00000002 /* Start I/O, do not wait. */ 81 #define B_NOCACHE 0x00000004 /* Do not cache block after use. */ 82 #define B_DELWRI 0x00000008 /* Delay I/O until buffer reused. */ 83 #define B_LOCKED 0x00000010 /* Locked in core (not reusable). */ 84 #define B_PHYS 0x00000020 /* I/O to user memory. */ 85 #define B_CLUSTER 0x00000040 /* UPL based I/O generated by cluster layer */ 86 #define B_PAGEIO 0x00000080 /* Page in/out */ 87 #define B_META 0x00000100 /* buffer contains meta-data. */ 88 #define B_RAW 0x00000200 /* Set by physio for raw transfers. */ 89 #define B_FUA 0x00000400 /* Write-through disk cache(if supported) */ 90 #define B_PASSIVE 0x00000800 /* PASSIVE I/Os are ignored by THROTTLE I/O */ 91 #define B_IOSTREAMING 0x00001000 /* sequential access pattern detected */ 92 #define B_THROTTLED_IO 0x00002000 /* low priority I/O (deprecated) */ 93 #define B_ENCRYPTED_IO 0x00004000 /* Encrypted I/O */ 94 #define B_STATICCONTENT 0x00008000 /* Buffer is likely to remain unaltered */ 95 96 /* 97 * make sure to check when adding flags that 98 * that the new flags don't overlap the definitions 99 * in buf_internal.h 100 */ 101 102 __BEGIN_DECLS 103 104 /*! 105 * @function buf_markaged 106 * @abstract Mark a buffer as "aged," i.e. as a good candidate to be discarded and reused after buf_brelse(). 107 * @param bp Buffer to mark. 108 */ 109 void buf_markaged(buf_t bp); 110 111 /*! 112 * @function buf_markinvalid 113 * @abstract Mark a buffer as not having valid data and being ready for immediate reuse after buf_brelse(). 114 * @param bp Buffer to mark. 115 */ 116 void buf_markinvalid(buf_t bp); 117 118 /*! 119 * @function buf_markdelayed 120 * @abstract Mark a buffer as a delayed write: mark it dirty without actually scheduling I/O. 121 * @discussion Data will be flushed to disk at some later time, not with brelse(). A sync()/fsync() 122 * or pressure necessitating reuse of the buffer will cause it to be written back to disk. 123 * @param bp Buffer to mark. 124 */ 125 void buf_markdelayed(buf_t bp); 126 127 void buf_markclean(buf_t); 128 129 /*! 130 * @function buf_markeintr 131 * @abstract Mark a buffer as having been interrupted during I/O. 132 * @discussion Waiters for I/O to complete (buf_biowait()) will return with EINTR when woken up. 133 * buf_markeintr does not itself do a wakeup. 134 * @param bp Buffer to mark. 135 */ 136 void buf_markeintr(buf_t bp); 137 138 /*! 139 * @function buf_markfua 140 * @abstract Mark a buffer for write through disk cache, if disk supports it. 141 * @param bp Buffer to mark. 142 */ 143 void buf_markfua(buf_t bp); 144 145 /*! 146 * @function buf_fua 147 * @abstract Check if a buffer is marked for write through disk caches. 148 * @param bp Buffer to test. 149 * @return Nonzero if buffer is marked for write-through, 0 if not. 150 */ 151 int buf_fua(buf_t bp); 152 153 /*! 154 * @function buf_valid 155 * @abstract Check if a buffer contains valid data. 156 * @param bp Buffer to test. 157 * @return Nonzero if buffer has valid data, 0 if not. 158 */ 159 int buf_valid(buf_t bp); 160 161 /*! 162 * @function buf_fromcache 163 * @abstract Check if a buffer's data was found in core. 164 * @discussion Will return truth after a buf_getblk that finds a valid buffer in the cache or the relevant 165 * data in core (but not in a buffer). 166 * @param bp Buffer to test. 167 * @return Nonzero if we got this buffer's data without doing I/O, 0 if not. 168 */ 169 int buf_fromcache(buf_t bp); 170 171 /*! 172 * @function buf_upl 173 * @abstract Get the upl (Universal Page List) associated with a buffer. 174 * @discussion Buffers allocated with buf_alloc() are not returned with a upl, and 175 * traditional buffers only have a upl while an I/O is in progress. 176 * @param bp Buffer whose upl to grab. 177 * @return Buffer's upl if it has one, else NULL. 178 */ 179 void * buf_upl(buf_t bp); 180 181 /*! 182 * @function buf_uploffset 183 * @abstract Get the offset into a UPL at which this buffer begins. 184 * @discussion This function should only be called on iobufs, i.e. buffers allocated with buf_alloc(). 185 * @param bp Buffer whose uploffset to grab. 186 * @return Buffer's uploffset--does not check whether that value makes sense for this buffer. 187 */ 188 uint32_t buf_uploffset(buf_t bp); 189 190 /*! 191 * @function buf_rcred 192 * @abstract Get the credential associated with a buffer for reading. 193 * @discussion No reference is taken; if the credential is to be held on to persistently, an additional 194 * reference must be taken with kauth_cred_ref. 195 * @param bp Buffer whose credential to grab. 196 * @return Credential if it exists, else NULL. 197 */ 198 kauth_cred_t buf_rcred(buf_t bp); 199 200 /*! 201 * @function buf_wcred 202 * @abstract Get the credential associated with a buffer for writing. 203 * @discussion No reference is taken; if the credential is to be held on to persistently, an additional 204 * reference must be taken with kauth_cred_ref. 205 * @param bp Buffer whose credential to grab. 206 * @return Credential if it exists, else NULL. 207 */ 208 kauth_cred_t buf_wcred(buf_t bp); 209 210 /*! 211 * @function buf_proc 212 * @abstract Get the process associated with this buffer. 213 * @discussion buf_proc() will generally return NULL; a process is currently only associated with 214 * a buffer in the event of a physio() call. 215 * @param bp Buffer whose associated process to find. 216 * @return Associated process, possibly NULL. 217 */ 218 proc_t buf_proc(buf_t bp); 219 220 /*! 221 * @function buf_dirtyoff 222 * @abstract Get the starting offset of the dirty region associated with a buffer. 223 * @discussion The dirty offset is zero unless someone explicitly calls buf_setdirtyoff() (which the kernel does not). 224 * @param bp Buffer whose dirty offset to get. 225 * @return Dirty offset (0 if not explicitly changed). 226 */ 227 uint32_t buf_dirtyoff(buf_t bp); 228 229 /*! 230 * @function buf_dirtyend 231 * @abstract Get the ending offset of the dirty region associated with a buffer. 232 * @discussion If the buffer's data was found incore and dirty, the dirty end is the size of the block; otherwise, unless 233 * someone outside of xnu explicitly changes it by calling buf_setdirtyend(), it will be zero. 234 * @param bp Buffer whose dirty end to get. 235 * @return 0 if buffer is found clean; size of buffer if found dirty. Can be set to any value by callers of buf_setdirtyend(). 236 */ 237 uint32_t buf_dirtyend(buf_t bp); 238 239 /*! 240 * @function buf_setdirtyoff 241 * @abstract Set the starting offset of the dirty region associated with a buffer. 242 * @discussion This value is zero unless someone set it explicitly. 243 * @param bp Buffer whose dirty end to set. 244 */ 245 void buf_setdirtyoff(buf_t bp, uint32_t); 246 247 /*! 248 * @function buf_setdirtyend 249 * @abstract Set the ending offset of the dirty region associated with a buffer. 250 * @discussion If the buffer's data was found incore and dirty, the dirty end is the size of the block; otherwise, unless 251 * someone outside of xnu explicitly changes it by calling buf_setdirtyend(), it will be zero. 252 * @param bp Buffer whose dirty end to set. 253 */ 254 void buf_setdirtyend(buf_t bp, uint32_t); 255 256 /*! 257 * @function buf_error 258 * @abstract Get the error value associated with a buffer. 259 * @discussion Errors are set with buf_seterror(). 260 * @param bp Buffer whose error value to retrieve. 261 * @return Error value, directly. 262 */ 263 errno_t buf_error(buf_t bp); 264 265 /*! 266 * @function buf_seterror 267 * @abstract Set an error value on a buffer. 268 * @param bp Buffer whose error value to set. 269 */ 270 void buf_seterror(buf_t bp, errno_t); 271 272 /*! 273 * @function buf_setflags 274 * @abstract Set flags on a buffer. 275 * @discussion buffer_flags |= flags 276 * @param bp Buffer whose flags to set. 277 * @param flags Flags to add to buffer's mask. B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA 278 */ 279 void buf_setflags(buf_t bp, int32_t flags); 280 281 /*! 282 * @function buf_clearflags 283 * @abstract Clear flags on a buffer. 284 * @discussion buffer_flags &= ~flags 285 * @param bp Buffer whose flags to clear. 286 * @param flags Flags to remove from buffer's mask. B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA 287 */ 288 void buf_clearflags(buf_t bp, int32_t flags); 289 290 /*! 291 * @function buf_flags 292 * @abstract Get flags set on a buffer. 293 * @discussion Valid flags are B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA. 294 * @param bp Buffer whose flags to grab. 295 * @return flags. 296 */ 297 int32_t buf_flags(buf_t bp); 298 299 /*! 300 * @function buf_reset 301 * @abstract Reset I/O flag state on a buffer. 302 * @discussion Clears current flags on a buffer (internal and external) and allows some new flags to be set. 303 * Used perhaps to prepare an iobuf for reuse. 304 * @param bp Buffer whose flags to grab. 305 * @param flags Flags to set on buffer: B_READ, B_WRITE, B_ASYNC, B_NOCACHE. 306 */ 307 void buf_reset(buf_t bp, int32_t flags); 308 309 /*! 310 * @function buf_map 311 * @abstract Get virtual mappings for buffer data. 312 * @discussion For buffers created through buf_getblk() (i.e. traditional buffer cache usage), 313 * buf_map() just returns the address at which data was mapped by but_getblk(). For a B_CLUSTER buffer, i.e. an iobuf 314 * whose upl state is managed manually, there are two possibilities. If the buffer was created 315 * with an underlying "real" buffer through cluster_bp(), the mapping of the "real" buffer is returned. 316 * Otherwise, the buffer was created with buf_alloc() and buf_setupl() was subsequently called; buf_map() 317 * will call ubc_upl_map() to get a mapping for the buffer's upl and return the start of that mapping 318 * plus the buffer's upl offset (set in buf_setupl()). In the last case, buf_unmap() must later be called 319 * to tear down the mapping. NOTE: buf_map() does not set the buffer data pointer; this must be done with buf_setdataptr(). 320 * @param bp Buffer whose mapping to find or create. 321 * @param io_addr Destination for mapping address. 322 * @return 0 for success, ENOMEM if unable to map the buffer. 323 */ 324 errno_t buf_map(buf_t bp, caddr_t *io_addr); 325 326 /*! 327 * @function buf_unmap 328 * @abstract Release mappings for buffer data. 329 * @discussion For buffers created through buf_getblk() (i.e. traditional buffer cache usage), 330 * buf_unmap() does nothing; buf_brelse() will take care of unmapping. For a B_CLUSTER buffer, i.e. an iobuf 331 * whose upl state is managed manually, there are two possibilities. If the buffer was created 332 * with an underlying "real" buffer through cluster_bp(), buf_unmap() does nothing; buf_brelse() on the 333 * underlying buffer will tear down the mapping. Otherwise, the buffer was created with buf_alloc() and 334 * buf_setupl() was subsequently called; buf_map() created the mapping. In this case, buf_unmap() will 335 * unmap the buffer. 336 * @param bp Buffer whose mapping to find or create. 337 * @return 0 for success, EINVAL if unable to unmap buffer. 338 */ 339 errno_t buf_unmap(buf_t bp); 340 341 /*! 342 * @function buf_setdrvdata 343 * @abstract Set driver-specific data on a buffer. 344 * @param bp Buffer whose driver-data to set. 345 * @param drvdata Opaque driver data. 346 */ 347 void buf_setdrvdata(buf_t bp, void *drvdata); 348 349 /*! 350 * @function buf_setdrvdata 351 * @abstract Get driver-specific data from a buffer. 352 * @param bp Buffer whose driver data to get. 353 * @return Opaque driver data. 354 */ 355 void * buf_drvdata(buf_t bp); 356 357 /*! 358 * @function buf_setfsprivate 359 * @abstract Set filesystem-specific data on a buffer. 360 * @param bp Buffer whose filesystem data to set. 361 * @param fsprivate Opaque filesystem data. 362 */ 363 void buf_setfsprivate(buf_t bp, void *fsprivate); 364 365 /*! 366 * @function buf_fsprivate 367 * @abstract Get filesystem-specific data from a buffer. 368 * @param bp Buffer whose filesystem data to get. 369 * @return Opaque filesystem data. 370 */ 371 void * buf_fsprivate(buf_t bp); 372 373 /*! 374 * @function buf_blkno 375 * @abstract Get physical block number associated with a buffer, in the sense of VNOP_BLOCKMAP. 376 * @discussion When a buffer's physical block number is the same is its logical block number, then the physical 377 * block number is considered uninitialized. A physical block number of -1 indicates that there is no valid 378 * physical mapping (e.g. the logical block is invalid or corresponds to a sparse region in a file). Physical 379 * block number is normally set by the cluster layer or by buf_getblk(). 380 * @param bp Buffer whose physical block number to get. 381 * @return Block number. 382 */ 383 daddr64_t buf_blkno(buf_t bp); 384 385 /*! 386 * @function buf_lblkno 387 * @abstract Get logical block number associated with a buffer. 388 * @discussion Logical block number is set on traditionally-used buffers by an argument passed to buf_getblk(), 389 * for example by buf_bread(). 390 * @param bp Buffer whose logical block number to get. 391 * @return Block number. 392 */ 393 daddr64_t buf_lblkno(buf_t bp); 394 395 /*! 396 * @function buf_setblkno 397 * @abstract Set physical block number associated with a buffer. 398 * @discussion Physical block number is generally set by the cluster layer or by buf_getblk(). 399 * @param bp Buffer whose physical block number to set. 400 * @param blkno Block number to set. 401 */ 402 void buf_setblkno(buf_t bp, daddr64_t blkno); 403 404 /*! 405 * @function buf_setlblkno 406 * @abstract Set logical block number associated with a buffer. 407 * @discussion Logical block number is set on traditionally-used buffers by an argument passed to buf_getblk(), 408 * for example by buf_bread(). 409 * @param bp Buffer whose logical block number to set. 410 * @param lblkno Block number to set. 411 */ 412 void buf_setlblkno(buf_t bp, daddr64_t lblkno); 413 414 /*! 415 * @function buf_count 416 * @abstract Get count of valid bytes in a buffer. This may be less than the space allocated to the buffer. 417 * @param bp Buffer whose byte count to get. 418 * @return Byte count. 419 */ 420 uint32_t buf_count(buf_t bp); 421 422 /*! 423 * @function buf_size 424 * @abstract Get size of data region allocated to a buffer. 425 * @discussion May be larger than amount of valid data in buffer. 426 * @param bp Buffer whose size to get. 427 * @return Size. 428 */ 429 uint32_t buf_size(buf_t bp); 430 431 /*! 432 * @function buf_resid 433 * @abstract Get a count of bytes which were not consumed by an I/O on a buffer. 434 * @discussion Set when an I/O operations completes. 435 * @param bp Buffer whose outstanding count to get. 436 * @return Count of unwritten/unread bytes. 437 */ 438 uint32_t buf_resid(buf_t bp); 439 440 /*! 441 * @function buf_setcount 442 * @abstract Set count of valid bytes in a buffer. This may be less than the space allocated to the buffer. 443 * @param bp Buffer whose byte count to set. 444 * @param bcount Count to set. 445 */ 446 void buf_setcount(buf_t bp, uint32_t bcount); 447 448 /*! 449 * @function buf_setsize 450 * @abstract Set size of data region allocated to a buffer. 451 * @discussion May be larger than amount of valid data in buffer. Should be used by 452 * code which is manually providing storage for an iobuf, one allocated with buf_alloc(). 453 * @param bp Buffer whose size to set. 454 */ 455 void buf_setsize(buf_t bp, uint32_t); 456 457 /*! 458 * @function buf_setresid 459 * @abstract Set a count of bytes outstanding for I/O in a buffer. 460 * @discussion Set when an I/O operations completes. Examples: called by IOStorageFamily when I/O 461 * completes, often called on an "original" buffer when using a manipulated buffer to perform I/O 462 * on behalf of the first. 463 * @param bp Buffer whose outstanding count to set. 464 */ 465 void buf_setresid(buf_t bp, uint32_t resid); 466 467 /*! 468 * @function buf_setdataptr 469 * @abstract Set the address at which a buffer's data will be stored. 470 * @discussion In traditional buffer use, the data pointer will be set automatically. This routine is 471 * useful with iobufs (allocated with buf_alloc()). 472 * @param bp Buffer whose data pointer to set. 473 * @param data Pointer to data region. 474 */ 475 void buf_setdataptr(buf_t bp, uintptr_t data); 476 477 /*! 478 * @function buf_dataptr 479 * @abstract Get the address at which a buffer's data is stored; for iobufs, this must 480 * be set with buf_setdataptr(). See buf_map(). 481 * @param bp Buffer whose data pointer to retrieve. 482 * @return Data pointer; NULL if unset. 483 */ 484 uintptr_t buf_dataptr(buf_t bp); 485 486 /*! 487 * @function buf_vnode 488 * @abstract Get the vnode associated with a buffer. 489 * @discussion Every buffer is associated with a file. Because there is an I/O in flight, 490 * there is an iocount on this vnode; it is returned WITHOUT an extra iocount, and vnode_put() 491 * need NOT be called. 492 * @param bp Buffer whose vnode to retrieve. 493 * @return Buffer's vnode. 494 */ 495 vnode_t buf_vnode(buf_t bp); 496 497 /*! 498 * @function buf_setvnode 499 * @abstract Set the vnode associated with a buffer. 500 * @discussion This call need not be used on traditional buffers; it is for use with iobufs. 501 * @param bp Buffer whose vnode to set. 502 * @param vp The vnode to attach to the buffer. 503 */ 504 void buf_setvnode(buf_t bp, vnode_t vp); 505 506 /*! 507 * @function buf_device 508 * @abstract Get the device ID associated with a buffer. 509 * @discussion In traditional buffer use, this value is NODEV until buf_strategy() is called unless 510 * buf_getblk() was passed a device vnode. It is set on an iobuf if buf_alloc() is passed a device 511 * vnode or if buf_setdevice() is called. 512 * @param bp Buffer whose device ID to retrieve. 513 * @return Device id. 514 */ 515 dev_t buf_device(buf_t bp); 516 517 /*! 518 * @function buf_setdevice 519 * @abstract Set the device associated with a buffer. 520 * @discussion A buffer's device is set in buf_strategy() (or in buf_getblk() if the file is a device). 521 * It is also set on an iobuf if buf_alloc() is passed a device vnode. 522 * @param bp Buffer whose device ID to set. 523 * @param vp Device to set on the buffer. 524 * @return 0 for success, EINVAL if vp is not a device file. 525 */ 526 errno_t buf_setdevice(buf_t bp, vnode_t vp); 527 528 /*! 529 * @function buf_strategy 530 * @abstract Pass an I/O request for a buffer down to the device layer. 531 * @discussion This is one of the most important routines in the buffer cache layer. For buffers obtained 532 * through buf_getblk, it handles finding physical block numbers for the I/O (with VNOP_BLKTOOFF and 533 * VNOP_BLOCKMAP), packaging the I/O into page-sized chunks, and initiating I/O on the disk by calling 534 * the device's strategy routine. If a buffer's UPL has been set manually with buf_setupl(), it assumes 535 * that the request is already correctly configured with a block number and a size divisible by page size 536 * and will just call directly to the device. 537 * @param devvp Device on which to perform I/O 538 * @param ap vnop_strategy_args structure (most importantly, a buffer). 539 * @return 0 for success, or errors from filesystem or device layers. 540 */ 541 errno_t buf_strategy(vnode_t devvp, void *ap); 542 543 /* 544 * Flags for buf_invalblkno() 545 */ 546 #define BUF_WAIT 0x01 547 548 /*! 549 * @function buf_invalblkno 550 * @abstract Invalidate a filesystem logical block in a file. 551 * @discussion buf_invalblkno() tries to make the data for a given block in a file 552 * invalid; if the buffer for that block is found in core and is not busy, we mark it 553 * invalid and call buf_brelse() (see "flags" param for what happens if the buffer is busy). 554 * buf_brelse(), noticing that it is invalid, will 555 * will return the buffer to the empty-buffer list and tell the VM subsystem to abandon 556 * the relevant pages. Data will not be written to backing store--it will be cast aside. 557 * Note that this function will only work if the block in question has been 558 * obtained with a buf_getblk(). If data has been read into core without using 559 * traditional buffer cache routines, buf_invalblkno() will not be able to invalidate it--this 560 * includes the use of iobufs. 561 * @param vp vnode whose block to invalidate. 562 * @param lblkno Logical block number. 563 * @param flags BUF_WAIT: wait for busy buffers to become unbusy and invalidate them then. Otherwise, 564 * just return EBUSY for busy blocks. 565 * @return 0 for success, EINVAL if vp is not a device file. 566 */ 567 errno_t buf_invalblkno(vnode_t vp, daddr64_t lblkno, int flags); 568 569 /*! 570 * @function buf_callback 571 * @abstract Get the function set to be called when I/O on a buffer completes. 572 * @discussion A function returned by buf_callback was originally set with buf_setcallback(). 573 * @param bp Buffer whose callback to get. 574 * @return 0 for success, or errors from filesystem or device layers. 575 */ 576 void * buf_callback(buf_t bp); 577 578 /*! 579 * @function buf_setcallback 580 * @abstract Set a function to be called once when I/O on a buffer completes. 581 * @discussion A one-shot callout set with buf_setcallback() will be called from buf_biodone() 582 * when I/O completes. It will be passed the "transaction" argument as well as the buffer. 583 * buf_setcallback() also marks the buffer as B_ASYNC. 584 * @param bp Buffer whose callback to set. 585 * @param callback function to use as callback. 586 * @param transaction Additional argument to callback function. 587 * @return 0; always succeeds. 588 */ 589 errno_t buf_setcallback(buf_t bp, void (*callback)(buf_t, void *), void *transaction); 590 591 /*! 592 * @function buf_setupl 593 * @abstract Set the UPL (Universal Page List), and offset therein, on a buffer. 594 * @discussion buf_setupl() should only be called on buffers allocated with buf_alloc(). 595 * A subsequent call to buf_map() will map the UPL and give back the address at which data 596 * begins. After buf_setupl() is called, a buffer is marked B_CLUSTER; when this is the case, 597 * buf_strategy() assumes that a buffer is correctly configured to be passed to the device 598 * layer without modification. Passing a NULL upl will clear the upl and the B_CLUSTER flag on the 599 * buffer. 600 * @param bp Buffer whose upl to set. 601 * @param upl UPL to set in the buffer. 602 * @param offset Offset within upl at which relevant data begin. 603 * @return 0 for success, EINVAL if the buffer was not allocated with buf_alloc(). 604 */ 605 errno_t buf_setupl(buf_t bp, upl_t upl, uint32_t offset); 606 607 /*! 608 * @function buf_clone 609 * @abstract Clone a buffer with a restricted range and an optional callback. 610 * @discussion Generates a buffer which is identical to its "bp" argument except that 611 * it spans a subset of the data of the original. The buffer to be cloned should 612 * have been allocated with buf_alloc(). Checks its arguments to make sure 613 * that the data subset is coherent. Optionally, adds a callback function and argument to it 614 * to be called when I/O completes (as with buf_setcallback(), but B_ASYNC is not set). If the original buffer had 615 * a upl set through buf_setupl(), this upl is copied to the new buffer; otherwise, the original's 616 * data pointer is used raw. The buffer must be released with buf_free(). 617 * @param bp Buffer to clone. 618 * @param io_offset Offset, relative to start of data in original buffer, at which new buffer's data will begin. 619 * @param io_size Size of buffer region in new buffer, in the sense of buf_count(). 620 * @param iodone Callback to be called from buf_biodone() when I/O completes, in the sense of buf_setcallback(). 621 * @param arg Argument to pass to iodone() callback. 622 * @return NULL if io_offset/io_size combination is invalid for the buffer to be cloned; otherwise, the new buffer. 623 */ 624 buf_t buf_clone(buf_t bp, int io_offset, int io_size, void (*iodone)(buf_t, void *), void *arg); 625 626 627 /*! 628 * @function buf_create_shadow 629 * @abstract Create a shadow buffer with optional private storage and an optional callback. 630 * @param bp Buffer to shadow. 631 * @param force_copy If TRUE, do not link the shadaow to 'bp' and if 'external_storage' == NULL, 632 * force a copy of the data associated with 'bp'. 633 * @param external_storage If non-NULL, associate it with the new buffer as its storage instead of the 634 * storage currently associated with 'bp'. 635 * @param iodone Callback to be called from buf_biodone() when I/O completes, in the sense of buf_setcallback(). 636 * @param arg Argument to pass to iodone() callback. 637 * @return NULL if the buffer to be shadowed is not B_META or a primary buffer (i.e. not a shadow buffer); otherwise, the new buffer. 638 */ 639 640 buf_t buf_create_shadow(buf_t bp, boolean_t force_copy, uintptr_t external_storage, void (*iodone)(buf_t, void *), void *arg); 641 642 643 /*! 644 * @function buf_shadow 645 * @abstract returns true if 'bp' is a shadow of another buffer. 646 * @param bp Buffer to query. 647 * @return 1 if 'bp' is a shadow, 0 otherwise. 648 */ 649 int buf_shadow(buf_t bp); 650 651 652 /*! 653 * @function buf_alloc 654 * @abstract Allocate an uninitialized buffer. 655 * @discussion A buffer returned by buf_alloc() is marked as busy and as an iobuf; it has no storage set up and must be 656 * set up using buf_setdataptr() or buf_setupl()/buf_map(). 657 * @param vp vnode to associate with the buffer: optionally NULL. If vp is a device file, then 658 * the buffer's associated device will be set. If vp is NULL, it can be set later with buf_setvnode(). 659 * @return New buffer. 660 */ 661 buf_t buf_alloc(vnode_t vp); 662 663 /*! 664 * @function buf_free 665 * @abstract Free a buffer that was allocated with buf_alloc(). 666 * @discussion The storage (UPL, data pointer) associated with an iobuf must be freed manually. 667 * @param bp The buffer to free. 668 */ 669 void buf_free(buf_t bp); 670 671 /* 672 * flags for buf_invalidateblks 673 */ 674 #define BUF_WRITE_DATA 0x0001 /* write data blocks first */ 675 #define BUF_SKIP_META 0x0002 /* skip over metadata blocks */ 676 #define BUF_INVALIDATE_LOCKED 0x0004 /* force B_LOCKED blocks to be invalidated */ 677 678 /*! 679 * @function buf_invalidateblks 680 * @abstract Invalidate all the blocks associated with a vnode. 681 * @discussion This function does for all blocks associated with a vnode what buf_invalblkno does for one block. 682 * Again, it will only be able to invalidate data which were populated with traditional buffer cache routines, 683 * i.e. by buf_getblk() and callers thereof. Unlike buf_invalblkno(), it can be made to write dirty data to disk 684 * rather than casting it aside. 685 * @param vp The vnode whose data to invalidate. 686 * @param flags BUF_WRITE_DATA: write dirty data to disk with VNOP_BWRITE() before kicking buffer cache entries out. 687 * BUF_SKIP_META: do not invalidate metadata blocks. 688 * @param slpflag Flags to pass to "msleep" while waiting to acquire busy buffers. 689 * @param slptimeo Timeout in "hz" (1/100 second) to wait for a buffer to become unbusy before waking from sleep 690 * and re-starting the scan. 691 * @return 0 for success, error values from msleep(). 692 */ 693 int buf_invalidateblks(vnode_t vp, int flags, int slpflag, int slptimeo); 694 695 /* 696 * flags for buf_flushdirtyblks and buf_iterate 697 */ 698 #define BUF_SKIP_NONLOCKED 0x01 699 #define BUF_SKIP_LOCKED 0x02 700 #define BUF_SCAN_CLEAN 0x04 /* scan the clean buffers */ 701 #define BUF_SCAN_DIRTY 0x08 /* scan the dirty buffers */ 702 #define BUF_NOTIFY_BUSY 0x10 /* notify the caller about the busy pages during the scan */ 703 704 705 #define BUF_RETURNED 0 706 #define BUF_RETURNED_DONE 1 707 #define BUF_CLAIMED 2 708 #define BUF_CLAIMED_DONE 3 709 /*! 710 * @function buf_flushdirtyblks 711 * @abstract Write dirty file blocks to disk. 712 * @param vp The vnode whose blocks to flush. 713 * @param wait Wait for writes to complete before returning. 714 * @param flags Can pass zero, meaning "flush all dirty buffers." 715 * BUF_SKIP_NONLOCKED: Skip buffers which are not busy when we encounter them. 716 * BUF_SKIP_LOCKED: Skip buffers which are busy when we encounter them. 717 * @param msg String to pass to msleep(). 718 */ 719 void buf_flushdirtyblks(vnode_t vp, int wait, int flags, const char *msg); 720 721 /*! 722 * @function buf_iterate 723 * @abstract Perform some operation on all buffers associated with a vnode. 724 * @param vp The vnode whose buffers to scan. 725 * @param callout Function to call on each buffer. Should return one of: 726 * BUF_RETURNED: buf_iterate() should call buf_brelse() on the buffer. 727 * BUF_RETURNED_DONE: buf_iterate() should call buf_brelse() on the buffer and then stop iterating. 728 * BUF_CLAIMED: buf_iterate() should continue iterating (and not call buf_brelse()). 729 * BUF_CLAIMED_DONE: buf_iterate() should stop iterating (and not call buf_brelse()). 730 * @param flags 731 * BUF_SKIP_NONLOCKED: Skip buffers which are not busy when we encounter them. BUF_SKIP_LOCKED: Skip buffers which are busy when we encounter them. 732 * BUF_SCAN_CLEAN: Call out on clean buffers. 733 * BUF_SCAN_DIRTY: Call out on dirty buffers. 734 * BUF_NOTIFY_BUSY: If a buffer cannot be acquired, pass a NULL buffer to callout; otherwise, 735 * that buffer will be silently skipped. 736 * @param arg Argument to pass to callout in addition to buffer. 737 */ 738 void buf_iterate(vnode_t vp, int (*callout)(buf_t, void *), int flags, void *arg); 739 740 /*! 741 * @function buf_clear 742 * @abstract Zero out the storage associated with a buffer. 743 * @discussion Calls buf_map() to get the buffer's data address; for a B_CLUSTER 744 * buffer (one which has had buf_setupl() called on it), it tries to map the buffer's 745 * UPL into memory; should only be called once during the life cycle of an iobuf (one allocated 746 * with buf_alloc()). 747 * @param bp The buffer to zero out. 748 */ 749 void buf_clear(buf_t bp); 750 751 /*! 752 * @function buf_bawrite 753 * @abstract Start an asychronous write on a buffer. 754 * @discussion Calls VNOP_BWRITE to start the process of propagating an asynchronous write down to the device layer. 755 * Callers can wait for writes to complete at their discretion using buf_biowait(). When this function is called, 756 * data should already have been written to the buffer's data region. 757 * @param bp The buffer on which to initiate I/O. 758 * @return EWOULDBLOCK if write count is high and "throttle" is zero; otherwise, errors from VNOP_BWRITE. 759 */ 760 errno_t buf_bawrite(buf_t bp); 761 762 /*! 763 * @function buf_bdwrite 764 * @abstract Mark a buffer for delayed write. 765 * @discussion Marks a buffer as waiting for delayed write and the current I/O as complete; data will be written to backing store 766 * before the buffer is reused, but it will not be queued for I/O immediately. Note that for buffers allocated 767 * with buf_alloc(), there are no such guarantees; you must take care of your own flushing to disk. If 768 * the number of delayed writes pending on the system is greater than an internal limit and the caller has not 769 * requested otherwise [see return_error] , buf_bdwrite() will unilaterally launch an asynchronous I/O with buf_bawrite() to keep the pile of 770 * delayed writes from getting too large. 771 * @param bp The buffer to mark for delayed write. 772 * @return EAGAIN for return_error != 0 case, 0 for succeess, errors from buf_bawrite. 773 */ 774 errno_t buf_bdwrite(buf_t bp); 775 776 /*! 777 * @function buf_bwrite 778 * @abstract Write a buffer's data to backing store. 779 * @discussion Once the data in a buffer has been modified, buf_bwrite() starts sending it to disk by calling 780 * VNOP_STRATEGY. Unless B_ASYNC has been set on the buffer (by buf_setflags() or otherwise), data will have 781 * been written to disk when buf_bwrite() returns. See Bach (p 56). 782 * @param bp The buffer to write to disk. 783 * @return 0 for success; errors from buf_biowait(). 784 */ 785 errno_t buf_bwrite(buf_t bp); 786 787 /*! 788 * @function buf_biodone 789 * @abstract Mark an I/O as completed. 790 * @discussion buf_biodone() should be called by whosoever decides that an I/O on a buffer is complete; for example, 791 * IOStorageFamily. It clears the dirty flag on a buffer and signals on the vnode that a write has completed 792 * with vnode_writedone(). If a callout or filter has been set on the buffer, that function is called. In the case 793 * of a callout, that function is expected to take care of cleaning up and freeing the buffer. 794 * Otherwise, if the buffer is marked B_ASYNC (e.g. it was passed to buf_bawrite()), then buf_biodone() 795 * considers itself justified in calling buf_brelse() to return it to free lists--no one is waiting for it. Finally, 796 * waiters on the bp (e.g. in buf_biowait()) are woken up. 797 * @param bp The buffer to mark as done with I/O. 798 */ 799 void buf_biodone(buf_t bp); 800 801 /*! 802 * @function buf_biowait 803 * @abstract Wait for I/O on a buffer to complete. 804 * @discussion Waits for I/O on a buffer to finish, as marked by a buf_biodone() call. 805 * @param bp The buffer to wait on. 806 * @return 0 for a successful wait; nonzero the buffer has been marked as EINTR or had an error set on it. 807 */ 808 errno_t buf_biowait(buf_t bp); 809 810 /*! 811 * @function buf_brelse 812 * @abstract Release any claim to a buffer, sending it back to free lists. 813 * @discussion buf_brelse() cleans up buffer state and releases a buffer to the free lists. If the buffer 814 * is not marked invalid and its pages are dirty (e.g. a delayed write was made), its data will be commited 815 * to backing store. If it is marked invalid, its data will be discarded completely. 816 * A valid, cacheable buffer will be put on a list and kept in the buffer hash so it 817 * can be found again; otherwise, it will be dissociated from its vnode and treated as empty. Which list a valid 818 * buffer is placed on depends on the use of buf_markaged(), whether it is metadata, and the B_LOCKED flag. A 819 * B_LOCKED buffer will not be available for reuse by other files, though its data may be paged out. 820 * Note that buf_brelse() is intended for use with traditionally allocated buffers. 821 * @param bp The buffer to release. 822 */ 823 void buf_brelse(buf_t bp); 824 825 /*! 826 * @function buf_bread 827 * @abstract Synchronously read a block of a file. 828 * @discussion buf_bread() is the traditional way to read a single logical block of a file through the buffer cache. 829 * It tries to find the buffer and corresponding page(s) in core, calls VNOP_STRATEGY if necessary to bring the data 830 * into memory, and waits for I/O to complete. It should not be used to read blocks of greater than 4K (one VM page) 831 * in size; use cluster routines for large reads. Indeed, the cluster layer is a more efficient choice for reading DATA 832 * unless you need some finely-tuned semantics that it cannot provide. 833 * @param vp The file from which to read. 834 * @param blkno The logical (filesystem) block number to read. 835 * @param size Size of block; do not use for sizes > 4K. 836 * @param cred Credential to store and use for reading from disk if data are not already in core. 837 * @param bpp Destination pointer for buffer. 838 * @return 0 for success, or an error from buf_biowait(). 839 */ 840 errno_t buf_bread(vnode_t vp, daddr64_t blkno, int size, kauth_cred_t cred, buf_t *bpp); 841 842 /*! 843 * @function buf_breadn 844 * @abstract Read a block from a file with read-ahead. 845 * @discussion buf_breadn() reads one block synchronously in the style of buf_bread() and fires 846 * off a specified set of asynchronous reads to improve the likelihood of future cache hits. 847 * It should not be used to read blocks of greater than 4K (one VM page) in size; use cluster 848 * routines for large reads. Indeed, the cluster layer is a more efficient choice for reading DATA 849 * unless you need some finely-tuned semantics that it cannot provide. 850 * @param vp The file from which to read. 851 * @param blkno The logical (filesystem) block number to read synchronously. 852 * @param size Size of block; do not use for sizes > 4K. 853 * @param rablks Array of logical block numbers for asynchronous read-aheads. 854 * @param rasizes Array of block sizes for asynchronous read-aheads, each index corresponding to same index in "rablks." 855 * @param nrablks Number of entries in read-ahead arrays. 856 * @param cred Credential to store and use for reading from disk if data are not already in core. 857 * @param bpp Destination pointer for buffer. 858 * @return 0 for success, or an error from buf_biowait(). 859 */ 860 errno_t buf_breadn(vnode_t vp, daddr64_t blkno, int size, daddr64_t *rablks, int *rasizes, int nrablks, kauth_cred_t cred, buf_t *bpp); 861 862 /*! 863 * @function buf_meta_bread 864 * @abstract Synchronously read a metadata block of a file. 865 * @discussion buf_meta_bread() is the traditional way to read a single logical block of a file through the buffer cache. 866 * It tries to find the buffer and corresponding page(s) in core, calls VNOP_STRATEGY if necessary to bring the data 867 * into memory, and waits for I/O to complete. It should not be used to read blocks of greater than 4K (one VM page) 868 * in size; use cluster routines for large reads. Reading meta-data through the traditional buffer cache, unlike 869 * reading data, is efficient and encouraged, especially if the blocks being read are significantly smaller than page size. 870 * @param vp The file from which to read. 871 * @param blkno The logical (filesystem) block number to read. 872 * @param size Size of block; do not use for sizes > 4K. 873 * @param cred Credential to store and use for reading from disk if data are not already in core. 874 * @param bpp Destination pointer for buffer. 875 * @return 0 for success, or an error from buf_biowait(). 876 */ 877 errno_t buf_meta_bread(vnode_t vp, daddr64_t blkno, int size, kauth_cred_t cred, buf_t *bpp); 878 879 /*! 880 * @function buf_meta_breadn 881 * @abstract Read a metadata block from a file with read-ahead. 882 * @discussion buf_meta_breadn() reads one block synchronously in the style of buf_meta_bread() and fires 883 * off a specified set of asynchronous reads to improve the likelihood of future cache hits. 884 * It should not be used to read blocks of greater than 4K (one VM page) in size; use cluster 885 * routines for large reads. 886 * @param vp The file from which to read. 887 * @param blkno The logical (filesystem) block number to read synchronously. 888 * @param size Size of block; do not use for sizes > 4K. 889 * @param rablks Array of logical block numbers for asynchronous read-aheads. 890 * @param rasizes Array of block sizes for asynchronous read-aheads, each index corresponding to same index in "rablks." 891 * @param nrablks Number of entries in read-ahead arrays. 892 * @param cred Credential to store and use for reading from disk if data are not already in core. 893 * @param bpp Destination pointer for buffer. 894 * @return 0 for success, or an error from buf_biowait(). 895 */ 896 errno_t buf_meta_breadn(vnode_t vp, daddr64_t blkno, int size, daddr64_t *rablks, int *rasizes, int nrablks, kauth_cred_t cred, buf_t *bpp); 897 898 /*! 899 * @function minphys 900 * @abstract Adjust a buffer's count to be no more than maximum physical I/O transfer size for the host architecture. 901 * @discussion physio() takes as a parameter a function to bound transfer sizes for each VNOP_STRATEGY() call. minphys() 902 * is a default implementation. It calls buf_setcount() to make the buffer's count the min() of its current count 903 * and the max I/O size for the host architecture. 904 * @param bp The buffer whose byte count to modify. 905 * @return New byte count. 906 */ 907 u_int minphys(buf_t bp); 908 909 /*! 910 * @function physio 911 * @abstract Perform I/O on a device to/from target memory described by a uio. 912 * @discussion physio() allows I/O directly from a device to user-space memory. It waits 913 * for all I/O to complete before returning. 914 * @param f_strategy Strategy routine to call to initiate I/O. 915 * @param bp Buffer to configure and pass to strategy routine; can be NULL. 916 * @param dev Device on which to perform I/O. 917 * @param flags B_READ or B_WRITE. 918 * @param f_minphys Function which calls buf_setcount() to set a byte count which is suitably 919 * small for the device in question. Returns byte count that has been set (or unchanged) on the buffer. 920 * @param uio UIO describing the I/O operation. 921 * @param blocksize Logical block size for this vnode. 922 * @return 0 for success; EFAULT for an invalid uio; errors from buf_biowait(). 923 */ 924 int physio(void (*f_strategy)(buf_t), buf_t bp, dev_t dev, int flags, u_int (*f_minphys)(buf_t), struct uio *uio, int blocksize); 925 926 927 /* 928 * Flags for operation type in getblk() 929 */ 930 #define BLK_READ 0x01 /* buffer for read */ 931 #define BLK_WRITE 0x02 /* buffer for write */ 932 #define BLK_META 0x10 /* buffer for metadata */ 933 /* 934 * modifier for above flags... if set, getblk will only return 935 * a bp that is already valid... i.e. found in the cache 936 */ 937 #define BLK_ONLYVALID 0x80000000 938 939 /*! 940 * @function buf_getblk 941 * @abstract Traditional buffer cache routine to get a buffer corresponding to a logical block in a file. 942 * @discussion buf_getblk() gets a buffer, not necessarily containing valid data, representing a block in a file. 943 * A metadata buffer will be returned with its own zone-allocated storage, managed by the traditional buffer-cache 944 * layer, whereas data buffers will be returned hooked into backing by the UBC (which in fact controls the caching of data). 945 * buf_getblk() first looks for the buffer header in cache; if the buffer is in-core but busy, buf_getblk() will wait for it to become 946 * unbusy, depending on the slpflag and slptimeo parameters. If the buffer is found unbusy and is a metadata buffer, 947 * it must already contain valid data and will be returned directly; data buffers will have a UPL configured to 948 * prepare for interaction with the underlying UBC. If the buffer is found in core, it will be marked as such 949 * and buf_fromcache() will return truth. A buffer is allocated and initialized (but not filled with data) 950 * if none is found in core. buf_bread(), buf_breadn(), buf_meta_bread(), and buf_meta_breadn() all 951 * return buffers obtained with buf_getblk(). 952 * @param vp File for which to get block. 953 * @param blkno Logical block number. 954 * @param size Size of block. 955 * @param slpflag Flag to pass to msleep() while waiting for buffer to become unbusy. 956 * @param slptimeo Time, in milliseconds, to wait for buffer to become unbusy. 0 means to wait indefinitely. 957 * @param operation BLK_READ: want a read buffer. BLK_WRITE: want a write buffer. BLK_META: want a metadata buffer. BLK_ONLYVALID: 958 * only return buffers which are found in core (do not allocate anew), and do not change buffer size. The last remark means 959 * that if a given logical block is found in core with a different size than what is requested, the buffer size will not be modified. 960 * @return Buffer found in core or newly allocated, either containing valid data or ready for I/O. 961 */ 962 buf_t buf_getblk(vnode_t vp, daddr64_t blkno, int size, int slpflag, int slptimeo, int operation); 963 964 /*! 965 * @function buf_geteblk 966 * @abstract Get a metadata buffer which is marked invalid and not associated with any vnode. 967 * @discussion A buffer is returned with zone-allocated storage of the specified size, marked B_META and invalid. 968 * It has no vnode and is not visible in the buffer hash. 969 * @param size Size of buffer. 970 * @return Always returns a new buffer. 971 */ 972 buf_t buf_geteblk(int size); 973 974 /*! 975 * @function buf_clear_redundancy_flags 976 * @abstract Clear flags on a buffer. 977 * @discussion buffer_redundancy_flags &= ~flags 978 * @param bp Buffer whose flags to clear. 979 * @param flags Flags to remove from buffer's mask 980 */ 981 void buf_clear_redundancy_flags(buf_t bp, uint32_t flags); 982 983 /*! 984 * @function buf_redundancyflags 985 * @abstract Get redundancy flags set on a buffer. 986 * @param bp Buffer whose redundancy flags to grab. 987 * @return flags. 988 */ 989 uint32_t buf_redundancy_flags(buf_t bp); 990 991 /*! 992 * @function buf_setredundancyflags 993 * @abstract Set redundancy flags on a buffer. 994 * @discussion buffer_redundancy_flags |= flags 995 * @param bp Buffer whose flags to set. 996 * @param flags Flags to add to buffer's redundancy flags 997 */ 998 void buf_set_redundancy_flags(buf_t bp, uint32_t flags); 999 1000 /*! 1001 * @function buf_attr 1002 * @abstract Gets the attributes for this buf. 1003 * @param bp Buffer whose attributes to get. 1004 * @return bufattr_t. 1005 */ 1006 bufattr_t buf_attr(buf_t bp); 1007 1008 /*! 1009 * @function buf_markstatic 1010 * @abstract Mark a buffer as being likely to contain static data. 1011 * @param bp Buffer to mark. 1012 */ 1013 void buf_markstatic(buf_t bp); 1014 1015 /*! 1016 * @function buf_static 1017 * @abstract Check if a buffer contains static data. 1018 * @param bp Buffer to test. 1019 * @return Nonzero if buffer has static data, 0 otherwise. 1020 */ 1021 int buf_static(buf_t bp); 1022 1023 /*! 1024 * @function bufattr_markiosched 1025 * @abstract Mark a buffer as belonging to an io scheduled mount point 1026 * @param bap Buffer attributes to mark. 1027 * @discussion Marks the buffer so that spec_strategy() will know that it belongs to an io scheduled mount point 1028 */ 1029 void bufattr_markioscheduled(bufattr_t bap); 1030 1031 /*! 1032 * @function bufattr_iosched 1033 * @abstract Check if a buffer is marked as io scheduled 1034 * @param bap Buffer attributes to test. 1035 * @return Nonzero if the buffer is marked io scheduled, 0 otherwise. 1036 */ 1037 int bufattr_ioscheduled(bufattr_t bap); 1038 1039 /*! 1040 * @function bufattr_markexpeditedmeta 1041 * @abstract Mark a metadata I/O buffer as expedited (i.e. requires a high I/O tier). 1042 * @param bap Buffer attributes to mark. 1043 * @discussion Marks the buffer so that spec_strategy() will know that it should be expedited 1044 */ 1045 void bufattr_markexpeditedmeta(bufattr_t bap); 1046 1047 /*! 1048 * @function bufattr_expeditedmeta 1049 * @abstract Check if a buffer is marked as expedited metadata I/O. 1050 * @param bap Buffer attributes to test. 1051 * @return Nonzero if the buffer is marked expedited metadata I/O, 0 otherwise. 1052 */ 1053 int bufattr_expeditedmeta(bufattr_t bap); 1054 1055 #ifdef KERNEL_PRIVATE 1056 void buf_setfilter(buf_t, void (*)(buf_t, void *), void *, void(**)(buf_t, void *), void **); 1057 1058 /* bufattr allocation/duplication/deallocation functions */ 1059 bufattr_t bufattr_alloc(void); 1060 bufattr_t bufattr_dup(bufattr_t bap); 1061 void bufattr_free(bufattr_t bap); 1062 1063 /*! 1064 * @function bufattr_cpx 1065 * @abstract Returns a pointer to a cpx_t structure. 1066 * @param bap Buffer Attribute whose cpx_t structure you wish to get. 1067 * @return Returns a cpx_t structure, or NULL if not valid 1068 */ 1069 struct cpx *bufattr_cpx(bufattr_t bap); 1070 1071 /*! 1072 * @function bufattr_setcpx 1073 * @abstract Set the cp_ctx on a buffer attribute. 1074 * @param bap Buffer Attribute that you wish to change 1075 */ 1076 void bufattr_setcpx(bufattr_t bap, struct cpx *cpx); 1077 1078 /*! 1079 * @function bufattr_cpoff 1080 * @abstract Gets the file offset on the buffer. 1081 * @param bap Buffer Attribute whose file offset value is used 1082 */ 1083 uint64_t bufattr_cpoff(bufattr_t bap); 1084 1085 /*! 1086 * @function bufattr_setcpoff 1087 * @abstract Set the file offset for a content protected I/O on 1088 * a buffer attribute. 1089 * @param bap Buffer Attribute whose cp file offset has to be set 1090 */ 1091 void bufattr_setcpoff(bufattr_t bap, uint64_t); 1092 1093 /*! 1094 * @function bufattr_rawencrypted 1095 * @abstract Check if a buffer contains raw encrypted data. 1096 * @param bap Buffer attribute to test. 1097 * @return Nonzero if buffer has raw encrypted data, 0 otherwise. 1098 */ 1099 int bufattr_rawencrypted(bufattr_t bap); 1100 1101 /*! 1102 * @function bufattr_markgreedymode 1103 * @abstract Mark a buffer to use the greedy mode for writing. 1104 * @param bap Buffer attributes to mark. 1105 * @discussion Greedy Mode: request improved write performance from the underlying device at the expense of storage efficiency 1106 */ 1107 void bufattr_markgreedymode(bufattr_t bap); 1108 1109 /*! 1110 * @function bufattr_greedymode 1111 * @abstract Check if a buffer is written using the Greedy Mode 1112 * @param bap Buffer attributes to test. 1113 * @discussion Greedy Mode: request improved write performance from the underlying device at the expense of storage efficiency 1114 * @return Nonzero if buffer uses greedy mode, 0 otherwise. 1115 */ 1116 int bufattr_greedymode(bufattr_t bap); 1117 1118 /*! 1119 * @function bufattr_markisochronous 1120 * @abstract Mark a buffer to use the isochronous throughput mode for writing. 1121 * @param bap Buffer attributes to mark. 1122 * @discussion isochronous mode: request improved write performance from the underlying device at the expense of storage efficiency 1123 */ 1124 void bufattr_markisochronous(bufattr_t bap); 1125 1126 /*! 1127 * @function bufattr_isochronous 1128 * @abstract Check if a buffer is written using the isochronous 1129 * @param bap Buffer attributes to test. 1130 * @discussion isochronous mode: request improved write performance from the underlying device at the expense of storage efficiency 1131 * @return Nonzero if buffer uses isochronous mode, 0 otherwise. 1132 */ 1133 int bufattr_isochronous(bufattr_t bap); 1134 1135 1136 /*! 1137 * @function bufattr_throttled 1138 * @abstract Check if a buffer is throttled. 1139 * @param bap Buffer attribute to test. 1140 * @return Nonzero if the buffer is throttled, 0 otherwise. 1141 */ 1142 int bufattr_throttled(bufattr_t bap); 1143 1144 /*! 1145 * @function bufattr_passive 1146 * @abstract Check if a buffer is marked passive. 1147 * @param bap Buffer attribute to test. 1148 * @return Nonzero if the buffer is marked passive, 0 otherwise. 1149 */ 1150 int bufattr_passive(bufattr_t bap); 1151 1152 /*! 1153 * @function bufattr_nocache 1154 * @abstract Check if a buffer has nocache attribute. 1155 * @param bap Buffer attribute to test. 1156 * @return Nonzero if the buffer is not cached, 0 otherwise. 1157 */ 1158 int bufattr_nocache(bufattr_t bap); 1159 1160 /*! 1161 * @function bufattr_meta 1162 * @abstract Check if a buffer has the bufattr meta attribute. 1163 * @param bap Buffer attribute to test. 1164 * @return Nonzero if the buffer has meta attribute, 0 otherwise. 1165 */ 1166 1167 int bufattr_meta(bufattr_t bap); 1168 1169 /*! 1170 * @function bufattr_markmeta 1171 * @abstract Set the bufattr meta attribute. 1172 * @param bap Buffer attribute to manipulate. 1173 */ 1174 void bufattr_markmeta(bufattr_t bap); 1175 1176 1177 /*! 1178 * @function bufattr_delayidlesleep 1179 * @abstract Check if a buffer is marked to delay idle sleep on disk IO. 1180 * @param bap Buffer attribute to test. 1181 * @return Nonzero if the buffer is marked to delay idle sleep on disk IO, 0 otherwise. 1182 */ 1183 int bufattr_delayidlesleep(bufattr_t bap); 1184 1185 /*! 1186 * @function buf_kernel_addrperm_addr 1187 * @abstract Obfuscate the buf pointers. 1188 * @param addr Buf_t pointer. 1189 * @return Obfuscated pointer if addr is non zero, 0 otherwise. 1190 */ 1191 vm_offset_t buf_kernel_addrperm_addr(void * addr); 1192 1193 /*! 1194 * @function bufattr_markquickcomplete 1195 * @abstract Mark a buffer to hint quick completion to the driver. 1196 * @discussion This flag hints the storage driver that some thread is waiting for this I/O to complete. 1197 * It should therefore attempt to complete it as soon as possible at the cost of device efficiency. 1198 * @param bap Buffer attributes to mark. 1199 */ 1200 void bufattr_markquickcomplete(bufattr_t bap); 1201 1202 /*! 1203 * @function bufattr_quickcomplete 1204 * @abstract Check if a buffer is marked for quick completion 1205 * @discussion This flag hints the storage driver that some thread is waiting for this I/O to complete. 1206 * It should therefore attempt to complete it as soon as possible at the cost of device efficiency. 1207 * @param bap Buffer attribute to test. 1208 * @return Nonzero if the buffer is marked for quick completion, 0 otherwise. 1209 */ 1210 int bufattr_quickcomplete(bufattr_t bap); 1211 1212 int count_lock_queue(void); 1213 1214 /* 1215 * Flags for buf_acquire 1216 */ 1217 #define BAC_NOWAIT 0x01 /* Don't wait if buffer is busy */ 1218 #define BAC_REMOVE 0x02 /* Remove from free list once buffer is acquired */ 1219 #define BAC_SKIP_NONLOCKED 0x04 /* Don't return LOCKED buffers */ 1220 #define BAC_SKIP_LOCKED 0x08 /* Only return LOCKED buffers */ 1221 1222 errno_t buf_acquire(buf_t, int, int, int); 1223 1224 buf_t buf_create_shadow_priv(buf_t bp, boolean_t force_copy, uintptr_t external_storage, void (*iodone)(buf_t, void *), void *arg); 1225 1226 void buf_drop(buf_t); 1227 1228 #endif /* KERNEL_PRIVATE */ 1229 1230 __END_DECLS 1231 1232 1233 /* Macros to clear/set/test flags. */ 1234 #define SET(t, f) (t) |= (f) 1235 #define CLR(t, f) (t) &= ~(f) 1236 #define ISSET(t, f) ((t) & (f)) 1237 1238 1239 #endif /* !_SYS_BUF_H_ */