1e974f91cSConrad Meyer.\" Copyright (c) 2015 EMC / Isilon Storage Division 2e974f91cSConrad Meyer.\" All rights reserved. 3e974f91cSConrad Meyer.\" 4e974f91cSConrad Meyer.\" Redistribution and use in source and binary forms, with or without 5e974f91cSConrad Meyer.\" modification, are permitted provided that the following conditions 6e974f91cSConrad Meyer.\" are met: 7e974f91cSConrad Meyer.\" 1. Redistributions of source code must retain the above copyright 8e974f91cSConrad Meyer.\" notice, this list of conditions and the following disclaimer. 9e974f91cSConrad Meyer.\" 2. Redistributions in binary form must reproduce the above copyright 10e974f91cSConrad Meyer.\" notice, this list of conditions and the following disclaimer in the 11e974f91cSConrad Meyer.\" documentation and/or other materials provided with the distribution. 12e974f91cSConrad Meyer.\" 13e974f91cSConrad Meyer.\" THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND 14e974f91cSConrad Meyer.\" ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 15e974f91cSConrad Meyer.\" IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 16e974f91cSConrad Meyer.\" ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE 17e974f91cSConrad Meyer.\" FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 18e974f91cSConrad Meyer.\" DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 19e974f91cSConrad Meyer.\" OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 20e974f91cSConrad Meyer.\" HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 21e974f91cSConrad Meyer.\" LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 22e974f91cSConrad Meyer.\" OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 23e974f91cSConrad Meyer.\" SUCH DAMAGE. 
24e974f91cSConrad Meyer.\" 25e974f91cSConrad Meyer.\" $FreeBSD$ 26e974f91cSConrad Meyer.\" 27*5ca9fc2aSConrad Meyer.Dd December 14, 2015 28e974f91cSConrad Meyer.Dt IOAT 4 29e974f91cSConrad Meyer.Os 30e974f91cSConrad Meyer.Sh NAME 31e974f91cSConrad Meyer.Nm I/OAT 32e974f91cSConrad Meyer.Nd Intel I/O Acceleration Technology 33e974f91cSConrad Meyer.Sh SYNOPSIS 34faefad9cSConrad MeyerTo compile this driver into your kernel, 35faefad9cSConrad Meyerplace the following line in your kernel configuration file: 36faefad9cSConrad Meyer.Bd -ragged -offset indent 37e974f91cSConrad Meyer.Cd "device ioat" 38faefad9cSConrad Meyer.Ed 39faefad9cSConrad Meyer.Pp 40faefad9cSConrad MeyerOr, to load the driver as a module at boot, place the following line in 41faefad9cSConrad Meyer.Xr loader.conf 5 : 42faefad9cSConrad Meyer.Bd -literal -offset indent 43faefad9cSConrad Meyerioat_load="YES" 44faefad9cSConrad Meyer.Ed 45faefad9cSConrad Meyer.Pp 46e974f91cSConrad MeyerIn 47e974f91cSConrad Meyer.Xr loader.conf 5 : 48e974f91cSConrad Meyer.Pp 49e974f91cSConrad Meyer.Cd hw.ioat.force_legacy_interrupts=0 50e974f91cSConrad Meyer.Pp 51e974f91cSConrad MeyerIn 52e974f91cSConrad Meyer.Xr loader.conf 5 or 53e974f91cSConrad Meyer.Xr sysctl.conf 5 : 54e974f91cSConrad Meyer.Pp 55e974f91cSConrad Meyer.Cd hw.ioat.enable_ioat_test=0 56e974f91cSConrad Meyer.Cd hw.ioat.debug_level=0 57e974f91cSConrad Meyer(only critical errors; maximum of 3) 58e974f91cSConrad Meyer.Pp 59e974f91cSConrad Meyer.Ft typedef void 60faefad9cSConrad Meyer.Fn (*bus_dmaengine_callback_t) "void *arg" "int error" 61e974f91cSConrad Meyer.Pp 62e974f91cSConrad Meyer.Ft bus_dmaengine_t 63e974f91cSConrad Meyer.Fn ioat_get_dmaengine "uint32_t channel_index" 64e974f91cSConrad Meyer.Ft void 65faefad9cSConrad Meyer.Fn ioat_put_dmaengine "bus_dmaengine_t dmaengine" 66*5ca9fc2aSConrad Meyer.Ft int 67*5ca9fc2aSConrad Meyer.Fn ioat_set_interrupt_coalesce "bus_dmaengine_t dmaengine" "uint16_t delay" 68*5ca9fc2aSConrad Meyer.Ft uint16_t 
69*5ca9fc2aSConrad Meyer.Fn ioat_get_max_coalesce_period "bus_dmaengine_t dmaengine" 70faefad9cSConrad Meyer.Ft void 71e974f91cSConrad Meyer.Fn ioat_acquire "bus_dmaengine_t dmaengine" 72e974f91cSConrad Meyer.Ft void 73e974f91cSConrad Meyer.Fn ioat_release "bus_dmaengine_t dmaengine" 74e974f91cSConrad Meyer.Ft struct bus_dmadesc * 75e974f91cSConrad Meyer.Fo ioat_copy 76e974f91cSConrad Meyer.Fa "bus_dmaengine_t dmaengine" 77e974f91cSConrad Meyer.Fa "bus_addr_t dst" 78e974f91cSConrad Meyer.Fa "bus_addr_t src" 79e974f91cSConrad Meyer.Fa "bus_size_t len" 80e974f91cSConrad Meyer.Fa "bus_dmaengine_callback_t callback_fn" 81e974f91cSConrad Meyer.Fa "void *callback_arg" 82e974f91cSConrad Meyer.Fa "uint32_t flags" 83e974f91cSConrad Meyer.Fc 84e974f91cSConrad Meyer.Ft struct bus_dmadesc * 859950fde0SConrad Meyer.Fo ioat_copy_8k_aligned 869950fde0SConrad Meyer.Fa "bus_dmaengine_t dmaengine" 879950fde0SConrad Meyer.Fa "bus_addr_t dst1" 889950fde0SConrad Meyer.Fa "bus_addr_t dst2" 899950fde0SConrad Meyer.Fa "bus_addr_t src1" 909950fde0SConrad Meyer.Fa "bus_addr_t src2" 919950fde0SConrad Meyer.Fa "bus_dmaengine_callback_t callback_fn" 929950fde0SConrad Meyer.Fa "void *callback_arg" 939950fde0SConrad Meyer.Fa "uint32_t flags" 949950fde0SConrad Meyer.Fc 959950fde0SConrad Meyer.Ft struct bus_dmadesc * 96faefad9cSConrad Meyer.Fo ioat_blockfill 97faefad9cSConrad Meyer.Fa "bus_dmaengine_t dmaengine" 98faefad9cSConrad Meyer.Fa "bus_addr_t dst" 99faefad9cSConrad Meyer.Fa "uint64_t fillpattern" 100faefad9cSConrad Meyer.Fa "bus_size_t len" 101faefad9cSConrad Meyer.Fa "bus_dmaengine_callback_t callback_fn" 102faefad9cSConrad Meyer.Fa "void *callback_arg" 103faefad9cSConrad Meyer.Fa "uint32_t flags" 104faefad9cSConrad Meyer.Fc 105faefad9cSConrad Meyer.Ft struct bus_dmadesc * 106e974f91cSConrad Meyer.Fo ioat_null 107e974f91cSConrad Meyer.Fa "bus_dmaengine_t dmaengine" 108e974f91cSConrad Meyer.Fa "bus_dmaengine_callback_t callback_fn" 109e974f91cSConrad Meyer.Fa "void *callback_arg" 
110e974f91cSConrad Meyer.Fa "uint32_t flags" 111e974f91cSConrad Meyer.Fc 112e974f91cSConrad Meyer.Sh DESCRIPTION 113e974f91cSConrad MeyerThe 114e974f91cSConrad Meyer.Nm 115e974f91cSConrad Meyerdriver provides a kernel API to a variety of DMA engines on some Intel server 116e974f91cSConrad Meyerplatforms. 117e974f91cSConrad Meyer.Pp 118e974f91cSConrad MeyerThere are a number of DMA channels per CPU package. 119e974f91cSConrad Meyer(Typically 4 or 8.) 120e974f91cSConrad MeyerEach may be used independently. 121e974f91cSConrad MeyerOperations on a single channel proceed sequentially. 122e974f91cSConrad Meyer.Pp 123faefad9cSConrad MeyerBlockfill operations can be used to write a 64-bit pattern to memory. 124faefad9cSConrad Meyer.Pp 125faefad9cSConrad MeyerCopy operations can be used to offload memory copies to the DMA engines. 126e974f91cSConrad Meyer.Pp 127e974f91cSConrad MeyerNull operations do nothing, but may be used to test the interrupt and callback 128e974f91cSConrad Meyermechanism. 129e974f91cSConrad Meyer.Pp 130e974f91cSConrad MeyerAll operations can optionally trigger an interrupt at completion with the 131e974f91cSConrad Meyer.Ar DMA_EN_INT 132e974f91cSConrad Meyerflag. 133e974f91cSConrad MeyerFor example, a user might submit multiple operations to the same channel and 134e974f91cSConrad Meyeronly enable an interrupt and callback for the last operation. 135faefad9cSConrad Meyer.Pp 136*5ca9fc2aSConrad MeyerThe hardware can delay and coalesce interrupts on a given channel for a 137*5ca9fc2aSConrad Meyerconfigurable period of time, in microseconds. 138*5ca9fc2aSConrad MeyerThis may be desired to reduce the processing and interrupt overhead per 139*5ca9fc2aSConrad Meyerdescriptor, especially for workflows consisting of many small operations. 140*5ca9fc2aSConrad MeyerSoftware can control this on a per-channel basis with the 141*5ca9fc2aSConrad Meyer.Fn ioat_set_interrupt_coalesce 142*5ca9fc2aSConrad MeyerAPI. 
143*5ca9fc2aSConrad MeyerThe 144*5ca9fc2aSConrad Meyer.Fn ioat_get_max_coalesce_period 145*5ca9fc2aSConrad MeyerAPI can be used to determine the maximum coalescing period supported by the 146*5ca9fc2aSConrad Meyerhardware, in microseconds. 147*5ca9fc2aSConrad MeyerCurrent platforms support up to a 16.383 millisecond coalescing period. 148*5ca9fc2aSConrad MeyerOptimal configuration will vary by workflow and desired operation latency. 149*5ca9fc2aSConrad Meyer.Pp 150faefad9cSConrad MeyerAll operations are safe to use in a non-blocking context with the 151faefad9cSConrad Meyer.Ar DMA_NO_WAIT 152faefad9cSConrad Meyerflag. 153faefad9cSConrad Meyer(Of course, allocations may fail and operations requested with 154faefad9cSConrad Meyer.Ar DMA_NO_WAIT 155faefad9cSConrad Meyermay return NULL.) 156faefad9cSConrad Meyer.Pp 157faefad9cSConrad MeyerAll operations, as well as 158faefad9cSConrad Meyer.Fn ioat_get_dmaengine , 159faefad9cSConrad Meyercan return NULL in special circumstances. 160faefad9cSConrad MeyerFor example, if the 161faefad9cSConrad Meyer.Nm 162faefad9cSConrad Meyerdriver is being unloaded, or the administrator has induced a hardware reset, or 163faefad9cSConrad Meyera usage error has resulted in a hardware error state that needs to be recovered 164faefad9cSConrad Meyerfrom. 165faefad9cSConrad Meyer.Pp 166faefad9cSConrad MeyerIt is invalid to attempt to submit new DMA operations in a 167faefad9cSConrad Meyer.Fa bus_dmaengine_callback_t 168faefad9cSConrad Meyercontext. 169e974f91cSConrad Meyer.Sh USAGE 170e974f91cSConrad MeyerA typical user will look up the DMA engine object for a given channel with 171e974f91cSConrad Meyer.Fn ioat_get_dmaengine . 172e974f91cSConrad MeyerWhen the user wants to offload a copy, they will first 173e974f91cSConrad Meyer.Fn ioat_acquire 174e974f91cSConrad Meyerthe 175e974f91cSConrad Meyer.Ar bus_dmaengine_t 176e974f91cSConrad Meyerobject for exclusive access to enqueue operations on that channel. 
177e974f91cSConrad MeyerThen, they will submit one or more operations using 178faefad9cSConrad Meyer.Fn ioat_blockfill , 179faefad9cSConrad Meyer.Fn ioat_copy , 180e974f91cSConrad Meyeror 181e974f91cSConrad Meyer.Fn ioat_null . 1829950fde0SConrad MeyerAfter queuing one or more individual DMA operations, they will 183e974f91cSConrad Meyer.Fn ioat_release 184e974f91cSConrad Meyerthe 185e974f91cSConrad Meyer.Ar bus_dmaengine_t 186e974f91cSConrad Meyerto drop their exclusive access to the channel. 187e974f91cSConrad MeyerThe routine they provided for the 188e974f91cSConrad Meyer.Fa callback_fn 189e974f91cSConrad Meyerargument will be invoked with the provided 190e974f91cSConrad Meyer.Fa callback_arg 191e974f91cSConrad Meyerwhen the operation is complete. 192faefad9cSConrad MeyerWhen they are finished with the 193faefad9cSConrad Meyer.Ar bus_dmaengine_t , 194faefad9cSConrad Meyerthe user should 195faefad9cSConrad Meyer.Fn ioat_put_dmaengine . 196faefad9cSConrad Meyer.Pp 197faefad9cSConrad MeyerUsers MUST NOT block between 198faefad9cSConrad Meyer.Fn ioat_acquire 199faefad9cSConrad Meyerand 200faefad9cSConrad Meyer.Fn ioat_release . 201faefad9cSConrad MeyerUsers SHOULD NOT hold 202faefad9cSConrad Meyer.Ar bus_dmaengine_t 203faefad9cSConrad Meyerreferences for a very long time to enable fault recovery and kernel module 204faefad9cSConrad Meyerunload. 205e974f91cSConrad Meyer.Pp 206e974f91cSConrad MeyerFor an example of usage, see 207e974f91cSConrad Meyer.Pa src/sys/dev/ioat/ioat_test.c . 208e974f91cSConrad Meyer.Sh FILES 209280186c7SChristian Brueffer.Bl -tag 210e974f91cSConrad Meyer.It Pa /dev/ioat_test 211e974f91cSConrad Meyertest device for 212e974f91cSConrad Meyer.Xr ioatcontrol 8 213e974f91cSConrad Meyer.El 214e974f91cSConrad Meyer.Sh SEE ALSO 215e974f91cSConrad Meyer.Xr ioatcontrol 8 216e974f91cSConrad Meyer.Sh HISTORY 217e974f91cSConrad MeyerThe 218e974f91cSConrad Meyer.Nm 219e974f91cSConrad Meyerdriver first appeared in 220e974f91cSConrad Meyer.Fx 11.0 . 
221e974f91cSConrad Meyer.Sh AUTHORS 222e974f91cSConrad MeyerThe 223e974f91cSConrad Meyer.Nm 224e974f91cSConrad Meyerdriver was developed by 225e974f91cSConrad Meyer.An \&Jim Harris Aq Mt jimharris@FreeBSD.org , 226faefad9cSConrad Meyer.An \&Carl Delsey Aq Mt carl.r.delsey@intel.com , 227e974f91cSConrad Meyerand 228faefad9cSConrad Meyer.An \&Conrad Meyer Aq Mt cem@FreeBSD.org . 229e974f91cSConrad MeyerThis manual page was written by 230e974f91cSConrad Meyer.An \&Conrad Meyer Aq Mt cem@FreeBSD.org . 231e974f91cSConrad Meyer.Sh CAVEATS 232e974f91cSConrad MeyerCopy operations take bus addresses as parameters, not virtual addresses. 233e974f91cSConrad Meyer.Pp 234faefad9cSConrad MeyerBuffers for individual copy operations must be physically contiguous. 235faefad9cSConrad Meyer.Pp 236faefad9cSConrad MeyerCopies larger than the maximum transfer size (1MB, but may vary by hardware) are not 237faefad9cSConrad Meyersupported. 238e974f91cSConrad MeyerFuture versions will likely support this by breaking up the transfer into 239e974f91cSConrad Meyersmaller sizes. 240e974f91cSConrad Meyer.Sh BUGS 241e974f91cSConrad MeyerThe 242e974f91cSConrad Meyer.Nm 243faefad9cSConrad Meyerdriver only supports blockfill, copy, and null operations at this time. 244e974f91cSConrad MeyerThe driver does not yet support advanced DMA modes, such as XOR, that some 245e974f91cSConrad MeyerI/OAT devices support. 246