1e974f91cSConrad Meyer /*- 2e974f91cSConrad Meyer * Copyright (C) 2012 Intel Corporation 3e974f91cSConrad Meyer * All rights reserved. 4e974f91cSConrad Meyer * 5e974f91cSConrad Meyer * Redistribution and use in source and binary forms, with or without 6e974f91cSConrad Meyer * modification, are permitted provided that the following conditions 7e974f91cSConrad Meyer * are met: 8e974f91cSConrad Meyer * 1. Redistributions of source code must retain the above copyright 9e974f91cSConrad Meyer * notice, this list of conditions and the following disclaimer. 10e974f91cSConrad Meyer * 2. Redistributions in binary form must reproduce the above copyright 11e974f91cSConrad Meyer * notice, this list of conditions and the following disclaimer in the 12e974f91cSConrad Meyer * documentation and/or other materials provided with the distribution. 13e974f91cSConrad Meyer * 14e974f91cSConrad Meyer * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 15e974f91cSConrad Meyer * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16e974f91cSConrad Meyer * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 17e974f91cSConrad Meyer * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 18e974f91cSConrad Meyer * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19e974f91cSConrad Meyer * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20e974f91cSConrad Meyer * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21e974f91cSConrad Meyer * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22e974f91cSConrad Meyer * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23e974f91cSConrad Meyer * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24e974f91cSConrad Meyer * SUCH DAMAGE. 25e974f91cSConrad Meyer */ 26e974f91cSConrad Meyer 27e974f91cSConrad Meyer #include <sys/cdefs.h> 28e974f91cSConrad Meyer __FBSDID("$FreeBSD$"); 29e974f91cSConrad Meyer 30e974f91cSConrad Meyer #include <sys/param.h> 31e974f91cSConrad Meyer #include <sys/systm.h> 32e974f91cSConrad Meyer #include <sys/bus.h> 33e974f91cSConrad Meyer #include <sys/conf.h> 34e974f91cSConrad Meyer #include <sys/ioccom.h> 35e974f91cSConrad Meyer #include <sys/kernel.h> 36e974f91cSConrad Meyer #include <sys/lock.h> 37e974f91cSConrad Meyer #include <sys/malloc.h> 38e974f91cSConrad Meyer #include <sys/module.h> 39e974f91cSConrad Meyer #include <sys/mutex.h> 40e974f91cSConrad Meyer #include <sys/rman.h> 41e974f91cSConrad Meyer #include <sys/sysctl.h> 42e974f91cSConrad Meyer #include <sys/time.h> 43e974f91cSConrad Meyer #include <dev/pci/pcireg.h> 44e974f91cSConrad Meyer #include <dev/pci/pcivar.h> 45e974f91cSConrad Meyer #include <machine/bus.h> 46e974f91cSConrad Meyer #include <machine/resource.h> 47e974f91cSConrad Meyer #include <machine/stdarg.h> 48e974f91cSConrad Meyer 49e974f91cSConrad Meyer #include "ioat.h" 50e974f91cSConrad Meyer #include "ioat_hw.h" 51e974f91cSConrad Meyer #include "ioat_internal.h" 52e974f91cSConrad Meyer 53e974f91cSConrad Meyer static int ioat_probe(device_t device); 54e974f91cSConrad Meyer static int ioat_attach(device_t device); 55e974f91cSConrad Meyer static int ioat_detach(device_t device); 56*4253ea50SConrad Meyer static int ioat_setup_intr(struct ioat_softc *ioat); 57*4253ea50SConrad Meyer static int ioat_teardown_intr(struct ioat_softc *ioat); 58e974f91cSConrad Meyer static int ioat3_attach(device_t device); 59e974f91cSConrad Meyer static int ioat_map_pci_bar(struct ioat_softc *ioat); 60e974f91cSConrad Meyer static void ioat_dmamap_cb(void *arg, bus_dma_segment_t *segs, int nseg, 61e974f91cSConrad Meyer int error); 62e974f91cSConrad Meyer static void ioat_interrupt_handler(void *arg); 63*4253ea50SConrad Meyer static boolean_t ioat_is_bdxde(struct ioat_softc *ioat); 64e974f91cSConrad Meyer static void ioat_process_events(struct ioat_softc *ioat); 65e974f91cSConrad Meyer static inline uint32_t ioat_get_active(struct ioat_softc *ioat); 66e974f91cSConrad Meyer static inline uint32_t ioat_get_ring_space(struct ioat_softc *ioat); 67e974f91cSConrad Meyer static void ioat_free_ring_entry(struct ioat_softc *ioat, 68e974f91cSConrad Meyer struct ioat_descriptor *desc); 69e974f91cSConrad Meyer static struct ioat_descriptor * ioat_alloc_ring_entry(struct ioat_softc *ioat); 70e974f91cSConrad Meyer static int ioat_reserve_space_and_lock(struct ioat_softc *ioat, int num_descs); 71e974f91cSConrad Meyer static struct ioat_descriptor * ioat_get_ring_entry(struct ioat_softc *ioat, 72e974f91cSConrad Meyer uint32_t index); 73e974f91cSConrad Meyer static boolean_t resize_ring(struct ioat_softc *ioat, int order); 74e974f91cSConrad Meyer static void ioat_timer_callback(void *arg); 75e974f91cSConrad Meyer static void dump_descriptor(void *hw_desc); 76e974f91cSConrad Meyer static void ioat_submit_single(struct ioat_softc *ioat); 77e974f91cSConrad Meyer static void ioat_comp_update_map(void *arg, bus_dma_segment_t *seg, int nseg, 78e974f91cSConrad Meyer int error); 79e974f91cSConrad Meyer static int ioat_reset_hw(struct ioat_softc *ioat); 80e974f91cSConrad Meyer static void ioat_setup_sysctl(device_t device); 81e974f91cSConrad Meyer 82e974f91cSConrad Meyer MALLOC_DEFINE(M_IOAT, "ioat", "ioat driver memory allocations"); 83e974f91cSConrad Meyer SYSCTL_NODE(_hw, OID_AUTO, ioat, CTLFLAG_RD, 0, "ioat node"); 84e974f91cSConrad Meyer 85e974f91cSConrad Meyer static int g_force_legacy_interrupts; 86e974f91cSConrad Meyer SYSCTL_INT(_hw_ioat, OID_AUTO, force_legacy_interrupts, CTLFLAG_RDTUN, 87e974f91cSConrad Meyer &g_force_legacy_interrupts, 0, "Set to non-zero to force MSI-X disabled"); 88e974f91cSConrad Meyer 89e974f91cSConrad Meyer static int g_ioat_debug_level = 0; 90e974f91cSConrad Meyer SYSCTL_INT(_hw_ioat, OID_AUTO, debug_level, CTLFLAG_RWTUN, &g_ioat_debug_level, 91e974f91cSConrad Meyer 0, "Set log level (0-3) for ioat(4). Higher is more verbose."); 92e974f91cSConrad Meyer 93e974f91cSConrad Meyer /* 94e974f91cSConrad Meyer * OS <-> Driver interface structures 95e974f91cSConrad Meyer */ 96e974f91cSConrad Meyer static device_method_t ioat_pci_methods[] = { 97e974f91cSConrad Meyer /* Device interface */ 98e974f91cSConrad Meyer DEVMETHOD(device_probe, ioat_probe), 99e974f91cSConrad Meyer DEVMETHOD(device_attach, ioat_attach), 100e974f91cSConrad Meyer DEVMETHOD(device_detach, ioat_detach), 101e974f91cSConrad Meyer { 0, 0 } 102e974f91cSConrad Meyer }; 103e974f91cSConrad Meyer 104e974f91cSConrad Meyer static driver_t ioat_pci_driver = { 105e974f91cSConrad Meyer "ioat", 106e974f91cSConrad Meyer ioat_pci_methods, 107e974f91cSConrad Meyer sizeof(struct ioat_softc), 108e974f91cSConrad Meyer }; 109e974f91cSConrad Meyer 110e974f91cSConrad Meyer static devclass_t ioat_devclass; 111e974f91cSConrad Meyer DRIVER_MODULE(ioat, pci, ioat_pci_driver, ioat_devclass, 0, 0); 112e974f91cSConrad Meyer 113e974f91cSConrad Meyer /* 114e974f91cSConrad Meyer * Private data structures 115e974f91cSConrad Meyer */ 116e974f91cSConrad Meyer static struct ioat_softc *ioat_channel[IOAT_MAX_CHANNELS]; 117e974f91cSConrad Meyer static int ioat_channel_index = 0; 118e974f91cSConrad Meyer SYSCTL_INT(_hw_ioat, OID_AUTO, channels, CTLFLAG_RD, &ioat_channel_index, 0, 119e974f91cSConrad Meyer "Number of IOAT channels attached"); 120e974f91cSConrad Meyer 121e974f91cSConrad Meyer static struct _pcsid 122e974f91cSConrad Meyer { 123e974f91cSConrad Meyer u_int32_t type; 124e974f91cSConrad Meyer const char *desc; 125e974f91cSConrad Meyer } pci_ids[] = { 126e974f91cSConrad Meyer { 0x34308086, "TBG IOAT Ch0" }, 127e974f91cSConrad Meyer { 0x34318086, "TBG IOAT Ch1" }, 128e974f91cSConrad Meyer { 0x34328086, "TBG IOAT Ch2" }, 129e974f91cSConrad Meyer { 0x34338086, "TBG IOAT Ch3" }, 130e974f91cSConrad Meyer { 0x34298086, "TBG IOAT Ch4" }, 131e974f91cSConrad Meyer { 0x342a8086, "TBG IOAT Ch5" }, 132e974f91cSConrad Meyer { 0x342b8086, "TBG IOAT Ch6" }, 133e974f91cSConrad Meyer { 0x342c8086, "TBG IOAT Ch7" }, 134e974f91cSConrad Meyer 135e974f91cSConrad Meyer { 0x37108086, "JSF IOAT Ch0" }, 136e974f91cSConrad Meyer { 0x37118086, "JSF IOAT Ch1" }, 137e974f91cSConrad Meyer { 0x37128086, "JSF IOAT Ch2" }, 138e974f91cSConrad Meyer { 0x37138086, "JSF IOAT Ch3" }, 139e974f91cSConrad Meyer { 0x37148086, "JSF IOAT Ch4" }, 140e974f91cSConrad Meyer { 0x37158086, "JSF IOAT Ch5" }, 141e974f91cSConrad Meyer { 0x37168086, "JSF IOAT Ch6" }, 142e974f91cSConrad Meyer { 0x37178086, "JSF IOAT Ch7" }, 143e974f91cSConrad Meyer { 0x37188086, "JSF IOAT Ch0 (RAID)" }, 144e974f91cSConrad Meyer { 0x37198086, "JSF IOAT Ch1 (RAID)" }, 145e974f91cSConrad Meyer 146e974f91cSConrad Meyer { 0x3c208086, "SNB IOAT Ch0" }, 147e974f91cSConrad Meyer { 0x3c218086, "SNB IOAT Ch1" }, 148e974f91cSConrad Meyer { 0x3c228086, "SNB IOAT Ch2" }, 149e974f91cSConrad Meyer { 0x3c238086, "SNB IOAT Ch3" }, 150e974f91cSConrad Meyer { 0x3c248086, "SNB IOAT Ch4" }, 151e974f91cSConrad Meyer { 0x3c258086, "SNB IOAT Ch5" }, 152e974f91cSConrad Meyer { 0x3c268086, "SNB IOAT Ch6" }, 153e974f91cSConrad Meyer { 0x3c278086, "SNB IOAT Ch7" }, 154e974f91cSConrad Meyer { 0x3c2e8086, "SNB IOAT Ch0 (RAID)" }, 155e974f91cSConrad Meyer { 0x3c2f8086, "SNB IOAT Ch1 (RAID)" }, 156e974f91cSConrad Meyer 157e974f91cSConrad Meyer { 0x0e208086, "IVB IOAT Ch0" }, 158e974f91cSConrad Meyer { 0x0e218086, "IVB IOAT Ch1" }, 159e974f91cSConrad Meyer { 0x0e228086, "IVB IOAT Ch2" }, 160e974f91cSConrad Meyer { 0x0e238086, "IVB IOAT Ch3" }, 161e974f91cSConrad Meyer { 0x0e248086, "IVB IOAT Ch4" }, 162e974f91cSConrad Meyer { 0x0e258086, "IVB IOAT Ch5" }, 163e974f91cSConrad Meyer { 0x0e268086, "IVB IOAT Ch6" }, 164e974f91cSConrad Meyer { 0x0e278086, "IVB IOAT Ch7" }, 165e974f91cSConrad Meyer { 0x0e2e8086, "IVB IOAT Ch0 (RAID)" }, 166e974f91cSConrad Meyer { 0x0e2f8086, "IVB IOAT Ch1 (RAID)" }, 167e974f91cSConrad Meyer 168e974f91cSConrad Meyer { 0x2f208086, "HSW IOAT Ch0" }, 169e974f91cSConrad Meyer { 0x2f218086, "HSW IOAT Ch1" }, 170e974f91cSConrad Meyer { 0x2f228086, "HSW IOAT Ch2" }, 171e974f91cSConrad Meyer { 0x2f238086, "HSW IOAT Ch3" }, 172e974f91cSConrad Meyer { 0x2f248086, "HSW IOAT Ch4" }, 173e974f91cSConrad Meyer { 0x2f258086, "HSW IOAT Ch5" }, 174e974f91cSConrad Meyer { 0x2f268086, "HSW IOAT Ch6" }, 175e974f91cSConrad Meyer { 0x2f278086, "HSW IOAT Ch7" }, 176e974f91cSConrad Meyer { 0x2f2e8086, "HSW IOAT Ch0 (RAID)" }, 177e974f91cSConrad Meyer { 0x2f2f8086, "HSW IOAT Ch1 (RAID)" }, 178e974f91cSConrad Meyer 179e974f91cSConrad Meyer { 0x0c508086, "BWD IOAT Ch0" }, 180e974f91cSConrad Meyer { 0x0c518086, "BWD IOAT Ch1" }, 181e974f91cSConrad Meyer { 0x0c528086, "BWD IOAT Ch2" }, 182e974f91cSConrad Meyer { 0x0c538086, "BWD IOAT Ch3" }, 183e974f91cSConrad Meyer 184e974f91cSConrad Meyer { 0x6f508086, "BDXDE IOAT Ch0" }, 185e974f91cSConrad Meyer { 0x6f518086, "BDXDE IOAT Ch1" }, 186e974f91cSConrad Meyer { 0x6f528086, "BDXDE IOAT Ch2" }, 187e974f91cSConrad Meyer { 0x6f538086, "BDXDE IOAT Ch3" }, 188e974f91cSConrad Meyer 189e974f91cSConrad Meyer { 0x00000000, NULL } 190e974f91cSConrad Meyer }; 191e974f91cSConrad Meyer 192e974f91cSConrad Meyer /* 193e974f91cSConrad Meyer * OS <-> Driver linkage functions 194e974f91cSConrad Meyer */ 195e974f91cSConrad Meyer static int 196e974f91cSConrad Meyer ioat_probe(device_t device) 197e974f91cSConrad Meyer { 198e974f91cSConrad Meyer struct _pcsid *ep; 199e974f91cSConrad Meyer u_int32_t type; 200e974f91cSConrad Meyer 201e974f91cSConrad Meyer type = pci_get_devid(device); 202e974f91cSConrad Meyer for (ep = pci_ids; ep->type; ep++) { 203e974f91cSConrad Meyer if (ep->type == type) { 204e974f91cSConrad Meyer device_set_desc(device, ep->desc); 205e974f91cSConrad Meyer return (0); 206e974f91cSConrad Meyer } 207e974f91cSConrad Meyer } 208e974f91cSConrad Meyer return (ENXIO); 209e974f91cSConrad Meyer } 210e974f91cSConrad Meyer 211e974f91cSConrad Meyer static int 212e974f91cSConrad Meyer ioat_attach(device_t device) 213e974f91cSConrad Meyer { 214e974f91cSConrad Meyer struct ioat_softc *ioat; 215e974f91cSConrad Meyer int error; 216e974f91cSConrad Meyer 217e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 218e974f91cSConrad Meyer ioat->device = device; 219e974f91cSConrad Meyer 220e974f91cSConrad Meyer error = ioat_map_pci_bar(ioat); 221e974f91cSConrad Meyer if (error != 0) 222e974f91cSConrad Meyer goto err; 223e974f91cSConrad Meyer 224e974f91cSConrad Meyer ioat->version = ioat_read_cbver(ioat); 225e974f91cSConrad Meyer if (ioat->version < IOAT_VER_3_0) { 226e974f91cSConrad Meyer error = ENODEV; 227e974f91cSConrad Meyer goto err; 228e974f91cSConrad Meyer } 229e974f91cSConrad Meyer 230*4253ea50SConrad Meyer error = ioat_setup_intr(ioat); 231*4253ea50SConrad Meyer if (error != 0) 232*4253ea50SConrad Meyer return (error); 233*4253ea50SConrad Meyer 234e974f91cSConrad Meyer error = ioat3_attach(device); 235e974f91cSConrad Meyer if (error != 0) 236e974f91cSConrad Meyer goto err; 237e974f91cSConrad Meyer 238e974f91cSConrad Meyer error = pci_enable_busmaster(device); 239e974f91cSConrad Meyer if (error != 0) 240e974f91cSConrad Meyer goto err; 241e974f91cSConrad Meyer 242e974f91cSConrad Meyer ioat_channel[ioat_channel_index++] = ioat; 243e974f91cSConrad Meyer 244e974f91cSConrad Meyer err: 245e974f91cSConrad Meyer if (error != 0) 246e974f91cSConrad Meyer ioat_detach(device); 247e974f91cSConrad Meyer return (error); 248e974f91cSConrad Meyer } 249e974f91cSConrad Meyer 250e974f91cSConrad Meyer static int 251e974f91cSConrad Meyer ioat_detach(device_t device) 252e974f91cSConrad Meyer { 253e974f91cSConrad Meyer struct ioat_softc *ioat; 254e974f91cSConrad Meyer uint32_t i; 255e974f91cSConrad Meyer 256e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 257e974f91cSConrad Meyer callout_drain(&ioat->timer); 258e974f91cSConrad Meyer 259e974f91cSConrad Meyer pci_disable_busmaster(device); 260e974f91cSConrad Meyer 261e974f91cSConrad Meyer if (ioat->pci_resource != NULL) 262e974f91cSConrad Meyer bus_release_resource(device, SYS_RES_MEMORY, 263e974f91cSConrad Meyer ioat->pci_resource_id, ioat->pci_resource); 264e974f91cSConrad Meyer 265e974f91cSConrad Meyer if (ioat->ring != NULL) { 266e974f91cSConrad Meyer for (i = 0; i < (1 << ioat->ring_size_order); i++) 267e974f91cSConrad Meyer ioat_free_ring_entry(ioat, ioat->ring[i]); 268e974f91cSConrad Meyer free(ioat->ring, M_IOAT); 269e974f91cSConrad Meyer } 270e974f91cSConrad Meyer 271e974f91cSConrad Meyer if (ioat->comp_update != NULL) { 272e974f91cSConrad Meyer bus_dmamap_unload(ioat->comp_update_tag, ioat->comp_update_map); 273e974f91cSConrad Meyer bus_dmamem_free(ioat->comp_update_tag, ioat->comp_update, 274e974f91cSConrad Meyer ioat->comp_update_map); 275e974f91cSConrad Meyer bus_dma_tag_destroy(ioat->comp_update_tag); 276e974f91cSConrad Meyer } 277e974f91cSConrad Meyer 278e974f91cSConrad Meyer bus_dma_tag_destroy(ioat->hw_desc_tag); 279e974f91cSConrad Meyer 280*4253ea50SConrad Meyer ioat_teardown_intr(ioat); 281*4253ea50SConrad Meyer 282*4253ea50SConrad Meyer return (0); 283*4253ea50SConrad Meyer } 284*4253ea50SConrad Meyer 285*4253ea50SConrad Meyer static int 286*4253ea50SConrad Meyer ioat_teardown_intr(struct ioat_softc *ioat) 287*4253ea50SConrad Meyer { 288*4253ea50SConrad Meyer 289e974f91cSConrad Meyer if (ioat->tag != NULL) 290*4253ea50SConrad Meyer bus_teardown_intr(ioat->device, ioat->res, ioat->tag); 291e974f91cSConrad Meyer 292e974f91cSConrad Meyer if (ioat->res != NULL) 293*4253ea50SConrad Meyer bus_release_resource(ioat->device, SYS_RES_IRQ, 294e974f91cSConrad Meyer rman_get_rid(ioat->res), ioat->res); 295e974f91cSConrad Meyer 296*4253ea50SConrad Meyer pci_release_msi(ioat->device); 297e974f91cSConrad Meyer return (0); 298e974f91cSConrad Meyer } 299e974f91cSConrad Meyer 300e974f91cSConrad Meyer static int 301e974f91cSConrad Meyer ioat3_selftest(struct ioat_softc *ioat) 302e974f91cSConrad Meyer { 303e974f91cSConrad Meyer uint64_t status; 304e974f91cSConrad Meyer uint32_t chanerr; 305e974f91cSConrad Meyer int i; 306e974f91cSConrad Meyer 307e974f91cSConrad Meyer ioat_acquire(&ioat->dmaengine); 308e974f91cSConrad Meyer ioat_null(&ioat->dmaengine, NULL, NULL, 0); 309e974f91cSConrad Meyer ioat_release(&ioat->dmaengine); 310e974f91cSConrad Meyer 311e974f91cSConrad Meyer for (i = 0; i < 100; i++) { 312e974f91cSConrad Meyer DELAY(1); 313e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 314e974f91cSConrad Meyer if (is_ioat_idle(status)) 315e974f91cSConrad Meyer return (0); 316e974f91cSConrad Meyer } 317e974f91cSConrad Meyer 318e974f91cSConrad Meyer chanerr = ioat_read_4(ioat, IOAT_CHANERR_OFFSET); 319e974f91cSConrad Meyer ioat_log_message(0, "could not start channel: " 320e974f91cSConrad Meyer "status = %#jx error = %x\n", (uintmax_t)status, chanerr); 321e974f91cSConrad Meyer return (ENXIO); 322e974f91cSConrad Meyer } 323e974f91cSConrad Meyer 324e974f91cSConrad Meyer /* 325e974f91cSConrad Meyer * Initialize Hardware 326e974f91cSConrad Meyer */ 327e974f91cSConrad Meyer static int 328e974f91cSConrad Meyer ioat3_attach(device_t device) 329e974f91cSConrad Meyer { 330e974f91cSConrad Meyer struct ioat_softc *ioat; 331e974f91cSConrad Meyer struct ioat_descriptor **ring; 332e974f91cSConrad Meyer struct ioat_descriptor *next; 333e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *dma_hw_desc; 334e974f91cSConrad Meyer uint32_t capabilities; 335e974f91cSConrad Meyer int i, num_descriptors; 336e974f91cSConrad Meyer int error; 337e974f91cSConrad Meyer uint8_t xfercap; 338e974f91cSConrad Meyer 339e974f91cSConrad Meyer error = 0; 340e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 341e974f91cSConrad Meyer capabilities = ioat_read_dmacapability(ioat); 342e974f91cSConrad Meyer 343e974f91cSConrad Meyer xfercap = ioat_read_xfercap(ioat); 344e974f91cSConrad Meyer 345e974f91cSConrad Meyer /* Only bits [4:0] are valid. */ 346e974f91cSConrad Meyer xfercap &= 0x1f; 347e974f91cSConrad Meyer ioat->max_xfer_size = 1 << xfercap; 348e974f91cSConrad Meyer 349e974f91cSConrad Meyer /* TODO: need to check DCA here if we ever do XOR/PQ */ 350e974f91cSConrad Meyer 351e974f91cSConrad Meyer mtx_init(&ioat->submit_lock, "ioat_submit", NULL, MTX_DEF); 352e974f91cSConrad Meyer mtx_init(&ioat->cleanup_lock, "ioat_process_events", NULL, MTX_DEF); 353e974f91cSConrad Meyer callout_init(&ioat->timer, CALLOUT_MPSAFE); 354e974f91cSConrad Meyer 355e974f91cSConrad Meyer ioat->is_resize_pending = FALSE; 356e974f91cSConrad Meyer ioat->is_completion_pending = FALSE; 357e974f91cSConrad Meyer ioat->is_reset_pending = FALSE; 358e974f91cSConrad Meyer ioat->is_channel_running = FALSE; 359e974f91cSConrad Meyer ioat->is_waiting_for_ack = FALSE; 360e974f91cSConrad Meyer 361e974f91cSConrad Meyer bus_dma_tag_create(bus_get_dma_tag(ioat->device), sizeof(uint64_t), 0x0, 362e974f91cSConrad Meyer BUS_SPACE_MAXADDR, BUS_SPACE_MAXADDR, NULL, NULL, 363e974f91cSConrad Meyer sizeof(uint64_t), 1, sizeof(uint64_t), 0, NULL, NULL, 364e974f91cSConrad Meyer &ioat->comp_update_tag); 365e974f91cSConrad Meyer 366e974f91cSConrad Meyer error = bus_dmamem_alloc(ioat->comp_update_tag, 367e974f91cSConrad Meyer (void **)&ioat->comp_update, BUS_DMA_ZERO, &ioat->comp_update_map); 368e974f91cSConrad Meyer if (ioat->comp_update == NULL) 369e974f91cSConrad Meyer return (ENOMEM); 370e974f91cSConrad Meyer 371e974f91cSConrad Meyer error = bus_dmamap_load(ioat->comp_update_tag, ioat->comp_update_map, 372e974f91cSConrad Meyer ioat->comp_update, sizeof(uint64_t), ioat_comp_update_map, ioat, 373e974f91cSConrad Meyer 0); 374e974f91cSConrad Meyer if (error != 0) 375e974f91cSConrad Meyer return (error); 376e974f91cSConrad Meyer 377e974f91cSConrad Meyer ioat->ring_size_order = IOAT_MIN_ORDER; 378e974f91cSConrad Meyer 379e974f91cSConrad Meyer num_descriptors = 1 << ioat->ring_size_order; 380e974f91cSConrad Meyer 381e974f91cSConrad Meyer bus_dma_tag_create(bus_get_dma_tag(ioat->device), 0x40, 0x0, 382e974f91cSConrad Meyer BUS_SPACE_MAXADDR, BUS_SPACE_MAXADDR, NULL, NULL, 383e974f91cSConrad Meyer sizeof(struct ioat_dma_hw_descriptor), 1, 384e974f91cSConrad Meyer sizeof(struct ioat_dma_hw_descriptor), 0, NULL, NULL, 385e974f91cSConrad Meyer &ioat->hw_desc_tag); 386e974f91cSConrad Meyer 387e974f91cSConrad Meyer ioat->ring = malloc(num_descriptors * sizeof(*ring), M_IOAT, 388e974f91cSConrad Meyer M_ZERO | M_NOWAIT); 389e974f91cSConrad Meyer if (ioat->ring == NULL) 390e974f91cSConrad Meyer return (ENOMEM); 391e974f91cSConrad Meyer 392e974f91cSConrad Meyer ring = ioat->ring; 393e974f91cSConrad Meyer for (i = 0; i < num_descriptors; i++) { 394e974f91cSConrad Meyer ring[i] = ioat_alloc_ring_entry(ioat); 395e974f91cSConrad Meyer if (ring[i] == NULL) 396e974f91cSConrad Meyer return (ENOMEM); 397e974f91cSConrad Meyer 398e974f91cSConrad Meyer ring[i]->id = i; 399e974f91cSConrad Meyer } 400e974f91cSConrad Meyer 401e974f91cSConrad Meyer for (i = 0; i < num_descriptors - 1; i++) { 402e974f91cSConrad Meyer next = ring[i + 1]; 403e974f91cSConrad Meyer dma_hw_desc = ring[i]->u.dma; 404e974f91cSConrad Meyer 405e974f91cSConrad Meyer dma_hw_desc->next = next->hw_desc_bus_addr; 406e974f91cSConrad Meyer } 407e974f91cSConrad Meyer 408e974f91cSConrad Meyer ring[i]->u.dma->next = ring[0]->hw_desc_bus_addr; 409e974f91cSConrad Meyer 410e974f91cSConrad Meyer ioat->head = 0; 411e974f91cSConrad Meyer ioat->tail = 0; 412e974f91cSConrad Meyer ioat->last_seen = 0; 413e974f91cSConrad Meyer 414e974f91cSConrad Meyer error = ioat_reset_hw(ioat); 415e974f91cSConrad Meyer if (error != 0) 416e974f91cSConrad Meyer return (error); 417e974f91cSConrad Meyer 418e974f91cSConrad Meyer ioat_write_chanctrl(ioat, IOAT_CHANCTRL_RUN); 419e974f91cSConrad Meyer ioat_write_chancmp(ioat, ioat->comp_update_bus_addr); 420e974f91cSConrad Meyer ioat_write_chainaddr(ioat, ring[0]->hw_desc_bus_addr); 421e974f91cSConrad Meyer 422e974f91cSConrad Meyer error = ioat3_selftest(ioat); 423e974f91cSConrad Meyer if (error != 0) 424e974f91cSConrad Meyer return (error); 425e974f91cSConrad Meyer 426e974f91cSConrad Meyer ioat_process_events(ioat); 427e974f91cSConrad Meyer ioat_setup_sysctl(device); 428e974f91cSConrad Meyer return (0); 429e974f91cSConrad Meyer } 430e974f91cSConrad Meyer 431e974f91cSConrad Meyer static int 432e974f91cSConrad Meyer ioat_map_pci_bar(struct ioat_softc *ioat) 433e974f91cSConrad Meyer { 434e974f91cSConrad Meyer 435e974f91cSConrad Meyer ioat->pci_resource_id = PCIR_BAR(0); 436e974f91cSConrad Meyer ioat->pci_resource = bus_alloc_resource(ioat->device, SYS_RES_MEMORY, 437e974f91cSConrad Meyer &ioat->pci_resource_id, 0, ~0, 1, RF_ACTIVE); 438e974f91cSConrad Meyer 439e974f91cSConrad Meyer if (ioat->pci_resource == NULL) { 440e974f91cSConrad Meyer ioat_log_message(0, "unable to allocate pci resource\n"); 441e974f91cSConrad Meyer return (ENODEV); 442e974f91cSConrad Meyer } 443e974f91cSConrad Meyer 444e974f91cSConrad Meyer ioat->pci_bus_tag = rman_get_bustag(ioat->pci_resource); 445e974f91cSConrad Meyer ioat->pci_bus_handle = rman_get_bushandle(ioat->pci_resource); 446e974f91cSConrad Meyer return (0); 447e974f91cSConrad Meyer } 448e974f91cSConrad Meyer 449e974f91cSConrad Meyer static void 450e974f91cSConrad Meyer ioat_comp_update_map(void *arg, bus_dma_segment_t *seg, int nseg, int error) 451e974f91cSConrad Meyer { 452e974f91cSConrad Meyer struct ioat_softc *ioat = arg; 453e974f91cSConrad Meyer 454e974f91cSConrad Meyer ioat->comp_update_bus_addr = seg[0].ds_addr; 455e974f91cSConrad Meyer } 456e974f91cSConrad Meyer 457e974f91cSConrad Meyer static void 458e974f91cSConrad Meyer ioat_dmamap_cb(void *arg, bus_dma_segment_t *segs, int nseg, int error) 459e974f91cSConrad Meyer { 460e974f91cSConrad Meyer bus_addr_t *baddr; 461e974f91cSConrad Meyer 462e974f91cSConrad Meyer baddr = arg; 463e974f91cSConrad Meyer *baddr = segs->ds_addr; 464e974f91cSConrad Meyer } 465e974f91cSConrad Meyer 466e974f91cSConrad Meyer /* 467e974f91cSConrad Meyer * Interrupt setup and handlers 468e974f91cSConrad Meyer */ 469e974f91cSConrad Meyer static int 470*4253ea50SConrad Meyer ioat_setup_intr(struct ioat_softc *ioat) 471e974f91cSConrad Meyer { 472e974f91cSConrad Meyer uint32_t num_vectors; 473e974f91cSConrad Meyer int error; 474e974f91cSConrad Meyer boolean_t use_msix; 475e974f91cSConrad Meyer boolean_t force_legacy_interrupts; 476e974f91cSConrad Meyer 477e974f91cSConrad Meyer use_msix = FALSE; 478e974f91cSConrad Meyer force_legacy_interrupts = FALSE; 479e974f91cSConrad Meyer 480e974f91cSConrad Meyer if (!g_force_legacy_interrupts && pci_msix_count(ioat->device) >= 1) { 481e974f91cSConrad Meyer num_vectors = 1; 482e974f91cSConrad Meyer pci_alloc_msix(ioat->device, &num_vectors); 483e974f91cSConrad Meyer if (num_vectors == 1) 484e974f91cSConrad Meyer use_msix = TRUE; 485e974f91cSConrad Meyer } 486e974f91cSConrad Meyer 487e974f91cSConrad Meyer if (use_msix) { 488e974f91cSConrad Meyer ioat->rid = 1; 489e974f91cSConrad Meyer ioat->res = bus_alloc_resource_any(ioat->device, SYS_RES_IRQ, 490e974f91cSConrad Meyer &ioat->rid, RF_ACTIVE); 491e974f91cSConrad Meyer } else { 492e974f91cSConrad Meyer ioat->rid = 0; 493e974f91cSConrad Meyer ioat->res = bus_alloc_resource_any(ioat->device, SYS_RES_IRQ, 494e974f91cSConrad Meyer &ioat->rid, RF_SHAREABLE | RF_ACTIVE); 495e974f91cSConrad Meyer } 496e974f91cSConrad Meyer if (ioat->res == NULL) { 497e974f91cSConrad Meyer ioat_log_message(0, "bus_alloc_resource failed\n"); 498e974f91cSConrad Meyer return (ENOMEM); 499e974f91cSConrad Meyer } 500e974f91cSConrad Meyer 501e974f91cSConrad Meyer ioat->tag = NULL; 502e974f91cSConrad Meyer error = bus_setup_intr(ioat->device, ioat->res, INTR_MPSAFE | 503e974f91cSConrad Meyer INTR_TYPE_MISC, NULL, ioat_interrupt_handler, ioat, &ioat->tag); 504e974f91cSConrad Meyer if (error != 0) { 505e974f91cSConrad Meyer ioat_log_message(0, "bus_setup_intr failed\n"); 506e974f91cSConrad Meyer return (error); 507e974f91cSConrad Meyer } 508e974f91cSConrad Meyer 509e974f91cSConrad Meyer ioat_write_intrctrl(ioat, IOAT_INTRCTRL_MASTER_INT_EN); 510e974f91cSConrad Meyer return (0); 511e974f91cSConrad Meyer } 512e974f91cSConrad Meyer 513*4253ea50SConrad Meyer static boolean_t 514*4253ea50SConrad Meyer ioat_is_bdxde(struct ioat_softc *ioat) 515*4253ea50SConrad Meyer { 516*4253ea50SConrad Meyer u_int32_t pciid; 517*4253ea50SConrad Meyer 518*4253ea50SConrad Meyer pciid = pci_get_devid(ioat->device); 519*4253ea50SConrad Meyer switch (pciid) { 520*4253ea50SConrad Meyer case 0x6f508086: 521*4253ea50SConrad Meyer case 0x6f518086: 522*4253ea50SConrad Meyer case 0x6f528086: 523*4253ea50SConrad Meyer case 0x6f538086: 524*4253ea50SConrad Meyer return (TRUE); 525*4253ea50SConrad Meyer } 526*4253ea50SConrad Meyer 527*4253ea50SConrad Meyer return (FALSE); 528*4253ea50SConrad Meyer } 529*4253ea50SConrad Meyer 530e974f91cSConrad Meyer static void 531e974f91cSConrad Meyer ioat_interrupt_handler(void *arg) 532e974f91cSConrad Meyer { 533e974f91cSConrad Meyer struct ioat_softc *ioat = arg; 534e974f91cSConrad Meyer 535e974f91cSConrad Meyer ioat_process_events(ioat); 536e974f91cSConrad Meyer } 537e974f91cSConrad Meyer 538e974f91cSConrad Meyer static void 539e974f91cSConrad Meyer ioat_process_events(struct ioat_softc *ioat) 540e974f91cSConrad Meyer { 541e974f91cSConrad Meyer struct ioat_descriptor *desc; 542e974f91cSConrad Meyer struct bus_dmadesc *dmadesc; 543e974f91cSConrad Meyer uint64_t comp_update, status; 544e974f91cSConrad Meyer uint32_t completed; 545e974f91cSConrad Meyer 546e974f91cSConrad Meyer mtx_lock(&ioat->cleanup_lock); 547e974f91cSConrad Meyer 548e974f91cSConrad Meyer completed = 0; 549e974f91cSConrad Meyer comp_update = *ioat->comp_update; 550e974f91cSConrad Meyer status = comp_update & IOAT_CHANSTS_COMPLETED_DESCRIPTOR_MASK; 551e974f91cSConrad Meyer 552e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 553e974f91cSConrad Meyer 554e974f91cSConrad Meyer if (status == ioat->last_seen) { 555e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 556e974f91cSConrad Meyer return; 557e974f91cSConrad Meyer } 558e974f91cSConrad Meyer 559e974f91cSConrad Meyer while (1) { 560e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->tail); 561e974f91cSConrad Meyer dmadesc = &desc->bus_dmadesc; 562e974f91cSConrad Meyer ioat_log_message(3, "completing desc %d\n", ioat->tail); 563e974f91cSConrad Meyer 564e974f91cSConrad Meyer if (dmadesc->callback_fn) 565e974f91cSConrad Meyer (*dmadesc->callback_fn)(dmadesc->callback_arg); 566e974f91cSConrad Meyer 567e974f91cSConrad Meyer ioat->tail++; 568e974f91cSConrad Meyer if (desc->hw_desc_bus_addr == status) 569e974f91cSConrad Meyer break; 570e974f91cSConrad Meyer } 571e974f91cSConrad Meyer 572e974f91cSConrad Meyer ioat->last_seen = desc->hw_desc_bus_addr; 573e974f91cSConrad Meyer 574e974f91cSConrad Meyer if (ioat->head == ioat->tail) { 575e974f91cSConrad Meyer ioat->is_completion_pending = FALSE; 576e974f91cSConrad Meyer callout_reset(&ioat->timer, 5 * hz, ioat_timer_callback, ioat); 577e974f91cSConrad Meyer } 578e974f91cSConrad Meyer 579e974f91cSConrad Meyer ioat_write_chanctrl(ioat, IOAT_CHANCTRL_RUN); 580e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 581e974f91cSConrad Meyer } 582e974f91cSConrad Meyer 583e974f91cSConrad Meyer /* 584e974f91cSConrad Meyer * User API functions 585e974f91cSConrad Meyer */ 586e974f91cSConrad Meyer bus_dmaengine_t 587e974f91cSConrad Meyer ioat_get_dmaengine(uint32_t index) 588e974f91cSConrad Meyer { 589e974f91cSConrad Meyer 590e974f91cSConrad Meyer if (index < ioat_channel_index) 591e974f91cSConrad Meyer return (&ioat_channel[index]->dmaengine); 592e974f91cSConrad Meyer return (NULL); 593e974f91cSConrad Meyer } 594e974f91cSConrad Meyer 595e974f91cSConrad Meyer void 596e974f91cSConrad Meyer ioat_acquire(bus_dmaengine_t dmaengine) 597e974f91cSConrad Meyer { 598e974f91cSConrad Meyer struct ioat_softc *ioat; 599e974f91cSConrad Meyer 600e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 601e974f91cSConrad Meyer mtx_lock(&ioat->submit_lock); 602e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 603e974f91cSConrad Meyer } 604e974f91cSConrad Meyer 605e974f91cSConrad Meyer void 606e974f91cSConrad Meyer ioat_release(bus_dmaengine_t dmaengine) 607e974f91cSConrad Meyer { 608e974f91cSConrad Meyer struct ioat_softc *ioat; 609e974f91cSConrad Meyer 610e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 611e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 612e974f91cSConrad Meyer ioat_write_2(ioat, IOAT_DMACOUNT_OFFSET, (uint16_t)ioat->head); 613e974f91cSConrad Meyer mtx_unlock(&ioat->submit_lock); 614e974f91cSConrad Meyer } 615e974f91cSConrad Meyer 616e974f91cSConrad Meyer struct bus_dmadesc * 617e974f91cSConrad Meyer ioat_null(bus_dmaengine_t dmaengine, bus_dmaengine_callback_t callback_fn, 618e974f91cSConrad Meyer void *callback_arg, uint32_t flags) 619e974f91cSConrad Meyer { 620e974f91cSConrad Meyer struct ioat_softc *ioat; 621e974f91cSConrad Meyer struct ioat_descriptor *desc; 622e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw_desc; 623e974f91cSConrad Meyer 624e974f91cSConrad Meyer KASSERT((flags & ~DMA_ALL_FLAGS) == 0, ("Unrecognized flag(s): %#x", 625e974f91cSConrad Meyer flags & ~DMA_ALL_FLAGS)); 626e974f91cSConrad Meyer 627e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 628e974f91cSConrad Meyer 629e974f91cSConrad Meyer if (ioat_reserve_space_and_lock(ioat, 1) != 0) 630e974f91cSConrad Meyer return (NULL); 631e974f91cSConrad Meyer 632e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 633e974f91cSConrad Meyer 634e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->head); 635e974f91cSConrad Meyer hw_desc = desc->u.dma; 636e974f91cSConrad Meyer 637e974f91cSConrad Meyer hw_desc->u.control_raw = 0; 638e974f91cSConrad Meyer hw_desc->u.control.null = 1; 639e974f91cSConrad Meyer hw_desc->u.control.completion_update = 1; 640e974f91cSConrad Meyer 641e974f91cSConrad Meyer if ((flags & DMA_INT_EN) != 0) 642e974f91cSConrad Meyer hw_desc->u.control.int_enable = 1; 643e974f91cSConrad Meyer 644e974f91cSConrad Meyer hw_desc->size = 8; 645e974f91cSConrad Meyer hw_desc->src_addr = 0; 646e974f91cSConrad Meyer hw_desc->dest_addr = 0; 647e974f91cSConrad Meyer 648e974f91cSConrad Meyer desc->bus_dmadesc.callback_fn = callback_fn; 649e974f91cSConrad Meyer desc->bus_dmadesc.callback_arg = callback_arg; 650e974f91cSConrad Meyer 651e974f91cSConrad Meyer ioat_submit_single(ioat); 652e974f91cSConrad Meyer return (&desc->bus_dmadesc); 653e974f91cSConrad Meyer } 654e974f91cSConrad Meyer 655e974f91cSConrad Meyer struct bus_dmadesc * 656e974f91cSConrad Meyer ioat_copy(bus_dmaengine_t dmaengine, bus_addr_t dst, 657e974f91cSConrad Meyer bus_addr_t src, bus_size_t len, bus_dmaengine_callback_t callback_fn, 658e974f91cSConrad Meyer void *callback_arg, uint32_t flags) 659e974f91cSConrad Meyer { 660e974f91cSConrad Meyer struct ioat_descriptor *desc; 661e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw_desc; 662e974f91cSConrad Meyer struct ioat_softc *ioat; 663e974f91cSConrad Meyer 664e974f91cSConrad Meyer KASSERT((flags & ~DMA_ALL_FLAGS) == 0, ("Unrecognized flag(s): %#x", 665e974f91cSConrad Meyer flags & ~DMA_ALL_FLAGS)); 666e974f91cSConrad Meyer 667e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 668e974f91cSConrad Meyer 669e974f91cSConrad Meyer if (len > ioat->max_xfer_size) { 670e974f91cSConrad Meyer ioat_log_message(0, "%s: max_xfer_size = %d, requested = %d\n", 671e974f91cSConrad Meyer __func__, ioat->max_xfer_size, (int)len); 672e974f91cSConrad Meyer return (NULL); 673e974f91cSConrad Meyer } 674e974f91cSConrad Meyer 675e974f91cSConrad Meyer if (ioat_reserve_space_and_lock(ioat, 1) != 0) 676e974f91cSConrad Meyer return (NULL); 677e974f91cSConrad Meyer 678e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 679e974f91cSConrad Meyer 680e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->head); 681e974f91cSConrad Meyer hw_desc = desc->u.dma; 682e974f91cSConrad Meyer 683e974f91cSConrad Meyer hw_desc->u.control_raw = 0; 684e974f91cSConrad Meyer hw_desc->u.control.completion_update = 1; 685e974f91cSConrad Meyer 686e974f91cSConrad Meyer if ((flags & DMA_INT_EN) != 0) 687e974f91cSConrad Meyer hw_desc->u.control.int_enable = 1; 688e974f91cSConrad Meyer 689e974f91cSConrad Meyer hw_desc->size = len; 690e974f91cSConrad Meyer hw_desc->src_addr = src; 691e974f91cSConrad Meyer hw_desc->dest_addr = dst; 692e974f91cSConrad Meyer 693e974f91cSConrad Meyer if (g_ioat_debug_level >= 3) 694e974f91cSConrad Meyer dump_descriptor(hw_desc); 695e974f91cSConrad Meyer 696e974f91cSConrad Meyer desc->bus_dmadesc.callback_fn = callback_fn; 697e974f91cSConrad Meyer desc->bus_dmadesc.callback_arg = callback_arg; 698e974f91cSConrad Meyer 699e974f91cSConrad Meyer ioat_submit_single(ioat); 700e974f91cSConrad Meyer return (&desc->bus_dmadesc); 701e974f91cSConrad Meyer } 702e974f91cSConrad Meyer 703e974f91cSConrad Meyer /* 704e974f91cSConrad Meyer * Ring Management 705e974f91cSConrad Meyer */ 706e974f91cSConrad Meyer static inline uint32_t 707e974f91cSConrad Meyer ioat_get_active(struct ioat_softc *ioat) 708e974f91cSConrad Meyer { 709e974f91cSConrad Meyer 710e974f91cSConrad Meyer return ((ioat->head - ioat->tail) & ((1 << ioat->ring_size_order) - 1)); 711e974f91cSConrad Meyer } 712e974f91cSConrad Meyer 713e974f91cSConrad Meyer static inline uint32_t 714e974f91cSConrad Meyer ioat_get_ring_space(struct ioat_softc *ioat) 715e974f91cSConrad Meyer { 716e974f91cSConrad Meyer 717e974f91cSConrad Meyer return ((1 << ioat->ring_size_order) - ioat_get_active(ioat) - 1); 718e974f91cSConrad Meyer } 719e974f91cSConrad Meyer 720e974f91cSConrad Meyer static struct ioat_descriptor * 721e974f91cSConrad Meyer ioat_alloc_ring_entry(struct ioat_softc *ioat) 722e974f91cSConrad Meyer { 723e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw_desc; 724e974f91cSConrad Meyer struct ioat_descriptor *desc; 725e974f91cSConrad Meyer 726e974f91cSConrad Meyer desc = malloc(sizeof(struct ioat_descriptor), M_IOAT, M_NOWAIT); 727e974f91cSConrad Meyer if (desc == NULL) 728e974f91cSConrad Meyer return (NULL); 729e974f91cSConrad Meyer 730e974f91cSConrad Meyer bus_dmamem_alloc(ioat->hw_desc_tag, (void **)&hw_desc, BUS_DMA_ZERO, 731e974f91cSConrad Meyer &ioat->hw_desc_map); 732e974f91cSConrad Meyer if (hw_desc == NULL) { 733e974f91cSConrad Meyer free(desc, M_IOAT); 734e974f91cSConrad Meyer return (NULL); 735e974f91cSConrad Meyer } 736e974f91cSConrad Meyer 737e974f91cSConrad Meyer bus_dmamap_load(ioat->hw_desc_tag, ioat->hw_desc_map, hw_desc, 738e974f91cSConrad Meyer sizeof(*hw_desc), ioat_dmamap_cb, &desc->hw_desc_bus_addr, 0); 739e974f91cSConrad Meyer 740e974f91cSConrad Meyer desc->u.dma = hw_desc; 741e974f91cSConrad Meyer return (desc); 742e974f91cSConrad Meyer } 743e974f91cSConrad Meyer 744e974f91cSConrad Meyer static void 745e974f91cSConrad Meyer ioat_free_ring_entry(struct ioat_softc *ioat, struct ioat_descriptor *desc) 746e974f91cSConrad Meyer { 747e974f91cSConrad Meyer 748e974f91cSConrad Meyer if (desc == NULL) 749e974f91cSConrad Meyer return; 750e974f91cSConrad Meyer 751e974f91cSConrad Meyer if (desc->u.dma) 752e974f91cSConrad Meyer bus_dmamem_free(ioat->hw_desc_tag, desc->u.dma, 753e974f91cSConrad Meyer ioat->hw_desc_map); 754e974f91cSConrad Meyer free(desc, M_IOAT); 755e974f91cSConrad Meyer } 756e974f91cSConrad Meyer 757e974f91cSConrad Meyer static int 758e974f91cSConrad Meyer ioat_reserve_space_and_lock(struct ioat_softc *ioat, int num_descs) 759e974f91cSConrad Meyer { 760e974f91cSConrad Meyer boolean_t retry; 761e974f91cSConrad Meyer 762e974f91cSConrad Meyer while (1) { 763e974f91cSConrad Meyer if (ioat_get_ring_space(ioat) >= num_descs) 764e974f91cSConrad Meyer return (0); 765e974f91cSConrad Meyer 766e974f91cSConrad Meyer mtx_lock(&ioat->cleanup_lock); 767e974f91cSConrad Meyer retry = resize_ring(ioat, ioat->ring_size_order + 1); 768e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 769e974f91cSConrad Meyer 770e974f91cSConrad Meyer if (!retry) 771e974f91cSConrad Meyer return (ENOMEM); 772e974f91cSConrad Meyer } 773e974f91cSConrad Meyer } 774e974f91cSConrad Meyer 775e974f91cSConrad Meyer static struct ioat_descriptor * 776e974f91cSConrad Meyer ioat_get_ring_entry(struct ioat_softc *ioat, uint32_t index) 777e974f91cSConrad Meyer { 778e974f91cSConrad Meyer 779e974f91cSConrad Meyer return (ioat->ring[index % (1 << ioat->ring_size_order)]); 780e974f91cSConrad Meyer } 781e974f91cSConrad Meyer 782e974f91cSConrad Meyer static boolean_t 783e974f91cSConrad Meyer resize_ring(struct ioat_softc *ioat, int order) 784e974f91cSConrad Meyer { 785e974f91cSConrad Meyer struct ioat_descriptor **ring; 786e974f91cSConrad Meyer struct ioat_descriptor *next; 787e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw; 788e974f91cSConrad Meyer struct ioat_descriptor *ent; 789e974f91cSConrad Meyer uint32_t current_size, active, new_size, i, new_idx, current_idx; 790e974f91cSConrad Meyer uint32_t new_idx2; 791e974f91cSConrad Meyer 792e974f91cSConrad Meyer current_size = 1 << ioat->ring_size_order; 793e974f91cSConrad Meyer active = (ioat->head - ioat->tail) & (current_size - 1); 794e974f91cSConrad Meyer new_size = 1 << order; 795e974f91cSConrad Meyer 796e974f91cSConrad Meyer if (order > IOAT_MAX_ORDER) 797e974f91cSConrad Meyer return (FALSE); 798e974f91cSConrad Meyer 799e974f91cSConrad Meyer /* 800e974f91cSConrad Meyer * when shrinking, verify that we can hold the current active 801e974f91cSConrad Meyer * set in the new ring 802e974f91cSConrad Meyer */ 803e974f91cSConrad Meyer if (active >= new_size) 804e974f91cSConrad Meyer return (FALSE); 805e974f91cSConrad Meyer 806e974f91cSConrad Meyer /* allocate the array to hold the software ring */ 807e974f91cSConrad Meyer ring = malloc(new_size * sizeof(*ring), M_IOAT, M_ZERO | M_NOWAIT); 808e974f91cSConrad Meyer if (ring == NULL) 809e974f91cSConrad Meyer return (FALSE); 810e974f91cSConrad Meyer 811e974f91cSConrad Meyer ioat_log_message(2, "ring resize: new: %d old: %d\n", 812e974f91cSConrad Meyer new_size, current_size); 813e974f91cSConrad Meyer 814e974f91cSConrad Meyer /* allocate/trim descriptors as needed */ 815e974f91cSConrad Meyer if (new_size > current_size) { 816e974f91cSConrad Meyer /* copy current descriptors to the new ring */ 817e974f91cSConrad Meyer for (i = 0; i < current_size; i++) { 818e974f91cSConrad Meyer current_idx = (ioat->tail + i) & (current_size - 1); 819e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 820e974f91cSConrad Meyer 821e974f91cSConrad Meyer ring[new_idx] = ioat->ring[current_idx]; 822e974f91cSConrad Meyer ring[new_idx]->id = new_idx; 823e974f91cSConrad Meyer } 824e974f91cSConrad Meyer 825e974f91cSConrad Meyer /* add new descriptors to the ring */ 826e974f91cSConrad Meyer for (i = current_size; i < new_size; i++) { 827e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 828e974f91cSConrad Meyer 829e974f91cSConrad Meyer ring[new_idx] = ioat_alloc_ring_entry(ioat); 8308c8e8487SConrad Meyer if (ring[new_idx] == NULL) { 831e974f91cSConrad Meyer while (i--) { 832e974f91cSConrad Meyer new_idx2 = (ioat->tail + i) & 833e974f91cSConrad Meyer (new_size - 1); 834e974f91cSConrad Meyer 835e974f91cSConrad Meyer ioat_free_ring_entry(ioat, 836e974f91cSConrad Meyer ring[new_idx2]); 837e974f91cSConrad Meyer } 838e974f91cSConrad Meyer free(ring, M_IOAT); 839e974f91cSConrad Meyer return (FALSE); 840e974f91cSConrad Meyer } 841e974f91cSConrad Meyer ring[new_idx]->id = new_idx; 842e974f91cSConrad Meyer } 843e974f91cSConrad Meyer 844e974f91cSConrad Meyer for (i = current_size - 1; i < new_size; i++) { 845e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 846e974f91cSConrad Meyer next = ring[(new_idx + 1) & (new_size - 1)]; 847e974f91cSConrad Meyer hw = ring[new_idx]->u.dma; 848e974f91cSConrad Meyer 849e974f91cSConrad Meyer hw->next = next->hw_desc_bus_addr; 850e974f91cSConrad Meyer } 851e974f91cSConrad Meyer } else { 852e974f91cSConrad Meyer /* 853e974f91cSConrad Meyer * copy current descriptors to the new ring, dropping the 854e974f91cSConrad Meyer * removed descriptors 855e974f91cSConrad Meyer */ 856e974f91cSConrad Meyer for (i = 0; i < new_size; i++) { 857e974f91cSConrad Meyer current_idx = (ioat->tail + i) & (current_size - 1); 858e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 859e974f91cSConrad Meyer 860e974f91cSConrad Meyer ring[new_idx] = ioat->ring[current_idx]; 861e974f91cSConrad Meyer ring[new_idx]->id = new_idx; 862e974f91cSConrad Meyer } 863e974f91cSConrad Meyer 864e974f91cSConrad Meyer /* free deleted descriptors */ 865e974f91cSConrad Meyer for (i = new_size; i < current_size; i++) { 866e974f91cSConrad Meyer ent = ioat_get_ring_entry(ioat, ioat->tail + i); 867e974f91cSConrad Meyer ioat_free_ring_entry(ioat, ent); 868e974f91cSConrad Meyer } 869e974f91cSConrad Meyer 870e974f91cSConrad Meyer /* fix up hardware ring */ 871e974f91cSConrad Meyer hw = ring[(ioat->tail + new_size - 1) & (new_size - 1)]->u.dma; 872e974f91cSConrad Meyer next = ring[(ioat->tail + new_size) & (new_size - 1)]; 873e974f91cSConrad Meyer hw->next = next->hw_desc_bus_addr; 874e974f91cSConrad Meyer } 875e974f91cSConrad Meyer 876e974f91cSConrad Meyer free(ioat->ring, M_IOAT); 877e974f91cSConrad Meyer ioat->ring = ring; 878e974f91cSConrad Meyer ioat->ring_size_order = order; 879e974f91cSConrad Meyer 880e974f91cSConrad Meyer return (TRUE); 881e974f91cSConrad Meyer } 882e974f91cSConrad Meyer 883e974f91cSConrad Meyer static void 884e974f91cSConrad Meyer ioat_timer_callback(void *arg) 885e974f91cSConrad Meyer { 886e974f91cSConrad Meyer struct ioat_descriptor *desc; 887e974f91cSConrad Meyer struct ioat_softc *ioat; 888e974f91cSConrad Meyer uint64_t status; 889e974f91cSConrad Meyer uint32_t chanerr; 890e974f91cSConrad Meyer 891e974f91cSConrad Meyer ioat = arg; 892e974f91cSConrad Meyer ioat_log_message(2, "%s\n", __func__); 893e974f91cSConrad Meyer 894e974f91cSConrad Meyer if (ioat->is_completion_pending) { 895e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 896e974f91cSConrad Meyer 897e974f91cSConrad Meyer /* 898e974f91cSConrad Meyer * When halted due to errors, check for channel programming 899e974f91cSConrad Meyer * errors before advancing the completion state. 900e974f91cSConrad Meyer */ 901e974f91cSConrad Meyer if (is_ioat_halted(status)) { 902e974f91cSConrad Meyer chanerr = ioat_read_4(ioat, IOAT_CHANERR_OFFSET); 903e974f91cSConrad Meyer ioat_log_message(0, "Channel halted (%x)\n", chanerr); 904e974f91cSConrad Meyer 905e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->tail + 0); 906e974f91cSConrad Meyer dump_descriptor(desc->u.raw); 907e974f91cSConrad Meyer 908e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->tail + 1); 909e974f91cSConrad Meyer dump_descriptor(desc->u.raw); 910e974f91cSConrad Meyer } 911e974f91cSConrad Meyer ioat_process_events(ioat); 912e974f91cSConrad Meyer } else { 913e974f91cSConrad Meyer mtx_lock(&ioat->submit_lock); 914e974f91cSConrad Meyer mtx_lock(&ioat->cleanup_lock); 915e974f91cSConrad Meyer 916e974f91cSConrad Meyer if (ioat_get_active(ioat) == 0 && 917e974f91cSConrad Meyer ioat->ring_size_order > IOAT_MIN_ORDER) 918e974f91cSConrad Meyer resize_ring(ioat, ioat->ring_size_order - 1); 919e974f91cSConrad Meyer 920e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 921e974f91cSConrad Meyer mtx_unlock(&ioat->submit_lock); 922e974f91cSConrad Meyer 923e974f91cSConrad Meyer if (ioat->ring_size_order > IOAT_MIN_ORDER) 924e974f91cSConrad Meyer callout_reset(&ioat->timer, 5 * hz, 925e974f91cSConrad Meyer ioat_timer_callback, ioat); 926e974f91cSConrad Meyer } 927e974f91cSConrad Meyer } 928e974f91cSConrad Meyer 929e974f91cSConrad Meyer /* 930e974f91cSConrad Meyer * Support Functions 931e974f91cSConrad Meyer */ 932e974f91cSConrad Meyer static void 933e974f91cSConrad Meyer ioat_submit_single(struct ioat_softc *ioat) 934e974f91cSConrad Meyer { 935e974f91cSConrad Meyer 936e974f91cSConrad Meyer atomic_add_rel_int(&ioat->head, 1); 937e974f91cSConrad Meyer 938e974f91cSConrad Meyer if (!ioat->is_completion_pending) { 939e974f91cSConrad Meyer ioat->is_completion_pending = TRUE; 940e974f91cSConrad Meyer callout_reset(&ioat->timer, 10 * hz, ioat_timer_callback, 941e974f91cSConrad Meyer ioat); 942e974f91cSConrad Meyer } 943e974f91cSConrad Meyer } 944e974f91cSConrad Meyer 945e974f91cSConrad Meyer static int 946e974f91cSConrad Meyer ioat_reset_hw(struct ioat_softc *ioat) 947e974f91cSConrad Meyer { 948e974f91cSConrad Meyer uint64_t status; 949e974f91cSConrad Meyer uint32_t chanerr; 950*4253ea50SConrad Meyer int timeout, error; 951e974f91cSConrad Meyer 952e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 953e974f91cSConrad Meyer if (is_ioat_active(status) || is_ioat_idle(status)) 954e974f91cSConrad Meyer ioat_suspend(ioat); 955e974f91cSConrad Meyer 956e974f91cSConrad Meyer /* Wait at most 20 ms */ 957e974f91cSConrad Meyer for (timeout = 0; (is_ioat_active(status) || is_ioat_idle(status)) && 958e974f91cSConrad Meyer timeout < 20; timeout++) { 959e974f91cSConrad Meyer DELAY(1000); 960e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 961e974f91cSConrad Meyer } 962e974f91cSConrad Meyer if (timeout == 20) 963e974f91cSConrad Meyer return (ETIMEDOUT); 964e974f91cSConrad Meyer 965e974f91cSConrad Meyer chanerr = ioat_read_4(ioat, IOAT_CHANERR_OFFSET); 966e974f91cSConrad Meyer ioat_write_4(ioat, IOAT_CHANERR_OFFSET, chanerr); 967e974f91cSConrad Meyer 968e974f91cSConrad Meyer /* 969e974f91cSConrad Meyer * IOAT v3 workaround - CHANERRMSK_INT with 3E07h to masks out errors 970e974f91cSConrad Meyer * that can cause stability issues for IOAT v3. 971e974f91cSConrad Meyer */ 972e974f91cSConrad Meyer pci_write_config(ioat->device, IOAT_CFG_CHANERRMASK_INT_OFFSET, 0x3e07, 973e974f91cSConrad Meyer 4); 974e974f91cSConrad Meyer chanerr = pci_read_config(ioat->device, IOAT_CFG_CHANERR_INT_OFFSET, 4); 975e974f91cSConrad Meyer pci_write_config(ioat->device, IOAT_CFG_CHANERR_INT_OFFSET, chanerr, 4); 976e974f91cSConrad Meyer 977e974f91cSConrad Meyer ioat_reset(ioat); 978e974f91cSConrad Meyer 979e974f91cSConrad Meyer /* Wait at most 20 ms */ 980e974f91cSConrad Meyer for (timeout = 0; ioat_reset_pending(ioat) && timeout < 20; timeout++) 981e974f91cSConrad Meyer DELAY(1000); 982e974f91cSConrad Meyer if (timeout == 20) 983e974f91cSConrad Meyer return (ETIMEDOUT); 984e974f91cSConrad Meyer 985*4253ea50SConrad Meyer /* 986*4253ea50SConrad Meyer * BDXDE models reset MSI-X registers on device reset. We must 987*4253ea50SConrad Meyer * teardown and re-setup interrupts. 988*4253ea50SConrad Meyer */ 989*4253ea50SConrad Meyer if (ioat_is_bdxde(ioat)) { 990*4253ea50SConrad Meyer error = ioat_teardown_intr(ioat); 991*4253ea50SConrad Meyer if (error) 992*4253ea50SConrad Meyer return (error); 993*4253ea50SConrad Meyer 994*4253ea50SConrad Meyer error = ioat_setup_intr(ioat); 995*4253ea50SConrad Meyer if (error) 996*4253ea50SConrad Meyer return (error); 997*4253ea50SConrad Meyer } 998*4253ea50SConrad Meyer 999e974f91cSConrad Meyer return (0); 1000e974f91cSConrad Meyer } 1001e974f91cSConrad Meyer 1002e974f91cSConrad Meyer static void 1003e974f91cSConrad Meyer dump_descriptor(void *hw_desc) 1004e974f91cSConrad Meyer { 1005e974f91cSConrad Meyer int i, j; 1006e974f91cSConrad Meyer 1007e974f91cSConrad Meyer for (i = 0; i < 2; i++) { 1008e974f91cSConrad Meyer for (j = 0; j < 8; j++) 1009e974f91cSConrad Meyer printf("%08x ", ((uint32_t *)hw_desc)[i * 8 + j]); 1010e974f91cSConrad Meyer printf("\n"); 1011e974f91cSConrad Meyer } 1012e974f91cSConrad Meyer } 1013e974f91cSConrad Meyer 1014e974f91cSConrad Meyer static void 1015e974f91cSConrad Meyer ioat_setup_sysctl(device_t device) 1016e974f91cSConrad Meyer { 1017e974f91cSConrad Meyer struct sysctl_ctx_list *sysctl_ctx; 1018e974f91cSConrad Meyer struct sysctl_oid *sysctl_tree; 1019e974f91cSConrad Meyer struct ioat_softc *ioat; 1020e974f91cSConrad Meyer 1021e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 1022e974f91cSConrad Meyer sysctl_ctx = device_get_sysctl_ctx(device); 1023e974f91cSConrad Meyer sysctl_tree = device_get_sysctl_tree(device); 1024e974f91cSConrad Meyer 1025e974f91cSConrad Meyer SYSCTL_ADD_UINT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree), OID_AUTO, 1026e974f91cSConrad Meyer "ring_size_order", CTLFLAG_RD, &ioat->ring_size_order, 1027e974f91cSConrad Meyer 0, "HW descriptor ring size order"); 1028e974f91cSConrad Meyer SYSCTL_ADD_UINT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree), OID_AUTO, 1029e974f91cSConrad Meyer "head", CTLFLAG_RD, &ioat->head, 1030e974f91cSConrad Meyer 0, "HW descriptor head pointer index"); 1031e974f91cSConrad Meyer SYSCTL_ADD_UINT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree), OID_AUTO, 1032e974f91cSConrad Meyer "tail", CTLFLAG_RD, &ioat->tail, 1033e974f91cSConrad Meyer 0, "HW descriptor tail pointer index"); 1034e974f91cSConrad Meyer } 1035e974f91cSConrad Meyer 1036e974f91cSConrad Meyer void 1037e974f91cSConrad Meyer ioat_log_message(int verbosity, char *fmt, ...) 1038e974f91cSConrad Meyer { 1039e974f91cSConrad Meyer va_list argp; 1040e974f91cSConrad Meyer char buffer[512]; 1041e974f91cSConrad Meyer struct timeval tv; 1042e974f91cSConrad Meyer 1043e974f91cSConrad Meyer if (verbosity > g_ioat_debug_level) 1044e974f91cSConrad Meyer return; 1045e974f91cSConrad Meyer 1046e974f91cSConrad Meyer va_start(argp, fmt); 1047e974f91cSConrad Meyer vsnprintf(buffer, sizeof(buffer) - 1, fmt, argp); 1048e974f91cSConrad Meyer va_end(argp); 1049e974f91cSConrad Meyer microuptime(&tv); 1050e974f91cSConrad Meyer 1051e974f91cSConrad Meyer printf("[%d:%06d] ioat: %s", (int)tv.tv_sec, (int)tv.tv_usec, buffer); 1052e974f91cSConrad Meyer } 1053