1e974f91cSConrad Meyer /*- 2e974f91cSConrad Meyer * Copyright (C) 2012 Intel Corporation 3e974f91cSConrad Meyer * All rights reserved. 4e974f91cSConrad Meyer * 5e974f91cSConrad Meyer * Redistribution and use in source and binary forms, with or without 6e974f91cSConrad Meyer * modification, are permitted provided that the following conditions 7e974f91cSConrad Meyer * are met: 8e974f91cSConrad Meyer * 1. Redistributions of source code must retain the above copyright 9e974f91cSConrad Meyer * notice, this list of conditions and the following disclaimer. 10e974f91cSConrad Meyer * 2. Redistributions in binary form must reproduce the above copyright 11e974f91cSConrad Meyer * notice, this list of conditions and the following disclaimer in the 12e974f91cSConrad Meyer * documentation and/or other materials provided with the distribution. 13e974f91cSConrad Meyer * 14e974f91cSConrad Meyer * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 15e974f91cSConrad Meyer * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16e974f91cSConrad Meyer * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 17e974f91cSConrad Meyer * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 18e974f91cSConrad Meyer * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19e974f91cSConrad Meyer * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20e974f91cSConrad Meyer * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21e974f91cSConrad Meyer * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22e974f91cSConrad Meyer * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23e974f91cSConrad Meyer * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24e974f91cSConrad Meyer * SUCH DAMAGE. 25e974f91cSConrad Meyer */ 26e974f91cSConrad Meyer 27e974f91cSConrad Meyer #include <sys/cdefs.h> 28e974f91cSConrad Meyer __FBSDID("$FreeBSD$"); 29e974f91cSConrad Meyer 30e974f91cSConrad Meyer #include <sys/param.h> 31e974f91cSConrad Meyer #include <sys/systm.h> 32e974f91cSConrad Meyer #include <sys/bus.h> 33e974f91cSConrad Meyer #include <sys/conf.h> 34e974f91cSConrad Meyer #include <sys/ioccom.h> 35e974f91cSConrad Meyer #include <sys/kernel.h> 36e974f91cSConrad Meyer #include <sys/lock.h> 37e974f91cSConrad Meyer #include <sys/malloc.h> 38e974f91cSConrad Meyer #include <sys/module.h> 39e974f91cSConrad Meyer #include <sys/mutex.h> 40e974f91cSConrad Meyer #include <sys/rman.h> 41e974f91cSConrad Meyer #include <sys/sysctl.h> 42e974f91cSConrad Meyer #include <sys/time.h> 43e974f91cSConrad Meyer #include <dev/pci/pcireg.h> 44e974f91cSConrad Meyer #include <dev/pci/pcivar.h> 45e974f91cSConrad Meyer #include <machine/bus.h> 46e974f91cSConrad Meyer #include <machine/resource.h> 47e974f91cSConrad Meyer #include <machine/stdarg.h> 48e974f91cSConrad Meyer 49e974f91cSConrad Meyer #include "ioat.h" 50e974f91cSConrad Meyer #include "ioat_hw.h" 51e974f91cSConrad Meyer #include "ioat_internal.h" 52e974f91cSConrad Meyer 53e974f91cSConrad Meyer static int ioat_probe(device_t device); 54e974f91cSConrad Meyer static int ioat_attach(device_t device); 55e974f91cSConrad Meyer static int ioat_detach(device_t device); 564253ea50SConrad Meyer static int ioat_setup_intr(struct ioat_softc *ioat); 574253ea50SConrad Meyer static int ioat_teardown_intr(struct ioat_softc *ioat); 58e974f91cSConrad Meyer static int ioat3_attach(device_t device); 59*7afbb263SConrad Meyer static int ioat3_selftest(struct ioat_softc *ioat); 60e974f91cSConrad Meyer static int ioat_map_pci_bar(struct ioat_softc *ioat); 61e974f91cSConrad Meyer static void ioat_dmamap_cb(void *arg, bus_dma_segment_t *segs, int nseg, 62e974f91cSConrad Meyer int error); 63e974f91cSConrad Meyer static void ioat_interrupt_handler(void *arg); 640d1a05d9SConrad Meyer static boolean_t ioat_model_resets_msix(struct ioat_softc *ioat); 65e974f91cSConrad Meyer static void ioat_process_events(struct ioat_softc *ioat); 66e974f91cSConrad Meyer static inline uint32_t ioat_get_active(struct ioat_softc *ioat); 67e974f91cSConrad Meyer static inline uint32_t ioat_get_ring_space(struct ioat_softc *ioat); 68e974f91cSConrad Meyer static void ioat_free_ring_entry(struct ioat_softc *ioat, 69e974f91cSConrad Meyer struct ioat_descriptor *desc); 70e974f91cSConrad Meyer static struct ioat_descriptor * ioat_alloc_ring_entry(struct ioat_softc *ioat); 71e974f91cSConrad Meyer static int ioat_reserve_space_and_lock(struct ioat_softc *ioat, int num_descs); 72e974f91cSConrad Meyer static struct ioat_descriptor * ioat_get_ring_entry(struct ioat_softc *ioat, 73e974f91cSConrad Meyer uint32_t index); 74e974f91cSConrad Meyer static boolean_t resize_ring(struct ioat_softc *ioat, int order); 75e974f91cSConrad Meyer static void ioat_timer_callback(void *arg); 76e974f91cSConrad Meyer static void dump_descriptor(void *hw_desc); 77e974f91cSConrad Meyer static void ioat_submit_single(struct ioat_softc *ioat); 78e974f91cSConrad Meyer static void ioat_comp_update_map(void *arg, bus_dma_segment_t *seg, int nseg, 79e974f91cSConrad Meyer int error); 80e974f91cSConrad Meyer static int ioat_reset_hw(struct ioat_softc *ioat); 81e974f91cSConrad Meyer static void ioat_setup_sysctl(device_t device); 82e974f91cSConrad Meyer 83e974f91cSConrad Meyer MALLOC_DEFINE(M_IOAT, "ioat", "ioat driver memory allocations"); 84e974f91cSConrad Meyer SYSCTL_NODE(_hw, OID_AUTO, ioat, CTLFLAG_RD, 0, "ioat node"); 85e974f91cSConrad Meyer 86e974f91cSConrad Meyer static int g_force_legacy_interrupts; 87e974f91cSConrad Meyer SYSCTL_INT(_hw_ioat, OID_AUTO, force_legacy_interrupts, CTLFLAG_RDTUN, 88e974f91cSConrad Meyer &g_force_legacy_interrupts, 0, "Set to non-zero to force MSI-X disabled"); 89e974f91cSConrad Meyer 90e974f91cSConrad Meyer static int g_ioat_debug_level = 0; 91e974f91cSConrad Meyer SYSCTL_INT(_hw_ioat, OID_AUTO, debug_level, CTLFLAG_RWTUN, &g_ioat_debug_level, 92e974f91cSConrad Meyer 0, "Set log level (0-3) for ioat(4). Higher is more verbose."); 93e974f91cSConrad Meyer 94e974f91cSConrad Meyer /* 95e974f91cSConrad Meyer * OS <-> Driver interface structures 96e974f91cSConrad Meyer */ 97e974f91cSConrad Meyer static device_method_t ioat_pci_methods[] = { 98e974f91cSConrad Meyer /* Device interface */ 99e974f91cSConrad Meyer DEVMETHOD(device_probe, ioat_probe), 100e974f91cSConrad Meyer DEVMETHOD(device_attach, ioat_attach), 101e974f91cSConrad Meyer DEVMETHOD(device_detach, ioat_detach), 102e974f91cSConrad Meyer { 0, 0 } 103e974f91cSConrad Meyer }; 104e974f91cSConrad Meyer 105e974f91cSConrad Meyer static driver_t ioat_pci_driver = { 106e974f91cSConrad Meyer "ioat", 107e974f91cSConrad Meyer ioat_pci_methods, 108e974f91cSConrad Meyer sizeof(struct ioat_softc), 109e974f91cSConrad Meyer }; 110e974f91cSConrad Meyer 111e974f91cSConrad Meyer static devclass_t ioat_devclass; 112e974f91cSConrad Meyer DRIVER_MODULE(ioat, pci, ioat_pci_driver, ioat_devclass, 0, 0); 113e974f91cSConrad Meyer 114e974f91cSConrad Meyer /* 115e974f91cSConrad Meyer * Private data structures 116e974f91cSConrad Meyer */ 117e974f91cSConrad Meyer static struct ioat_softc *ioat_channel[IOAT_MAX_CHANNELS]; 118e974f91cSConrad Meyer static int ioat_channel_index = 0; 119e974f91cSConrad Meyer SYSCTL_INT(_hw_ioat, OID_AUTO, channels, CTLFLAG_RD, &ioat_channel_index, 0, 120e974f91cSConrad Meyer "Number of IOAT channels attached"); 121e974f91cSConrad Meyer 122e974f91cSConrad Meyer static struct _pcsid 123e974f91cSConrad Meyer { 124e974f91cSConrad Meyer u_int32_t type; 125e974f91cSConrad Meyer const char *desc; 126e974f91cSConrad Meyer } pci_ids[] = { 127e974f91cSConrad Meyer { 0x34308086, "TBG IOAT Ch0" }, 128e974f91cSConrad Meyer { 0x34318086, "TBG IOAT Ch1" }, 129e974f91cSConrad Meyer { 0x34328086, "TBG IOAT Ch2" }, 130e974f91cSConrad Meyer { 0x34338086, "TBG IOAT Ch3" }, 131e974f91cSConrad Meyer { 0x34298086, "TBG IOAT Ch4" }, 132e974f91cSConrad Meyer { 0x342a8086, "TBG IOAT Ch5" }, 133e974f91cSConrad Meyer { 0x342b8086, "TBG IOAT Ch6" }, 134e974f91cSConrad Meyer { 0x342c8086, "TBG IOAT Ch7" }, 135e974f91cSConrad Meyer 136e974f91cSConrad Meyer { 0x37108086, "JSF IOAT Ch0" }, 137e974f91cSConrad Meyer { 0x37118086, "JSF IOAT Ch1" }, 138e974f91cSConrad Meyer { 0x37128086, "JSF IOAT Ch2" }, 139e974f91cSConrad Meyer { 0x37138086, "JSF IOAT Ch3" }, 140e974f91cSConrad Meyer { 0x37148086, "JSF IOAT Ch4" }, 141e974f91cSConrad Meyer { 0x37158086, "JSF IOAT Ch5" }, 142e974f91cSConrad Meyer { 0x37168086, "JSF IOAT Ch6" }, 143e974f91cSConrad Meyer { 0x37178086, "JSF IOAT Ch7" }, 144e974f91cSConrad Meyer { 0x37188086, "JSF IOAT Ch0 (RAID)" }, 145e974f91cSConrad Meyer { 0x37198086, "JSF IOAT Ch1 (RAID)" }, 146e974f91cSConrad Meyer 147e974f91cSConrad Meyer { 0x3c208086, "SNB IOAT Ch0" }, 148e974f91cSConrad Meyer { 0x3c218086, "SNB IOAT Ch1" }, 149e974f91cSConrad Meyer { 0x3c228086, "SNB IOAT Ch2" }, 150e974f91cSConrad Meyer { 0x3c238086, "SNB IOAT Ch3" }, 151e974f91cSConrad Meyer { 0x3c248086, "SNB IOAT Ch4" }, 152e974f91cSConrad Meyer { 0x3c258086, "SNB IOAT Ch5" }, 153e974f91cSConrad Meyer { 0x3c268086, "SNB IOAT Ch6" }, 154e974f91cSConrad Meyer { 0x3c278086, "SNB IOAT Ch7" }, 155e974f91cSConrad Meyer { 0x3c2e8086, "SNB IOAT Ch0 (RAID)" }, 156e974f91cSConrad Meyer { 0x3c2f8086, "SNB IOAT Ch1 (RAID)" }, 157e974f91cSConrad Meyer 158e974f91cSConrad Meyer { 0x0e208086, "IVB IOAT Ch0" }, 159e974f91cSConrad Meyer { 0x0e218086, "IVB IOAT Ch1" }, 160e974f91cSConrad Meyer { 0x0e228086, "IVB IOAT Ch2" }, 161e974f91cSConrad Meyer { 0x0e238086, "IVB IOAT Ch3" }, 162e974f91cSConrad Meyer { 0x0e248086, "IVB IOAT Ch4" }, 163e974f91cSConrad Meyer { 0x0e258086, "IVB IOAT Ch5" }, 164e974f91cSConrad Meyer { 0x0e268086, "IVB IOAT Ch6" }, 165e974f91cSConrad Meyer { 0x0e278086, "IVB IOAT Ch7" }, 166e974f91cSConrad Meyer { 0x0e2e8086, "IVB IOAT Ch0 (RAID)" }, 167e974f91cSConrad Meyer { 0x0e2f8086, "IVB IOAT Ch1 (RAID)" }, 168e974f91cSConrad Meyer 169e974f91cSConrad Meyer { 0x2f208086, "HSW IOAT Ch0" }, 170e974f91cSConrad Meyer { 0x2f218086, "HSW IOAT Ch1" }, 171e974f91cSConrad Meyer { 0x2f228086, "HSW IOAT Ch2" }, 172e974f91cSConrad Meyer { 0x2f238086, "HSW IOAT Ch3" }, 173e974f91cSConrad Meyer { 0x2f248086, "HSW IOAT Ch4" }, 174e974f91cSConrad Meyer { 0x2f258086, "HSW IOAT Ch5" }, 175e974f91cSConrad Meyer { 0x2f268086, "HSW IOAT Ch6" }, 176e974f91cSConrad Meyer { 0x2f278086, "HSW IOAT Ch7" }, 177e974f91cSConrad Meyer { 0x2f2e8086, "HSW IOAT Ch0 (RAID)" }, 178e974f91cSConrad Meyer { 0x2f2f8086, "HSW IOAT Ch1 (RAID)" }, 179e974f91cSConrad Meyer 180e974f91cSConrad Meyer { 0x0c508086, "BWD IOAT Ch0" }, 181e974f91cSConrad Meyer { 0x0c518086, "BWD IOAT Ch1" }, 182e974f91cSConrad Meyer { 0x0c528086, "BWD IOAT Ch2" }, 183e974f91cSConrad Meyer { 0x0c538086, "BWD IOAT Ch3" }, 184e974f91cSConrad Meyer 185e974f91cSConrad Meyer { 0x6f508086, "BDXDE IOAT Ch0" }, 186e974f91cSConrad Meyer { 0x6f518086, "BDXDE IOAT Ch1" }, 187e974f91cSConrad Meyer { 0x6f528086, "BDXDE IOAT Ch2" }, 188e974f91cSConrad Meyer { 0x6f538086, "BDXDE IOAT Ch3" }, 189e974f91cSConrad Meyer 190e974f91cSConrad Meyer { 0x00000000, NULL } 191e974f91cSConrad Meyer }; 192e974f91cSConrad Meyer 193e974f91cSConrad Meyer /* 194e974f91cSConrad Meyer * OS <-> Driver linkage functions 195e974f91cSConrad Meyer */ 196e974f91cSConrad Meyer static int 197e974f91cSConrad Meyer ioat_probe(device_t device) 198e974f91cSConrad Meyer { 199e974f91cSConrad Meyer struct _pcsid *ep; 200e974f91cSConrad Meyer u_int32_t type; 201e974f91cSConrad Meyer 202e974f91cSConrad Meyer type = pci_get_devid(device); 203e974f91cSConrad Meyer for (ep = pci_ids; ep->type; ep++) { 204e974f91cSConrad Meyer if (ep->type == type) { 205e974f91cSConrad Meyer device_set_desc(device, ep->desc); 206e974f91cSConrad Meyer return (0); 207e974f91cSConrad Meyer } 208e974f91cSConrad Meyer } 209e974f91cSConrad Meyer return (ENXIO); 210e974f91cSConrad Meyer } 211e974f91cSConrad Meyer 212e974f91cSConrad Meyer static int 213e974f91cSConrad Meyer ioat_attach(device_t device) 214e974f91cSConrad Meyer { 215e974f91cSConrad Meyer struct ioat_softc *ioat; 216e974f91cSConrad Meyer int error; 217e974f91cSConrad Meyer 218e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 219e974f91cSConrad Meyer ioat->device = device; 220e974f91cSConrad Meyer 221e974f91cSConrad Meyer error = ioat_map_pci_bar(ioat); 222e974f91cSConrad Meyer if (error != 0) 223e974f91cSConrad Meyer goto err; 224e974f91cSConrad Meyer 225e974f91cSConrad Meyer ioat->version = ioat_read_cbver(ioat); 226e974f91cSConrad Meyer if (ioat->version < IOAT_VER_3_0) { 227e974f91cSConrad Meyer error = ENODEV; 228e974f91cSConrad Meyer goto err; 229e974f91cSConrad Meyer } 230e974f91cSConrad Meyer 2314253ea50SConrad Meyer error = ioat_setup_intr(ioat); 2324253ea50SConrad Meyer if (error != 0) 2334253ea50SConrad Meyer return (error); 2344253ea50SConrad Meyer 235e974f91cSConrad Meyer error = ioat3_attach(device); 236e974f91cSConrad Meyer if (error != 0) 237e974f91cSConrad Meyer goto err; 238e974f91cSConrad Meyer 239e974f91cSConrad Meyer error = pci_enable_busmaster(device); 240e974f91cSConrad Meyer if (error != 0) 241e974f91cSConrad Meyer goto err; 242e974f91cSConrad Meyer 243*7afbb263SConrad Meyer error = ioat3_selftest(ioat); 244*7afbb263SConrad Meyer if (error != 0) 245*7afbb263SConrad Meyer return (error); 246*7afbb263SConrad Meyer 247*7afbb263SConrad Meyer ioat_process_events(ioat); 248*7afbb263SConrad Meyer ioat_setup_sysctl(device); 249*7afbb263SConrad Meyer 250e974f91cSConrad Meyer ioat_channel[ioat_channel_index++] = ioat; 251*7afbb263SConrad Meyer ioat_test_attach(); 252e974f91cSConrad Meyer 253e974f91cSConrad Meyer err: 254e974f91cSConrad Meyer if (error != 0) 255e974f91cSConrad Meyer ioat_detach(device); 256e974f91cSConrad Meyer return (error); 257e974f91cSConrad Meyer } 258e974f91cSConrad Meyer 259e974f91cSConrad Meyer static int 260e974f91cSConrad Meyer ioat_detach(device_t device) 261e974f91cSConrad Meyer { 262e974f91cSConrad Meyer struct ioat_softc *ioat; 263e974f91cSConrad Meyer uint32_t i; 264e974f91cSConrad Meyer 265e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 266*7afbb263SConrad Meyer 267*7afbb263SConrad Meyer ioat_test_detach(); 268e974f91cSConrad Meyer callout_drain(&ioat->timer); 269e974f91cSConrad Meyer 270e974f91cSConrad Meyer pci_disable_busmaster(device); 271e974f91cSConrad Meyer 272e974f91cSConrad Meyer if (ioat->pci_resource != NULL) 273e974f91cSConrad Meyer bus_release_resource(device, SYS_RES_MEMORY, 274e974f91cSConrad Meyer ioat->pci_resource_id, ioat->pci_resource); 275e974f91cSConrad Meyer 276e974f91cSConrad Meyer if (ioat->ring != NULL) { 277e974f91cSConrad Meyer for (i = 0; i < (1 << ioat->ring_size_order); i++) 278e974f91cSConrad Meyer ioat_free_ring_entry(ioat, ioat->ring[i]); 279e974f91cSConrad Meyer free(ioat->ring, M_IOAT); 280e974f91cSConrad Meyer } 281e974f91cSConrad Meyer 282e974f91cSConrad Meyer if (ioat->comp_update != NULL) { 283e974f91cSConrad Meyer bus_dmamap_unload(ioat->comp_update_tag, ioat->comp_update_map); 284e974f91cSConrad Meyer bus_dmamem_free(ioat->comp_update_tag, ioat->comp_update, 285e974f91cSConrad Meyer ioat->comp_update_map); 286e974f91cSConrad Meyer bus_dma_tag_destroy(ioat->comp_update_tag); 287e974f91cSConrad Meyer } 288e974f91cSConrad Meyer 289e974f91cSConrad Meyer bus_dma_tag_destroy(ioat->hw_desc_tag); 290e974f91cSConrad Meyer 2914253ea50SConrad Meyer ioat_teardown_intr(ioat); 2924253ea50SConrad Meyer 2934253ea50SConrad Meyer return (0); 2944253ea50SConrad Meyer } 2954253ea50SConrad Meyer 2964253ea50SConrad Meyer static int 2974253ea50SConrad Meyer ioat_teardown_intr(struct ioat_softc *ioat) 2984253ea50SConrad Meyer { 2994253ea50SConrad Meyer 300e974f91cSConrad Meyer if (ioat->tag != NULL) 3014253ea50SConrad Meyer bus_teardown_intr(ioat->device, ioat->res, ioat->tag); 302e974f91cSConrad Meyer 303e974f91cSConrad Meyer if (ioat->res != NULL) 3044253ea50SConrad Meyer bus_release_resource(ioat->device, SYS_RES_IRQ, 305e974f91cSConrad Meyer rman_get_rid(ioat->res), ioat->res); 306e974f91cSConrad Meyer 3074253ea50SConrad Meyer pci_release_msi(ioat->device); 308e974f91cSConrad Meyer return (0); 309e974f91cSConrad Meyer } 310e974f91cSConrad Meyer 311e974f91cSConrad Meyer static int 312e974f91cSConrad Meyer ioat3_selftest(struct ioat_softc *ioat) 313e974f91cSConrad Meyer { 314e974f91cSConrad Meyer uint64_t status; 315e974f91cSConrad Meyer uint32_t chanerr; 316e974f91cSConrad Meyer int i; 317e974f91cSConrad Meyer 318e974f91cSConrad Meyer ioat_acquire(&ioat->dmaengine); 319e974f91cSConrad Meyer ioat_null(&ioat->dmaengine, NULL, NULL, 0); 320e974f91cSConrad Meyer ioat_release(&ioat->dmaengine); 321e974f91cSConrad Meyer 322e974f91cSConrad Meyer for (i = 0; i < 100; i++) { 323e974f91cSConrad Meyer DELAY(1); 324e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 325e974f91cSConrad Meyer if (is_ioat_idle(status)) 326e974f91cSConrad Meyer return (0); 327e974f91cSConrad Meyer } 328e974f91cSConrad Meyer 329e974f91cSConrad Meyer chanerr = ioat_read_4(ioat, IOAT_CHANERR_OFFSET); 330e974f91cSConrad Meyer ioat_log_message(0, "could not start channel: " 331e974f91cSConrad Meyer "status = %#jx error = %x\n", (uintmax_t)status, chanerr); 332e974f91cSConrad Meyer return (ENXIO); 333e974f91cSConrad Meyer } 334e974f91cSConrad Meyer 335e974f91cSConrad Meyer /* 336e974f91cSConrad Meyer * Initialize Hardware 337e974f91cSConrad Meyer */ 338e974f91cSConrad Meyer static int 339e974f91cSConrad Meyer ioat3_attach(device_t device) 340e974f91cSConrad Meyer { 341e974f91cSConrad Meyer struct ioat_softc *ioat; 342e974f91cSConrad Meyer struct ioat_descriptor **ring; 343e974f91cSConrad Meyer struct ioat_descriptor *next; 344e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *dma_hw_desc; 345e974f91cSConrad Meyer uint32_t capabilities; 346e974f91cSConrad Meyer int i, num_descriptors; 347e974f91cSConrad Meyer int error; 348e974f91cSConrad Meyer uint8_t xfercap; 349e974f91cSConrad Meyer 350e974f91cSConrad Meyer error = 0; 351e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 352e974f91cSConrad Meyer capabilities = ioat_read_dmacapability(ioat); 353e974f91cSConrad Meyer 354e974f91cSConrad Meyer xfercap = ioat_read_xfercap(ioat); 355e974f91cSConrad Meyer ioat->max_xfer_size = 1 << xfercap; 356e974f91cSConrad Meyer 357e974f91cSConrad Meyer /* TODO: need to check DCA here if we ever do XOR/PQ */ 358e974f91cSConrad Meyer 359e974f91cSConrad Meyer mtx_init(&ioat->submit_lock, "ioat_submit", NULL, MTX_DEF); 360e974f91cSConrad Meyer mtx_init(&ioat->cleanup_lock, "ioat_process_events", NULL, MTX_DEF); 361*7afbb263SConrad Meyer callout_init(&ioat->timer, 1); 362e974f91cSConrad Meyer 363e974f91cSConrad Meyer ioat->is_resize_pending = FALSE; 364e974f91cSConrad Meyer ioat->is_completion_pending = FALSE; 365e974f91cSConrad Meyer ioat->is_reset_pending = FALSE; 366e974f91cSConrad Meyer ioat->is_channel_running = FALSE; 367e974f91cSConrad Meyer ioat->is_waiting_for_ack = FALSE; 368e974f91cSConrad Meyer 369e974f91cSConrad Meyer bus_dma_tag_create(bus_get_dma_tag(ioat->device), sizeof(uint64_t), 0x0, 370e974f91cSConrad Meyer BUS_SPACE_MAXADDR, BUS_SPACE_MAXADDR, NULL, NULL, 371e974f91cSConrad Meyer sizeof(uint64_t), 1, sizeof(uint64_t), 0, NULL, NULL, 372e974f91cSConrad Meyer &ioat->comp_update_tag); 373e974f91cSConrad Meyer 374e974f91cSConrad Meyer error = bus_dmamem_alloc(ioat->comp_update_tag, 375e974f91cSConrad Meyer (void **)&ioat->comp_update, BUS_DMA_ZERO, &ioat->comp_update_map); 376e974f91cSConrad Meyer if (ioat->comp_update == NULL) 377e974f91cSConrad Meyer return (ENOMEM); 378e974f91cSConrad Meyer 379e974f91cSConrad Meyer error = bus_dmamap_load(ioat->comp_update_tag, ioat->comp_update_map, 380e974f91cSConrad Meyer ioat->comp_update, sizeof(uint64_t), ioat_comp_update_map, ioat, 381e974f91cSConrad Meyer 0); 382e974f91cSConrad Meyer if (error != 0) 383e974f91cSConrad Meyer return (error); 384e974f91cSConrad Meyer 385e974f91cSConrad Meyer ioat->ring_size_order = IOAT_MIN_ORDER; 386e974f91cSConrad Meyer 387e974f91cSConrad Meyer num_descriptors = 1 << ioat->ring_size_order; 388e974f91cSConrad Meyer 389e974f91cSConrad Meyer bus_dma_tag_create(bus_get_dma_tag(ioat->device), 0x40, 0x0, 390e974f91cSConrad Meyer BUS_SPACE_MAXADDR, BUS_SPACE_MAXADDR, NULL, NULL, 391e974f91cSConrad Meyer sizeof(struct ioat_dma_hw_descriptor), 1, 392e974f91cSConrad Meyer sizeof(struct ioat_dma_hw_descriptor), 0, NULL, NULL, 393e974f91cSConrad Meyer &ioat->hw_desc_tag); 394e974f91cSConrad Meyer 395e974f91cSConrad Meyer ioat->ring = malloc(num_descriptors * sizeof(*ring), M_IOAT, 396e974f91cSConrad Meyer M_ZERO | M_NOWAIT); 397e974f91cSConrad Meyer if (ioat->ring == NULL) 398e974f91cSConrad Meyer return (ENOMEM); 399e974f91cSConrad Meyer 400e974f91cSConrad Meyer ring = ioat->ring; 401e974f91cSConrad Meyer for (i = 0; i < num_descriptors; i++) { 402e974f91cSConrad Meyer ring[i] = ioat_alloc_ring_entry(ioat); 403e974f91cSConrad Meyer if (ring[i] == NULL) 404e974f91cSConrad Meyer return (ENOMEM); 405e974f91cSConrad Meyer 406e974f91cSConrad Meyer ring[i]->id = i; 407e974f91cSConrad Meyer } 408e974f91cSConrad Meyer 409e974f91cSConrad Meyer for (i = 0; i < num_descriptors - 1; i++) { 410e974f91cSConrad Meyer next = ring[i + 1]; 411e974f91cSConrad Meyer dma_hw_desc = ring[i]->u.dma; 412e974f91cSConrad Meyer 413e974f91cSConrad Meyer dma_hw_desc->next = next->hw_desc_bus_addr; 414e974f91cSConrad Meyer } 415e974f91cSConrad Meyer 416e974f91cSConrad Meyer ring[i]->u.dma->next = ring[0]->hw_desc_bus_addr; 417e974f91cSConrad Meyer 418e974f91cSConrad Meyer ioat->head = 0; 419e974f91cSConrad Meyer ioat->tail = 0; 420e974f91cSConrad Meyer ioat->last_seen = 0; 421e974f91cSConrad Meyer 422e974f91cSConrad Meyer error = ioat_reset_hw(ioat); 423e974f91cSConrad Meyer if (error != 0) 424e974f91cSConrad Meyer return (error); 425e974f91cSConrad Meyer 426e974f91cSConrad Meyer ioat_write_chanctrl(ioat, IOAT_CHANCTRL_RUN); 427e974f91cSConrad Meyer ioat_write_chancmp(ioat, ioat->comp_update_bus_addr); 428e974f91cSConrad Meyer ioat_write_chainaddr(ioat, ring[0]->hw_desc_bus_addr); 429e974f91cSConrad Meyer return (0); 430e974f91cSConrad Meyer } 431e974f91cSConrad Meyer 432e974f91cSConrad Meyer static int 433e974f91cSConrad Meyer ioat_map_pci_bar(struct ioat_softc *ioat) 434e974f91cSConrad Meyer { 435e974f91cSConrad Meyer 436e974f91cSConrad Meyer ioat->pci_resource_id = PCIR_BAR(0); 437e974f91cSConrad Meyer ioat->pci_resource = bus_alloc_resource(ioat->device, SYS_RES_MEMORY, 438e974f91cSConrad Meyer &ioat->pci_resource_id, 0, ~0, 1, RF_ACTIVE); 439e974f91cSConrad Meyer 440e974f91cSConrad Meyer if (ioat->pci_resource == NULL) { 441e974f91cSConrad Meyer ioat_log_message(0, "unable to allocate pci resource\n"); 442e974f91cSConrad Meyer return (ENODEV); 443e974f91cSConrad Meyer } 444e974f91cSConrad Meyer 445e974f91cSConrad Meyer ioat->pci_bus_tag = rman_get_bustag(ioat->pci_resource); 446e974f91cSConrad Meyer ioat->pci_bus_handle = rman_get_bushandle(ioat->pci_resource); 447e974f91cSConrad Meyer return (0); 448e974f91cSConrad Meyer } 449e974f91cSConrad Meyer 450e974f91cSConrad Meyer static void 451e974f91cSConrad Meyer ioat_comp_update_map(void *arg, bus_dma_segment_t *seg, int nseg, int error) 452e974f91cSConrad Meyer { 453e974f91cSConrad Meyer struct ioat_softc *ioat = arg; 454e974f91cSConrad Meyer 455e974f91cSConrad Meyer ioat->comp_update_bus_addr = seg[0].ds_addr; 456e974f91cSConrad Meyer } 457e974f91cSConrad Meyer 458e974f91cSConrad Meyer static void 459e974f91cSConrad Meyer ioat_dmamap_cb(void *arg, bus_dma_segment_t *segs, int nseg, int error) 460e974f91cSConrad Meyer { 461e974f91cSConrad Meyer bus_addr_t *baddr; 462e974f91cSConrad Meyer 463e974f91cSConrad Meyer baddr = arg; 464e974f91cSConrad Meyer *baddr = segs->ds_addr; 465e974f91cSConrad Meyer } 466e974f91cSConrad Meyer 467e974f91cSConrad Meyer /* 468e974f91cSConrad Meyer * Interrupt setup and handlers 469e974f91cSConrad Meyer */ 470e974f91cSConrad Meyer static int 4714253ea50SConrad Meyer ioat_setup_intr(struct ioat_softc *ioat) 472e974f91cSConrad Meyer { 473e974f91cSConrad Meyer uint32_t num_vectors; 474e974f91cSConrad Meyer int error; 475e974f91cSConrad Meyer boolean_t use_msix; 476e974f91cSConrad Meyer boolean_t force_legacy_interrupts; 477e974f91cSConrad Meyer 478e974f91cSConrad Meyer use_msix = FALSE; 479e974f91cSConrad Meyer force_legacy_interrupts = FALSE; 480e974f91cSConrad Meyer 481e974f91cSConrad Meyer if (!g_force_legacy_interrupts && pci_msix_count(ioat->device) >= 1) { 482e974f91cSConrad Meyer num_vectors = 1; 483e974f91cSConrad Meyer pci_alloc_msix(ioat->device, &num_vectors); 484e974f91cSConrad Meyer if (num_vectors == 1) 485e974f91cSConrad Meyer use_msix = TRUE; 486e974f91cSConrad Meyer } 487e974f91cSConrad Meyer 488e974f91cSConrad Meyer if (use_msix) { 489e974f91cSConrad Meyer ioat->rid = 1; 490e974f91cSConrad Meyer ioat->res = bus_alloc_resource_any(ioat->device, SYS_RES_IRQ, 491e974f91cSConrad Meyer &ioat->rid, RF_ACTIVE); 492e974f91cSConrad Meyer } else { 493e974f91cSConrad Meyer ioat->rid = 0; 494e974f91cSConrad Meyer ioat->res = bus_alloc_resource_any(ioat->device, SYS_RES_IRQ, 495e974f91cSConrad Meyer &ioat->rid, RF_SHAREABLE | RF_ACTIVE); 496e974f91cSConrad Meyer } 497e974f91cSConrad Meyer if (ioat->res == NULL) { 498e974f91cSConrad Meyer ioat_log_message(0, "bus_alloc_resource failed\n"); 499e974f91cSConrad Meyer return (ENOMEM); 500e974f91cSConrad Meyer } 501e974f91cSConrad Meyer 502e974f91cSConrad Meyer ioat->tag = NULL; 503e974f91cSConrad Meyer error = bus_setup_intr(ioat->device, ioat->res, INTR_MPSAFE | 504e974f91cSConrad Meyer INTR_TYPE_MISC, NULL, ioat_interrupt_handler, ioat, &ioat->tag); 505e974f91cSConrad Meyer if (error != 0) { 506e974f91cSConrad Meyer ioat_log_message(0, "bus_setup_intr failed\n"); 507e974f91cSConrad Meyer return (error); 508e974f91cSConrad Meyer } 509e974f91cSConrad Meyer 510e974f91cSConrad Meyer ioat_write_intrctrl(ioat, IOAT_INTRCTRL_MASTER_INT_EN); 511e974f91cSConrad Meyer return (0); 512e974f91cSConrad Meyer } 513e974f91cSConrad Meyer 5144253ea50SConrad Meyer static boolean_t 5150d1a05d9SConrad Meyer ioat_model_resets_msix(struct ioat_softc *ioat) 5164253ea50SConrad Meyer { 5174253ea50SConrad Meyer u_int32_t pciid; 5184253ea50SConrad Meyer 5194253ea50SConrad Meyer pciid = pci_get_devid(ioat->device); 5204253ea50SConrad Meyer switch (pciid) { 5210d1a05d9SConrad Meyer /* BWD: */ 5220d1a05d9SConrad Meyer case 0x0c508086: 5230d1a05d9SConrad Meyer case 0x0c518086: 5240d1a05d9SConrad Meyer case 0x0c528086: 5250d1a05d9SConrad Meyer case 0x0c538086: 5260d1a05d9SConrad Meyer /* BDXDE: */ 5274253ea50SConrad Meyer case 0x6f508086: 5284253ea50SConrad Meyer case 0x6f518086: 5294253ea50SConrad Meyer case 0x6f528086: 5304253ea50SConrad Meyer case 0x6f538086: 5314253ea50SConrad Meyer return (TRUE); 5324253ea50SConrad Meyer } 5334253ea50SConrad Meyer 5344253ea50SConrad Meyer return (FALSE); 5354253ea50SConrad Meyer } 5364253ea50SConrad Meyer 537e974f91cSConrad Meyer static void 538e974f91cSConrad Meyer ioat_interrupt_handler(void *arg) 539e974f91cSConrad Meyer { 540e974f91cSConrad Meyer struct ioat_softc *ioat = arg; 541e974f91cSConrad Meyer 542e974f91cSConrad Meyer ioat_process_events(ioat); 543e974f91cSConrad Meyer } 544e974f91cSConrad Meyer 545e974f91cSConrad Meyer static void 546e974f91cSConrad Meyer ioat_process_events(struct ioat_softc *ioat) 547e974f91cSConrad Meyer { 548e974f91cSConrad Meyer struct ioat_descriptor *desc; 549e974f91cSConrad Meyer struct bus_dmadesc *dmadesc; 550e974f91cSConrad Meyer uint64_t comp_update, status; 551e974f91cSConrad Meyer uint32_t completed; 552e974f91cSConrad Meyer 553e974f91cSConrad Meyer mtx_lock(&ioat->cleanup_lock); 554e974f91cSConrad Meyer 555e974f91cSConrad Meyer completed = 0; 556e974f91cSConrad Meyer comp_update = *ioat->comp_update; 557e974f91cSConrad Meyer status = comp_update & IOAT_CHANSTS_COMPLETED_DESCRIPTOR_MASK; 558e974f91cSConrad Meyer 559e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 560e974f91cSConrad Meyer 561e974f91cSConrad Meyer if (status == ioat->last_seen) { 562e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 563e974f91cSConrad Meyer return; 564e974f91cSConrad Meyer } 565e974f91cSConrad Meyer 566e974f91cSConrad Meyer while (1) { 567e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->tail); 568e974f91cSConrad Meyer dmadesc = &desc->bus_dmadesc; 569e974f91cSConrad Meyer ioat_log_message(3, "completing desc %d\n", ioat->tail); 570e974f91cSConrad Meyer 571e974f91cSConrad Meyer if (dmadesc->callback_fn) 572e974f91cSConrad Meyer (*dmadesc->callback_fn)(dmadesc->callback_arg); 573e974f91cSConrad Meyer 574e974f91cSConrad Meyer ioat->tail++; 575e974f91cSConrad Meyer if (desc->hw_desc_bus_addr == status) 576e974f91cSConrad Meyer break; 577e974f91cSConrad Meyer } 578e974f91cSConrad Meyer 579e974f91cSConrad Meyer ioat->last_seen = desc->hw_desc_bus_addr; 580e974f91cSConrad Meyer 581e974f91cSConrad Meyer if (ioat->head == ioat->tail) { 582e974f91cSConrad Meyer ioat->is_completion_pending = FALSE; 583e974f91cSConrad Meyer callout_reset(&ioat->timer, 5 * hz, ioat_timer_callback, ioat); 584e974f91cSConrad Meyer } 585e974f91cSConrad Meyer 586e974f91cSConrad Meyer ioat_write_chanctrl(ioat, IOAT_CHANCTRL_RUN); 587e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 588e974f91cSConrad Meyer } 589e974f91cSConrad Meyer 590e974f91cSConrad Meyer /* 591e974f91cSConrad Meyer * User API functions 592e974f91cSConrad Meyer */ 593e974f91cSConrad Meyer bus_dmaengine_t 594e974f91cSConrad Meyer ioat_get_dmaengine(uint32_t index) 595e974f91cSConrad Meyer { 596e974f91cSConrad Meyer 597e974f91cSConrad Meyer if (index < ioat_channel_index) 598e974f91cSConrad Meyer return (&ioat_channel[index]->dmaengine); 599e974f91cSConrad Meyer return (NULL); 600e974f91cSConrad Meyer } 601e974f91cSConrad Meyer 602e974f91cSConrad Meyer void 603e974f91cSConrad Meyer ioat_acquire(bus_dmaengine_t dmaengine) 604e974f91cSConrad Meyer { 605e974f91cSConrad Meyer struct ioat_softc *ioat; 606e974f91cSConrad Meyer 607e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 608e974f91cSConrad Meyer mtx_lock(&ioat->submit_lock); 609e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 610e974f91cSConrad Meyer } 611e974f91cSConrad Meyer 612e974f91cSConrad Meyer void 613e974f91cSConrad Meyer ioat_release(bus_dmaengine_t dmaengine) 614e974f91cSConrad Meyer { 615e974f91cSConrad Meyer struct ioat_softc *ioat; 616e974f91cSConrad Meyer 617e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 618e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 619e974f91cSConrad Meyer ioat_write_2(ioat, IOAT_DMACOUNT_OFFSET, (uint16_t)ioat->head); 620e974f91cSConrad Meyer mtx_unlock(&ioat->submit_lock); 621e974f91cSConrad Meyer } 622e974f91cSConrad Meyer 623e974f91cSConrad Meyer struct bus_dmadesc * 624e974f91cSConrad Meyer ioat_null(bus_dmaengine_t dmaengine, bus_dmaengine_callback_t callback_fn, 625e974f91cSConrad Meyer void *callback_arg, uint32_t flags) 626e974f91cSConrad Meyer { 627e974f91cSConrad Meyer struct ioat_softc *ioat; 628e974f91cSConrad Meyer struct ioat_descriptor *desc; 629e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw_desc; 630e974f91cSConrad Meyer 631e974f91cSConrad Meyer KASSERT((flags & ~DMA_ALL_FLAGS) == 0, ("Unrecognized flag(s): %#x", 632e974f91cSConrad Meyer flags & ~DMA_ALL_FLAGS)); 633e974f91cSConrad Meyer 634e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 635e974f91cSConrad Meyer 636e974f91cSConrad Meyer if (ioat_reserve_space_and_lock(ioat, 1) != 0) 637e974f91cSConrad Meyer return (NULL); 638e974f91cSConrad Meyer 639e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 640e974f91cSConrad Meyer 641e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->head); 642e974f91cSConrad Meyer hw_desc = desc->u.dma; 643e974f91cSConrad Meyer 644e974f91cSConrad Meyer hw_desc->u.control_raw = 0; 645e974f91cSConrad Meyer hw_desc->u.control.null = 1; 646e974f91cSConrad Meyer hw_desc->u.control.completion_update = 1; 647e974f91cSConrad Meyer 648e974f91cSConrad Meyer if ((flags & DMA_INT_EN) != 0) 649e974f91cSConrad Meyer hw_desc->u.control.int_enable = 1; 650e974f91cSConrad Meyer 651e974f91cSConrad Meyer hw_desc->size = 8; 652e974f91cSConrad Meyer hw_desc->src_addr = 0; 653e974f91cSConrad Meyer hw_desc->dest_addr = 0; 654e974f91cSConrad Meyer 655e974f91cSConrad Meyer desc->bus_dmadesc.callback_fn = callback_fn; 656e974f91cSConrad Meyer desc->bus_dmadesc.callback_arg = callback_arg; 657e974f91cSConrad Meyer 658e974f91cSConrad Meyer ioat_submit_single(ioat); 659e974f91cSConrad Meyer return (&desc->bus_dmadesc); 660e974f91cSConrad Meyer } 661e974f91cSConrad Meyer 662e974f91cSConrad Meyer struct bus_dmadesc * 663e974f91cSConrad Meyer ioat_copy(bus_dmaengine_t dmaengine, bus_addr_t dst, 664e974f91cSConrad Meyer bus_addr_t src, bus_size_t len, bus_dmaengine_callback_t callback_fn, 665e974f91cSConrad Meyer void *callback_arg, uint32_t flags) 666e974f91cSConrad Meyer { 667e974f91cSConrad Meyer struct ioat_descriptor *desc; 668e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw_desc; 669e974f91cSConrad Meyer struct ioat_softc *ioat; 670e974f91cSConrad Meyer 671e974f91cSConrad Meyer KASSERT((flags & ~DMA_ALL_FLAGS) == 0, ("Unrecognized flag(s): %#x", 672e974f91cSConrad Meyer flags & ~DMA_ALL_FLAGS)); 673e974f91cSConrad Meyer 674e974f91cSConrad Meyer ioat = to_ioat_softc(dmaengine); 675e974f91cSConrad Meyer 676e974f91cSConrad Meyer if (len > ioat->max_xfer_size) { 677e974f91cSConrad Meyer ioat_log_message(0, "%s: max_xfer_size = %d, requested = %d\n", 678e974f91cSConrad Meyer __func__, ioat->max_xfer_size, (int)len); 679e974f91cSConrad Meyer return (NULL); 680e974f91cSConrad Meyer } 681e974f91cSConrad Meyer 682e974f91cSConrad Meyer if (ioat_reserve_space_and_lock(ioat, 1) != 0) 683e974f91cSConrad Meyer return (NULL); 684e974f91cSConrad Meyer 685e974f91cSConrad Meyer ioat_log_message(3, "%s\n", __func__); 686e974f91cSConrad Meyer 687e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->head); 688e974f91cSConrad Meyer hw_desc = desc->u.dma; 689e974f91cSConrad Meyer 690e974f91cSConrad Meyer hw_desc->u.control_raw = 0; 691e974f91cSConrad Meyer hw_desc->u.control.completion_update = 1; 692e974f91cSConrad Meyer 693e974f91cSConrad Meyer if ((flags & DMA_INT_EN) != 0) 694e974f91cSConrad Meyer hw_desc->u.control.int_enable = 1; 695e974f91cSConrad Meyer 696e974f91cSConrad Meyer hw_desc->size = len; 697e974f91cSConrad Meyer hw_desc->src_addr = src; 698e974f91cSConrad Meyer hw_desc->dest_addr = dst; 699e974f91cSConrad Meyer 700e974f91cSConrad Meyer if (g_ioat_debug_level >= 3) 701e974f91cSConrad Meyer dump_descriptor(hw_desc); 702e974f91cSConrad Meyer 703e974f91cSConrad Meyer desc->bus_dmadesc.callback_fn = callback_fn; 704e974f91cSConrad Meyer desc->bus_dmadesc.callback_arg = callback_arg; 705e974f91cSConrad Meyer 706e974f91cSConrad Meyer ioat_submit_single(ioat); 707e974f91cSConrad Meyer return (&desc->bus_dmadesc); 708e974f91cSConrad Meyer } 709e974f91cSConrad Meyer 710e974f91cSConrad Meyer /* 711e974f91cSConrad Meyer * Ring Management 712e974f91cSConrad Meyer */ 713e974f91cSConrad Meyer static inline uint32_t 714e974f91cSConrad Meyer ioat_get_active(struct ioat_softc *ioat) 715e974f91cSConrad Meyer { 716e974f91cSConrad Meyer 717e974f91cSConrad Meyer return ((ioat->head - ioat->tail) & ((1 << ioat->ring_size_order) - 1)); 718e974f91cSConrad Meyer } 719e974f91cSConrad Meyer 720e974f91cSConrad Meyer static inline uint32_t 721e974f91cSConrad Meyer ioat_get_ring_space(struct ioat_softc *ioat) 722e974f91cSConrad Meyer { 723e974f91cSConrad Meyer 724e974f91cSConrad Meyer return ((1 << ioat->ring_size_order) - ioat_get_active(ioat) - 1); 725e974f91cSConrad Meyer } 726e974f91cSConrad Meyer 727e974f91cSConrad Meyer static struct ioat_descriptor * 728e974f91cSConrad Meyer ioat_alloc_ring_entry(struct ioat_softc *ioat) 729e974f91cSConrad Meyer { 730e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw_desc; 731e974f91cSConrad Meyer struct ioat_descriptor *desc; 732e974f91cSConrad Meyer 733e974f91cSConrad Meyer desc = malloc(sizeof(struct ioat_descriptor), M_IOAT, M_NOWAIT); 734e974f91cSConrad Meyer if (desc == NULL) 735e974f91cSConrad Meyer return (NULL); 736e974f91cSConrad Meyer 737e974f91cSConrad Meyer bus_dmamem_alloc(ioat->hw_desc_tag, (void **)&hw_desc, BUS_DMA_ZERO, 738e974f91cSConrad Meyer &ioat->hw_desc_map); 739e974f91cSConrad Meyer if (hw_desc == NULL) { 740e974f91cSConrad Meyer free(desc, M_IOAT); 741e974f91cSConrad Meyer return (NULL); 742e974f91cSConrad Meyer } 743e974f91cSConrad Meyer 744e974f91cSConrad Meyer bus_dmamap_load(ioat->hw_desc_tag, ioat->hw_desc_map, hw_desc, 745e974f91cSConrad Meyer sizeof(*hw_desc), ioat_dmamap_cb, &desc->hw_desc_bus_addr, 0); 746e974f91cSConrad Meyer 747e974f91cSConrad Meyer desc->u.dma = hw_desc; 748e974f91cSConrad Meyer return (desc); 749e974f91cSConrad Meyer } 750e974f91cSConrad Meyer 751e974f91cSConrad Meyer static void 752e974f91cSConrad Meyer ioat_free_ring_entry(struct ioat_softc *ioat, struct ioat_descriptor *desc) 753e974f91cSConrad Meyer { 754e974f91cSConrad Meyer 755e974f91cSConrad Meyer if (desc == NULL) 756e974f91cSConrad Meyer return; 757e974f91cSConrad Meyer 758e974f91cSConrad Meyer if (desc->u.dma) 759e974f91cSConrad Meyer bus_dmamem_free(ioat->hw_desc_tag, desc->u.dma, 760e974f91cSConrad Meyer ioat->hw_desc_map); 761e974f91cSConrad Meyer free(desc, M_IOAT); 762e974f91cSConrad Meyer } 763e974f91cSConrad Meyer 764e974f91cSConrad Meyer static int 765e974f91cSConrad Meyer ioat_reserve_space_and_lock(struct ioat_softc *ioat, int num_descs) 766e974f91cSConrad Meyer { 767e974f91cSConrad Meyer boolean_t retry; 768e974f91cSConrad Meyer 769e974f91cSConrad Meyer while (1) { 770e974f91cSConrad Meyer if (ioat_get_ring_space(ioat) >= num_descs) 771e974f91cSConrad Meyer return (0); 772e974f91cSConrad Meyer 773e974f91cSConrad Meyer mtx_lock(&ioat->cleanup_lock); 774e974f91cSConrad Meyer retry = resize_ring(ioat, ioat->ring_size_order + 1); 775e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 776e974f91cSConrad Meyer 777e974f91cSConrad Meyer if (!retry) 778e974f91cSConrad Meyer return (ENOMEM); 779e974f91cSConrad Meyer } 780e974f91cSConrad Meyer } 781e974f91cSConrad Meyer 782e974f91cSConrad Meyer static struct ioat_descriptor * 783e974f91cSConrad Meyer ioat_get_ring_entry(struct ioat_softc *ioat, uint32_t index) 784e974f91cSConrad Meyer { 785e974f91cSConrad Meyer 786e974f91cSConrad Meyer return (ioat->ring[index % (1 << ioat->ring_size_order)]); 787e974f91cSConrad Meyer } 788e974f91cSConrad Meyer 789e974f91cSConrad Meyer static boolean_t 790e974f91cSConrad Meyer resize_ring(struct ioat_softc *ioat, int order) 791e974f91cSConrad Meyer { 792e974f91cSConrad Meyer struct ioat_descriptor **ring; 793e974f91cSConrad Meyer struct ioat_descriptor *next; 794e974f91cSConrad Meyer struct ioat_dma_hw_descriptor *hw; 795e974f91cSConrad Meyer struct ioat_descriptor *ent; 796e974f91cSConrad Meyer uint32_t current_size, active, new_size, i, new_idx, current_idx; 797e974f91cSConrad Meyer uint32_t new_idx2; 798e974f91cSConrad Meyer 799e974f91cSConrad Meyer current_size = 1 << ioat->ring_size_order; 800e974f91cSConrad Meyer active = (ioat->head - ioat->tail) & (current_size - 1); 801e974f91cSConrad Meyer new_size = 1 << order; 802e974f91cSConrad Meyer 803e974f91cSConrad Meyer if (order > IOAT_MAX_ORDER) 804e974f91cSConrad Meyer return (FALSE); 805e974f91cSConrad Meyer 806e974f91cSConrad Meyer /* 807e974f91cSConrad Meyer * when shrinking, verify that we can hold the current active 808e974f91cSConrad Meyer * set in the new ring 809e974f91cSConrad Meyer */ 810e974f91cSConrad Meyer if (active >= new_size) 811e974f91cSConrad Meyer return (FALSE); 812e974f91cSConrad Meyer 813e974f91cSConrad Meyer /* allocate the array to hold the software ring */ 814e974f91cSConrad Meyer ring = malloc(new_size * sizeof(*ring), M_IOAT, M_ZERO | M_NOWAIT); 815e974f91cSConrad Meyer if (ring == NULL) 816e974f91cSConrad Meyer return (FALSE); 817e974f91cSConrad Meyer 818e974f91cSConrad Meyer ioat_log_message(2, "ring resize: new: %d old: %d\n", 819e974f91cSConrad Meyer new_size, current_size); 820e974f91cSConrad Meyer 821e974f91cSConrad Meyer /* allocate/trim descriptors as needed */ 822e974f91cSConrad Meyer if (new_size > current_size) { 823e974f91cSConrad Meyer /* copy current descriptors to the new ring */ 824e974f91cSConrad Meyer for (i = 0; i < current_size; i++) { 825e974f91cSConrad Meyer current_idx = (ioat->tail + i) & (current_size - 1); 826e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 827e974f91cSConrad Meyer 828e974f91cSConrad Meyer ring[new_idx] = ioat->ring[current_idx]; 829e974f91cSConrad Meyer ring[new_idx]->id = new_idx; 830e974f91cSConrad Meyer } 831e974f91cSConrad Meyer 832e974f91cSConrad Meyer /* add new descriptors to the ring */ 833e974f91cSConrad Meyer for (i = current_size; i < new_size; i++) { 834e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 835e974f91cSConrad Meyer 836e974f91cSConrad Meyer ring[new_idx] = ioat_alloc_ring_entry(ioat); 8378c8e8487SConrad Meyer if (ring[new_idx] == NULL) { 838e974f91cSConrad Meyer while (i--) { 839e974f91cSConrad Meyer new_idx2 = (ioat->tail + i) & 840e974f91cSConrad Meyer (new_size - 1); 841e974f91cSConrad Meyer 842e974f91cSConrad Meyer ioat_free_ring_entry(ioat, 843e974f91cSConrad Meyer ring[new_idx2]); 844e974f91cSConrad Meyer } 845e974f91cSConrad Meyer free(ring, M_IOAT); 846e974f91cSConrad Meyer return (FALSE); 847e974f91cSConrad Meyer } 848e974f91cSConrad Meyer ring[new_idx]->id = new_idx; 849e974f91cSConrad Meyer } 850e974f91cSConrad Meyer 851e974f91cSConrad Meyer for (i = current_size - 1; i < new_size; i++) { 852e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 853e974f91cSConrad Meyer next = ring[(new_idx + 1) & (new_size - 1)]; 854e974f91cSConrad Meyer hw = ring[new_idx]->u.dma; 855e974f91cSConrad Meyer 856e974f91cSConrad Meyer hw->next = next->hw_desc_bus_addr; 857e974f91cSConrad Meyer } 858e974f91cSConrad Meyer } else { 859e974f91cSConrad Meyer /* 860e974f91cSConrad Meyer * copy current descriptors to the new ring, dropping the 861e974f91cSConrad Meyer * removed descriptors 862e974f91cSConrad Meyer */ 863e974f91cSConrad Meyer for (i = 0; i < new_size; i++) { 864e974f91cSConrad Meyer current_idx = (ioat->tail + i) & (current_size - 1); 865e974f91cSConrad Meyer new_idx = (ioat->tail + i) & (new_size - 1); 866e974f91cSConrad Meyer 867e974f91cSConrad Meyer ring[new_idx] = ioat->ring[current_idx]; 868e974f91cSConrad Meyer ring[new_idx]->id = new_idx; 869e974f91cSConrad Meyer } 870e974f91cSConrad Meyer 871e974f91cSConrad Meyer /* free deleted descriptors */ 872e974f91cSConrad Meyer for (i = new_size; i < current_size; i++) { 873e974f91cSConrad Meyer ent = ioat_get_ring_entry(ioat, ioat->tail + i); 874e974f91cSConrad Meyer ioat_free_ring_entry(ioat, ent); 875e974f91cSConrad Meyer } 876e974f91cSConrad Meyer 877e974f91cSConrad Meyer /* fix up hardware ring */ 878e974f91cSConrad Meyer hw = ring[(ioat->tail + new_size - 1) & (new_size - 1)]->u.dma; 879e974f91cSConrad Meyer next = ring[(ioat->tail + new_size) & (new_size - 1)]; 880e974f91cSConrad Meyer hw->next = next->hw_desc_bus_addr; 881e974f91cSConrad Meyer } 882e974f91cSConrad Meyer 883e974f91cSConrad Meyer free(ioat->ring, M_IOAT); 884e974f91cSConrad Meyer ioat->ring = ring; 885e974f91cSConrad Meyer ioat->ring_size_order = order; 886e974f91cSConrad Meyer 887e974f91cSConrad Meyer return (TRUE); 888e974f91cSConrad Meyer } 889e974f91cSConrad Meyer 890e974f91cSConrad Meyer static void 891e974f91cSConrad Meyer ioat_timer_callback(void *arg) 892e974f91cSConrad Meyer { 893e974f91cSConrad Meyer struct ioat_descriptor *desc; 894e974f91cSConrad Meyer struct ioat_softc *ioat; 895e974f91cSConrad Meyer uint64_t status; 896e974f91cSConrad Meyer uint32_t chanerr; 897e974f91cSConrad Meyer 898e974f91cSConrad Meyer ioat = arg; 899e974f91cSConrad Meyer ioat_log_message(2, "%s\n", __func__); 900e974f91cSConrad Meyer 901e974f91cSConrad Meyer if (ioat->is_completion_pending) { 902e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 903e974f91cSConrad Meyer 904e974f91cSConrad Meyer /* 905e974f91cSConrad Meyer * When halted due to errors, check for channel programming 906e974f91cSConrad Meyer * errors before advancing the completion state. 907e974f91cSConrad Meyer */ 908e974f91cSConrad Meyer if (is_ioat_halted(status)) { 909e974f91cSConrad Meyer chanerr = ioat_read_4(ioat, IOAT_CHANERR_OFFSET); 910e974f91cSConrad Meyer ioat_log_message(0, "Channel halted (%x)\n", chanerr); 911e974f91cSConrad Meyer 912e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->tail + 0); 913e974f91cSConrad Meyer dump_descriptor(desc->u.raw); 914e974f91cSConrad Meyer 915e974f91cSConrad Meyer desc = ioat_get_ring_entry(ioat, ioat->tail + 1); 916e974f91cSConrad Meyer dump_descriptor(desc->u.raw); 917e974f91cSConrad Meyer } 918e974f91cSConrad Meyer ioat_process_events(ioat); 919e974f91cSConrad Meyer } else { 920e974f91cSConrad Meyer mtx_lock(&ioat->submit_lock); 921e974f91cSConrad Meyer mtx_lock(&ioat->cleanup_lock); 922e974f91cSConrad Meyer 923e974f91cSConrad Meyer if (ioat_get_active(ioat) == 0 && 924e974f91cSConrad Meyer ioat->ring_size_order > IOAT_MIN_ORDER) 925e974f91cSConrad Meyer resize_ring(ioat, ioat->ring_size_order - 1); 926e974f91cSConrad Meyer 927e974f91cSConrad Meyer mtx_unlock(&ioat->cleanup_lock); 928e974f91cSConrad Meyer mtx_unlock(&ioat->submit_lock); 929e974f91cSConrad Meyer 930e974f91cSConrad Meyer if (ioat->ring_size_order > IOAT_MIN_ORDER) 931e974f91cSConrad Meyer callout_reset(&ioat->timer, 5 * hz, 932e974f91cSConrad Meyer ioat_timer_callback, ioat); 933e974f91cSConrad Meyer } 934e974f91cSConrad Meyer } 935e974f91cSConrad Meyer 936e974f91cSConrad Meyer /* 937e974f91cSConrad Meyer * Support Functions 938e974f91cSConrad Meyer */ 939e974f91cSConrad Meyer static void 940e974f91cSConrad Meyer ioat_submit_single(struct ioat_softc *ioat) 941e974f91cSConrad Meyer { 942e974f91cSConrad Meyer 943e974f91cSConrad Meyer atomic_add_rel_int(&ioat->head, 1); 944e974f91cSConrad Meyer 945e974f91cSConrad Meyer if (!ioat->is_completion_pending) { 946e974f91cSConrad Meyer ioat->is_completion_pending = TRUE; 947e974f91cSConrad Meyer callout_reset(&ioat->timer, 10 * hz, ioat_timer_callback, 948e974f91cSConrad Meyer ioat); 949e974f91cSConrad Meyer } 950e974f91cSConrad Meyer } 951e974f91cSConrad Meyer 952e974f91cSConrad Meyer static int 953e974f91cSConrad Meyer ioat_reset_hw(struct ioat_softc *ioat) 954e974f91cSConrad Meyer { 955e974f91cSConrad Meyer uint64_t status; 956e974f91cSConrad Meyer uint32_t chanerr; 9570d1a05d9SConrad Meyer int timeout; 958e974f91cSConrad Meyer 959e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 960e974f91cSConrad Meyer if (is_ioat_active(status) || is_ioat_idle(status)) 961e974f91cSConrad Meyer ioat_suspend(ioat); 962e974f91cSConrad Meyer 963e974f91cSConrad Meyer /* Wait at most 20 ms */ 964e974f91cSConrad Meyer for (timeout = 0; (is_ioat_active(status) || is_ioat_idle(status)) && 965e974f91cSConrad Meyer timeout < 20; timeout++) { 966e974f91cSConrad Meyer DELAY(1000); 967e974f91cSConrad Meyer status = ioat_get_chansts(ioat); 968e974f91cSConrad Meyer } 969e974f91cSConrad Meyer if (timeout == 20) 970e974f91cSConrad Meyer return (ETIMEDOUT); 971e974f91cSConrad Meyer 972e974f91cSConrad Meyer chanerr = ioat_read_4(ioat, IOAT_CHANERR_OFFSET); 973e974f91cSConrad Meyer ioat_write_4(ioat, IOAT_CHANERR_OFFSET, chanerr); 974e974f91cSConrad Meyer 975e974f91cSConrad Meyer /* 976e974f91cSConrad Meyer * IOAT v3 workaround - CHANERRMSK_INT with 3E07h to masks out errors 977e974f91cSConrad Meyer * that can cause stability issues for IOAT v3. 978e974f91cSConrad Meyer */ 979e974f91cSConrad Meyer pci_write_config(ioat->device, IOAT_CFG_CHANERRMASK_INT_OFFSET, 0x3e07, 980e974f91cSConrad Meyer 4); 981e974f91cSConrad Meyer chanerr = pci_read_config(ioat->device, IOAT_CFG_CHANERR_INT_OFFSET, 4); 982e974f91cSConrad Meyer pci_write_config(ioat->device, IOAT_CFG_CHANERR_INT_OFFSET, chanerr, 4); 983e974f91cSConrad Meyer 9840d1a05d9SConrad Meyer /* 9850d1a05d9SConrad Meyer * BDXDE and BWD models reset MSI-X registers on device reset. 9860d1a05d9SConrad Meyer * Save/restore their contents manually. 9870d1a05d9SConrad Meyer */ 9880d1a05d9SConrad Meyer if (ioat_model_resets_msix(ioat)) 9890d1a05d9SConrad Meyer pci_save_state(ioat->device); 9900d1a05d9SConrad Meyer 991e974f91cSConrad Meyer ioat_reset(ioat); 992e974f91cSConrad Meyer 993e974f91cSConrad Meyer /* Wait at most 20 ms */ 994e974f91cSConrad Meyer for (timeout = 0; ioat_reset_pending(ioat) && timeout < 20; timeout++) 995e974f91cSConrad Meyer DELAY(1000); 996e974f91cSConrad Meyer if (timeout == 20) 997e974f91cSConrad Meyer return (ETIMEDOUT); 998e974f91cSConrad Meyer 9990d1a05d9SConrad Meyer if (ioat_model_resets_msix(ioat)) 10000d1a05d9SConrad Meyer pci_restore_state(ioat->device); 10014253ea50SConrad Meyer 1002e974f91cSConrad Meyer return (0); 1003e974f91cSConrad Meyer } 1004e974f91cSConrad Meyer 1005e974f91cSConrad Meyer static void 1006e974f91cSConrad Meyer dump_descriptor(void *hw_desc) 1007e974f91cSConrad Meyer { 1008e974f91cSConrad Meyer int i, j; 1009e974f91cSConrad Meyer 1010e974f91cSConrad Meyer for (i = 0; i < 2; i++) { 1011e974f91cSConrad Meyer for (j = 0; j < 8; j++) 1012e974f91cSConrad Meyer printf("%08x ", ((uint32_t *)hw_desc)[i * 8 + j]); 1013e974f91cSConrad Meyer printf("\n"); 1014e974f91cSConrad Meyer } 1015e974f91cSConrad Meyer } 1016e974f91cSConrad Meyer 1017e974f91cSConrad Meyer static void 1018e974f91cSConrad Meyer ioat_setup_sysctl(device_t device) 1019e974f91cSConrad Meyer { 1020e974f91cSConrad Meyer struct sysctl_ctx_list *sysctl_ctx; 1021e974f91cSConrad Meyer struct sysctl_oid *sysctl_tree; 1022e974f91cSConrad Meyer struct ioat_softc *ioat; 1023e974f91cSConrad Meyer 1024e974f91cSConrad Meyer ioat = DEVICE2SOFTC(device); 1025e974f91cSConrad Meyer sysctl_ctx = device_get_sysctl_ctx(device); 1026e974f91cSConrad Meyer sysctl_tree = device_get_sysctl_tree(device); 1027e974f91cSConrad Meyer 1028e974f91cSConrad Meyer SYSCTL_ADD_UINT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree), OID_AUTO, 1029e974f91cSConrad Meyer "ring_size_order", CTLFLAG_RD, &ioat->ring_size_order, 1030e974f91cSConrad Meyer 0, "HW descriptor ring size order"); 1031e974f91cSConrad Meyer SYSCTL_ADD_UINT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree), OID_AUTO, 1032e974f91cSConrad Meyer "head", CTLFLAG_RD, &ioat->head, 1033e974f91cSConrad Meyer 0, "HW descriptor head pointer index"); 1034e974f91cSConrad Meyer SYSCTL_ADD_UINT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree), OID_AUTO, 1035e974f91cSConrad Meyer "tail", CTLFLAG_RD, &ioat->tail, 1036e974f91cSConrad Meyer 0, "HW descriptor tail pointer index"); 1037e974f91cSConrad Meyer } 1038e974f91cSConrad Meyer 1039e974f91cSConrad Meyer void 1040e974f91cSConrad Meyer ioat_log_message(int verbosity, char *fmt, ...) 1041e974f91cSConrad Meyer { 1042e974f91cSConrad Meyer va_list argp; 1043e974f91cSConrad Meyer char buffer[512]; 1044e974f91cSConrad Meyer struct timeval tv; 1045e974f91cSConrad Meyer 1046e974f91cSConrad Meyer if (verbosity > g_ioat_debug_level) 1047e974f91cSConrad Meyer return; 1048e974f91cSConrad Meyer 1049e974f91cSConrad Meyer va_start(argp, fmt); 1050e974f91cSConrad Meyer vsnprintf(buffer, sizeof(buffer) - 1, fmt, argp); 1051e974f91cSConrad Meyer va_end(argp); 1052e974f91cSConrad Meyer microuptime(&tv); 1053e974f91cSConrad Meyer 1054e974f91cSConrad Meyer printf("[%d:%06d] ioat: %s", (int)tv.tv_sec, (int)tv.tv_usec, buffer); 1055e974f91cSConrad Meyer } 1056