/*-
 * Copyright (c) 2016-2017 Alexander Motin <mav@FreeBSD.org>
 * Copyright (C) 2013 Intel Corporation
 * Copyright (C) 2015 EMC Corporation
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

/*
 * The Non-Transparent Bridge (NTB) is a device that allows you to connect
 * two or more systems using PCI-e links, providing remote memory access.
 *
 * This module contains a driver for NTB hardware in Intel Xeon/Atom CPUs.
 *
 * NOTE: Much of the code in this module is shared with Linux. Any patches may
 * be picked up and redistributed in Linux with a dual GPL/BSD license.
 */

#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

#include <sys/param.h>
#include <sys/kernel.h>
#include <sys/systm.h>
#include <sys/bus.h>
#include <sys/endian.h>
#include <sys/interrupt.h>
#include <sys/malloc.h>
#include <sys/module.h>
#include <sys/mutex.h>
#include <sys/pciio.h>
#include <sys/queue.h>
#include <sys/rman.h>
#include <sys/sbuf.h>
#include <sys/sysctl.h>
#include <vm/vm.h>
#include <vm/pmap.h>
#include <machine/bus.h>
#include <machine/intr_machdep.h>
#include <machine/resource.h>
#include <dev/pci/pcireg.h>
#include <dev/pci/pcivar.h>

#include "ntb_hw_intel.h"
#include "../ntb.h"

/* Size of ntb_softc.int_info[]: the larger of the two doorbell counts. */
#define MAX_MSIX_INTERRUPTS MAX(XEON_DB_COUNT, ATOM_DB_COUNT)

#define NTB_HB_TIMEOUT		1 /* second */
#define ATOM_LINK_RECOVERY_TIME	500 /* ms */
#define BAR_HIGH_MASK		(~((1ull << 12) - 1))

#define	NTB_MSIX_VER_GUARD	0xaabbccdd
#define	NTB_MSIX_RECEIVED	0xe0f0e0f0

/*
 * PCI constants could be somewhere more generic, but aren't defined/used in
 * pci.c.
 */
#define	PCI_MSIX_ENTRY_SIZE		16
#define	PCI_MSIX_ENTRY_LOWER_ADDR	0
#define	PCI_MSIX_ENTRY_UPPER_ADDR	4
#define	PCI_MSIX_ENTRY_DATA		8

/* Hardware family; selects the Xeon or Atom detect/init paths in attach. */
enum ntb_device_type {
	NTB_XEON,
	NTB_ATOM
};

/* ntb_conn_type are hardware numbers, cannot change. */
enum ntb_conn_type {
	NTB_CONN_TRANSPARENT = 0,
	NTB_CONN_B2B = 1,
	NTB_CONN_RP = 2,
};

/*
 * Side of a B2B link this device is on: upstream (USD) or downstream (DSD),
 * matching the usd_ and dsd_ sysctl override tables below.
 */
enum ntb_b2b_direction {
	NTB_DEV_USD = 0,
	NTB_DEV_DSD = 1,
};

/*
 * Driver-internal BAR indices, used to index ntb_softc.bar_info[].
 * intel_ntb_map_pci_bars() binds them to PCI BARs 0, 2, 4 and 5 respectively.
 */
enum ntb_bar {
	NTB_CONFIG_BAR = 0,
	NTB_B2B_BAR_1,
	NTB_B2B_BAR_2,
	NTB_B2B_BAR_3,
	NTB_MAX_BARS
};

/*
 * Slot indices for the MSI-X data exchange.
 * NOTE(review): presumably scratchpad register indices consumed by
 * intel_ntb_exchange_msix(), which is outside this part of the file; confirm.
 */
enum {
	NTB_MSIX_GUARD = 0,
	NTB_MSIX_DATA0,
	NTB_MSIX_DATA1,
	NTB_MSIX_DATA2,
	NTB_MSIX_OFS0,
	NTB_MSIX_OFS1,
	NTB_MSIX_OFS2,
	NTB_MSIX_DONE,
	NTB_MAX_MSIX_SPAD
};

/* Device features and workarounds */
#define HAS_FEATURE(ntb, feature)	\
	(((ntb)->features & (feature)) != 0)

/* One entry of the pci_ids[] table of supported devices. */
struct ntb_hw_info {
	uint32_t		device_id;	/* compared with pci_get_devid() */
	const char		*desc;		/* passed to device_set_desc() */
	enum ntb_device_type	type;
	uint32_t		features;	/* NTB_* feature/errata bits */
};

/* Per-BAR state: the allocated bus resource plus cached mapping parameters. */
struct ntb_pci_bar_info {
	bus_space_tag_t		pci_bus_tag;
	bus_space_handle_t	pci_bus_handle;
	int			pci_resource_id;	/* PCIR_BAR(n) rid */
	struct resource		*pci_resource;
	vm_paddr_t		pbase;
	caddr_t			vbase;
	vm_size_t		size;
	vm_memattr_t		map_mode;	/* current cache attribute */

	/* Configuration register offsets */
	uint32_t		psz_off;
	uint32_t		ssz_off;
	uint32_t		pbarxlat_off;
};

/* One allocated interrupt: IRQ resource, its rid and the handler cookie. */
struct ntb_int_info {
	struct resource	*res;
	int		rid;
	void		*tag;
};

/* Argument handed to ndev_vec_isr() for each MSI-X vector. */
struct ntb_vec {
	struct ntb_softc	*ntb;
	uint32_t		num;
	unsigned		masked;
};

/* Per-family register offsets and the memory-window to BAR mapping. */
struct ntb_reg {
	uint32_t	ntb_ctl;
	uint32_t	lnk_sta;
	uint8_t		db_size;	/* doorbell register width in bytes */
	unsigned	mw_bar[NTB_MAX_BARS];
};

/* Doorbell, doorbell-mask and scratchpad register offsets for one side. */
struct ntb_alt_reg {
	uint32_t	db_bell;
	uint32_t	db_mask;
	uint32_t	spad;
};

/* Offsets of the BAR base / translation / limit registers. */
struct ntb_xlat_reg {
	uint32_t	bar0_base;
	uint32_t	bar2_base;
	uint32_t	bar4_base;
	uint32_t	bar5_base;

	uint32_t	bar2_xlat;
	uint32_t	bar4_xlat;
	uint32_t	bar5_xlat;

	uint32_t	bar2_limit;
	uint32_t	bar4_limit;
	uint32_t	bar5_limit;
};

/*
 * Addresses used on the bus between two B2B-connected NTBs. The *_addr32
 * members are the split-BAR variants (see the xeon_b2b sysctl descriptions).
 */
struct ntb_b2b_addr {
	uint64_t	bar0_addr;
	uint64_t	bar2_addr64;
	uint64_t	bar4_addr64;
	uint64_t	bar4_addr32;
	uint64_t	bar5_addr32;
};

/* An MSI-X message as an (offset, data) pair. */
struct ntb_msix_data {
	uint32_t	nmd_ofs;
	uint32_t	nmd_data;
};

/* Per-device driver state, obtained with device_get_softc(). */
struct ntb_softc {
	/* ntb.c context. Do not move! Must go first! */
	void			*ntb_store;

	device_t		device;
	enum ntb_device_type	type;
	uint32_t		features;

	struct ntb_pci_bar_info	bar_info[NTB_MAX_BARS];
	struct ntb_int_info	int_info[MAX_MSIX_INTERRUPTS];
	uint32_t		allocated_interrupts;

	struct ntb_msix_data	peer_msix_data[XEON_NONLINK_DB_MSIX_BITS];
	struct ntb_msix_data	msix_data[XEON_NONLINK_DB_MSIX_BITS];
	bool			peer_msix_good;
	bool			peer_msix_done;
	struct ntb_pci_bar_info	*peer_lapic_bar;
	struct callout		peer_msix_work;

	struct callout		heartbeat_timer;
	struct callout		lr_timer;

	struct ntb_vec		*msix_vec;

	uint32_t		ppd;
	enum ntb_conn_type	conn_type;
	enum ntb_b2b_direction	dev_type;

	/* Offset of peer bar0 in B2B BAR */
	uint64_t		b2b_off;
	/* Memory window used to access peer bar0 */
#define B2B_MW_DISABLED		UINT8_MAX
	uint8_t			b2b_mw_idx;
	uint32_t		msix_xlat;
	uint8_t			msix_mw_idx;

	uint8_t			mw_count;
	uint8_t			spad_count;
	uint8_t			db_count;
	uint8_t			db_vec_count;
	uint8_t			db_vec_shift;

	/* Protects local db_mask. */
#define DB_MASK_LOCK(sc)	mtx_lock_spin(&(sc)->db_mask_lock)
#define DB_MASK_UNLOCK(sc)	mtx_unlock_spin(&(sc)->db_mask_lock)
#define DB_MASK_ASSERT(sc,f)	mtx_assert(&(sc)->db_mask_lock, (f))
	struct mtx		db_mask_lock;

	volatile uint32_t	ntb_ctl;
	volatile uint32_t	lnk_sta;

	uint64_t		db_valid_mask;
	uint64_t		db_link_mask;
	uint64_t		db_mask;
	uint64_t		fake_db;	/* NTB_SB01BASE_LOCKUP*/
	uint64_t		force_db;	/* NTB_SB01BASE_LOCKUP*/

	int			last_ts;	/* ticks @ last irq */

	const struct ntb_reg		*reg;
	const struct ntb_alt_reg	*self_reg;
	const struct ntb_alt_reg	*peer_reg;
	const struct ntb_xlat_reg	*xlat_reg;
};

/*
 * On i386 the 8-byte bus_space accessors are provided here, built from two
 * 4-byte accesses: the low dword at `offset', the high dword at `offset + 4'.
 * The two halves are separate accesses, so the 64-bit value is not
 * transferred in a single bus operation.
 */
#ifdef __i386__
static __inline uint64_t
bus_space_read_8(bus_space_tag_t tag, bus_space_handle_t handle,
    bus_size_t offset)
{

	return (bus_space_read_4(tag, handle, offset) |
	    ((uint64_t)bus_space_read_4(tag, handle, offset + 4)) << 32);
}

static __inline void
bus_space_write_8(bus_space_tag_t tag, bus_space_handle_t handle,
    bus_size_t offset, uint64_t val)
{

	bus_space_write_4(tag, handle, offset, val);
	bus_space_write_4(tag, handle, offset + 4, val >> 32);
}
#endif

/*
 * Register access helpers. SIZE is the access width in bytes and is pasted
 * onto bus_space_read_/bus_space_write_. All of these expand to code that
 * references a variable named `ntb' (struct ntb_softc *), which must be in
 * scope at the call site.
 *
 *   intel_ntb_bar_*: access an arbitrary BAR by enum ntb_bar index.
 *   intel_ntb_reg_*: access the configuration BAR (NTB_CONFIG_BAR).
 *   intel_ntb_mw_*:  access the BAR backing memory window ntb->b2b_mw_idx.
 */
#define intel_ntb_bar_read(SIZE, bar, offset) \
	    bus_space_read_ ## SIZE (ntb->bar_info[(bar)].pci_bus_tag, \
	    ntb->bar_info[(bar)].pci_bus_handle, (offset))
#define intel_ntb_bar_write(SIZE, bar, offset, val) \
	    bus_space_write_ ## SIZE (ntb->bar_info[(bar)].pci_bus_tag, \
	    ntb->bar_info[(bar)].pci_bus_handle, (offset), (val))
#define intel_ntb_reg_read(SIZE, offset) \
	    intel_ntb_bar_read(SIZE, NTB_CONFIG_BAR, offset)
#define intel_ntb_reg_write(SIZE, offset, val) \
	    intel_ntb_bar_write(SIZE, NTB_CONFIG_BAR, offset, val)
#define intel_ntb_mw_read(SIZE, offset) \
	    intel_ntb_bar_read(SIZE, intel_ntb_mw_to_bar(ntb, ntb->b2b_mw_idx), \
		offset)
#define intel_ntb_mw_write(SIZE, offset, val) \
	    intel_ntb_bar_write(SIZE, intel_ntb_mw_to_bar(ntb, ntb->b2b_mw_idx), \
		offset, val)

/* Forward declarations for the driver entry points and internal helpers. */
static int intel_ntb_probe(device_t device);
static int intel_ntb_attach(device_t device);
static int intel_ntb_detach(device_t device);
static uint64_t intel_ntb_db_valid_mask(device_t dev);
static void intel_ntb_spad_clear(device_t dev);
static uint64_t intel_ntb_db_vector_mask(device_t dev, uint32_t vector);
static bool intel_ntb_link_is_up(device_t dev, enum ntb_speed *speed,
    enum ntb_width *width);
static int intel_ntb_link_enable(device_t dev, enum ntb_speed speed,
    enum ntb_width width);
static int intel_ntb_link_disable(device_t dev);
static int intel_ntb_spad_read(device_t dev, unsigned int idx, uint32_t *val);
static int intel_ntb_peer_spad_write(device_t dev, unsigned int idx, uint32_t val);

static unsigned intel_ntb_user_mw_to_idx(struct ntb_softc *, unsigned uidx);
static inline enum ntb_bar intel_ntb_mw_to_bar(struct ntb_softc *, unsigned mw);
static inline bool bar_is_64bit(struct ntb_softc *, enum ntb_bar);
static inline void bar_get_xlat_params(struct ntb_softc *, enum ntb_bar,
    uint32_t *base, uint32_t *xlat, uint32_t *lmt);
static int intel_ntb_map_pci_bars(struct ntb_softc *ntb);
static int intel_ntb_mw_set_wc_internal(struct ntb_softc *, unsigned idx,
    vm_memattr_t);
static void print_map_success(struct ntb_softc *, struct ntb_pci_bar_info *,
    const char *);
static int map_mmr_bar(struct ntb_softc *ntb, struct ntb_pci_bar_info *bar);
static int map_memory_window_bar(struct ntb_softc *ntb,
    struct ntb_pci_bar_info *bar);
static void intel_ntb_unmap_pci_bar(struct ntb_softc *ntb);
static int intel_ntb_remap_msix(device_t, uint32_t desired, uint32_t avail);
static int intel_ntb_init_isr(struct ntb_softc *ntb);
static int intel_ntb_setup_legacy_interrupt(struct ntb_softc *ntb);
static int intel_ntb_setup_msix(struct ntb_softc *ntb, uint32_t num_vectors);
static void intel_ntb_teardown_interrupts(struct ntb_softc *ntb);
static inline uint64_t intel_ntb_vec_mask(struct ntb_softc *, uint64_t db_vector);
static void intel_ntb_interrupt(struct ntb_softc *, uint32_t vec);
static void ndev_vec_isr(void *arg);
static void ndev_irq_isr(void *arg);
static inline uint64_t db_ioread(struct ntb_softc *, uint64_t regoff);
static inline void db_iowrite(struct ntb_softc *, uint64_t regoff, uint64_t);
static inline void db_iowrite_raw(struct ntb_softc *, uint64_t regoff, uint64_t);
static int intel_ntb_create_msix_vec(struct ntb_softc *ntb, uint32_t num_vectors);
static void intel_ntb_free_msix_vec(struct ntb_softc *ntb);
static void intel_ntb_get_msix_info(struct ntb_softc *ntb);
static void intel_ntb_exchange_msix(void *);
static struct ntb_hw_info *intel_ntb_get_device_info(uint32_t device_id);
static void intel_ntb_detect_max_mw(struct ntb_softc *ntb);
static int intel_ntb_detect_xeon(struct ntb_softc *ntb);
static int intel_ntb_detect_atom(struct ntb_softc *ntb);
static int intel_ntb_xeon_init_dev(struct ntb_softc *ntb);
static int intel_ntb_atom_init_dev(struct ntb_softc *ntb);
static void intel_ntb_teardown_xeon(struct ntb_softc *ntb);
static void configure_atom_secondary_side_bars(struct ntb_softc *ntb);
static void xeon_reset_sbar_size(struct ntb_softc *, enum ntb_bar idx,
    enum ntb_bar regbar);
static void xeon_set_sbar_base_and_limit(struct ntb_softc *,
    uint64_t base_addr, enum ntb_bar idx, enum ntb_bar regbar);
static void xeon_set_pbar_xlat(struct ntb_softc *, uint64_t base_addr,
    enum ntb_bar idx);
static int xeon_setup_b2b_mw(struct ntb_softc *,
    const struct ntb_b2b_addr *addr, const struct ntb_b2b_addr *peer_addr);
static inline bool link_is_up(struct ntb_softc *ntb);
static inline bool _xeon_link_is_up(struct ntb_softc *ntb);
static inline bool atom_link_is_err(struct ntb_softc *ntb);
static inline enum ntb_speed intel_ntb_link_sta_speed(struct ntb_softc *);
static inline enum ntb_width intel_ntb_link_sta_width(struct ntb_softc *);
static void atom_link_hb(void *arg);
static void recover_atom_link(void *arg);
static bool intel_ntb_poll_link(struct ntb_softc *ntb);
static void save_bar_parameters(struct ntb_pci_bar_info *bar);
static void intel_ntb_sysctl_init(struct ntb_softc *);
static int sysctl_handle_features(SYSCTL_HANDLER_ARGS);
static int sysctl_handle_link_admin(SYSCTL_HANDLER_ARGS);
static int sysctl_handle_link_status_human(SYSCTL_HANDLER_ARGS);
static int sysctl_handle_link_status(SYSCTL_HANDLER_ARGS);
static int sysctl_handle_register(SYSCTL_HANDLER_ARGS);

/*
 * Log verbosity knob. intel_ntb_printf() prints only when its level is at or
 * below this value, and needs a variable named `ntb' in scope.
 */
static unsigned g_ntb_hw_debug_level;
SYSCTL_UINT(_hw_ntb, OID_AUTO, debug_level, CTLFLAG_RWTUN,
    &g_ntb_hw_debug_level, 0, "ntb_hw log level -- higher is more verbose");
#define intel_ntb_printf(lvl, ...) do {				\
	if ((lvl) <= g_ntb_hw_debug_level) {			\
		device_printf(ntb->device, __VA_ARGS__);	\
	}							\
} while (0)

/* Values accepted by the default_mw_pat tunable; see intel_ntb_pat_flags(). */
#define	_NTB_PAT_UC	0
#define	_NTB_PAT_WC	1
#define	_NTB_PAT_WT	4
#define	_NTB_PAT_WP	5
#define	_NTB_PAT_WB	6
#define	_NTB_PAT_UCM	7
static unsigned g_ntb_mw_pat = _NTB_PAT_UC;
SYSCTL_UINT(_hw_ntb, OID_AUTO, default_mw_pat, CTLFLAG_RDTUN,
    &g_ntb_mw_pat, 0, "Configure the default memory window cache flags (PAT): "
    "UC: "  __XSTRING(_NTB_PAT_UC) ", "
    "WC: "  __XSTRING(_NTB_PAT_WC) ", "
    "WT: "  __XSTRING(_NTB_PAT_WT) ", "
    "WP: "  __XSTRING(_NTB_PAT_WP) ", "
    "WB: "  __XSTRING(_NTB_PAT_WB) ", "
    "UC-: " __XSTRING(_NTB_PAT_UCM));

/*
 * Translate the default_mw_pat tunable into a vm_memattr_t. Unrecognized
 * values fall back to VM_MEMATTR_UNCACHEABLE, the same as _NTB_PAT_UC.
 */
static inline vm_memattr_t
intel_ntb_pat_flags(void)
{

	switch (g_ntb_mw_pat) {
	case _NTB_PAT_WC:
		return (VM_MEMATTR_WRITE_COMBINING);
	case _NTB_PAT_WT:
		return (VM_MEMATTR_WRITE_THROUGH);
	case _NTB_PAT_WP:
		return (VM_MEMATTR_WRITE_PROTECTED);
	case _NTB_PAT_WB:
		return (VM_MEMATTR_WRITE_BACK);
	case _NTB_PAT_UCM:
		return (VM_MEMATTR_WEAK_UNCACHEABLE);
	case _NTB_PAT_UC:
		/* FALLTHROUGH */
	default:
		return (VM_MEMATTR_UNCACHEABLE);
	}
}

/*
 * Well, this obviously doesn't belong here, but it doesn't seem to exist
 * anywhere better yet.
 *
 * Returns a static, human-readable name for a memory attribute, or "UNKNOWN"
 * for values not listed; used in the BAR mapping log messages.
 */
static inline const char *
intel_ntb_vm_memattr_to_str(vm_memattr_t pat)
{

	switch (pat) {
	case VM_MEMATTR_WRITE_COMBINING:
		return ("WRITE_COMBINING");
	case VM_MEMATTR_WRITE_THROUGH:
		return ("WRITE_THROUGH");
	case VM_MEMATTR_WRITE_PROTECTED:
		return ("WRITE_PROTECTED");
	case VM_MEMATTR_WRITE_BACK:
		return ("WRITE_BACK");
	case VM_MEMATTR_WEAK_UNCACHEABLE:
		return ("UNCACHED");
	case VM_MEMATTR_UNCACHEABLE:
		return ("UNCACHEABLE");
	default:
		return ("UNKNOWN");
	}
}

/* Boot-time tunable: memory window used for the peer MSI-X workaround. */
static int g_ntb_msix_idx = 1;
SYSCTL_INT(_hw_ntb, OID_AUTO, msix_mw_idx, CTLFLAG_RDTUN, &g_ntb_msix_idx,
    0, "Use this memory window to access the peer MSIX message complex on "
    "certain Xeon-based NTB systems, as a workaround for a hardware errata. "
    "Like b2b_mw_idx, negative values index from the last available memory "
    "window. (Applies on Xeon platforms with SB01BASE_LOCKUP errata.)");

/* Boot-time tunable: memory window used to reach the peer NTB registers. */
static int g_ntb_mw_idx = -1;
SYSCTL_INT(_hw_ntb, OID_AUTO, b2b_mw_idx, CTLFLAG_RDTUN, &g_ntb_mw_idx,
    0, "Use this memory window to access the peer NTB registers. A "
    "non-negative value starts from the first MW index; a negative value "
    "starts from the last MW index. The default is -1, i.e., the last "
    "available memory window. Both sides of the NTB MUST set the same "
    "value here! (Applies on Xeon platforms with SDOORBELL_LOCKUP errata.)");

/* Hardware owns the low 16 bits of features. */
#define NTB_BAR_SIZE_4K		(1 << 0)
#define NTB_SDOORBELL_LOCKUP	(1 << 1)
#define NTB_SB01BASE_LOCKUP	(1 << 2)
#define NTB_B2BDOORBELL_BIT14	(1 << 3)
/* Software/configuration owns the top 16 bits. */
#define NTB_SPLIT_BAR		(1ull << 16)

/* Bit-name string for the feature bits above (bit numbers are octal). */
#define NTB_FEATURES_STR \
    "\20\21SPLIT_BAR4\04B2B_DOORBELL_BIT14\03SB01BASE_LOCKUP" \
    "\02SDOORBELL_LOCKUP\01BAR_SIZE_4K"

/* Supported devices, looked up by intel_ntb_get_device_info(). */
static struct ntb_hw_info pci_ids[] = {
	/* XXX: PS/SS IDs left out until they are supported. */
	{ 0x0C4E8086, "BWD Atom Processor S1200 Non-Transparent Bridge B2B",
		NTB_ATOM, 0 },

	{ 0x37258086, "JSF Xeon C35xx/C55xx Non-Transparent Bridge B2B",
		NTB_XEON, NTB_SDOORBELL_LOCKUP | NTB_B2BDOORBELL_BIT14 },
	{ 0x3C0D8086, "SNB Xeon E5/Core i7 Non-Transparent Bridge B2B",
		NTB_XEON, NTB_SDOORBELL_LOCKUP | NTB_B2BDOORBELL_BIT14 },
	{ 0x0E0D8086, "IVT Xeon E5 V2 Non-Transparent Bridge B2B", NTB_XEON,
		NTB_SDOORBELL_LOCKUP | NTB_B2BDOORBELL_BIT14 |
		    NTB_SB01BASE_LOCKUP | NTB_BAR_SIZE_4K },
	{ 0x2F0D8086, "HSX Xeon E5 V3 Non-Transparent Bridge B2B", NTB_XEON,
		NTB_SDOORBELL_LOCKUP | NTB_B2BDOORBELL_BIT14 |
		    NTB_SB01BASE_LOCKUP },
	{ 0x6F0D8086, "BDX Xeon E5 V4 Non-Transparent Bridge B2B", NTB_XEON,
		NTB_SDOORBELL_LOCKUP | NTB_B2BDOORBELL_BIT14 |
		    NTB_SB01BASE_LOCKUP },
};

/* Atom register layout: 8-byte doorbells and two memory-window BARs. */
static const struct ntb_reg atom_reg = {
	.ntb_ctl = ATOM_NTBCNTL_OFFSET,
	.lnk_sta = ATOM_LINK_STATUS_OFFSET,
	.db_size = sizeof(uint64_t),
	.mw_bar = { NTB_B2B_BAR_1, NTB_B2B_BAR_2 },
};

static const struct ntb_alt_reg atom_pri_reg = {
	.db_bell = ATOM_PDOORBELL_OFFSET,
	.db_mask = ATOM_PDBMSK_OFFSET,
	.spad = ATOM_SPAD_OFFSET,
};

/* No .db_mask here, so that member is zero-initialized. */
static const struct ntb_alt_reg atom_b2b_reg = {
	.db_bell = ATOM_B2B_DOORBELL_OFFSET,
	.spad = ATOM_B2B_SPAD_OFFSET,
};

static const struct ntb_xlat_reg atom_sec_xlat = {
#if 0
	/* "FIXME" says the Linux driver. */
	.bar0_base = ATOM_SBAR0BASE_OFFSET,
	.bar2_base = ATOM_SBAR2BASE_OFFSET,
	.bar4_base = ATOM_SBAR4BASE_OFFSET,

	.bar2_limit = ATOM_SBAR2LMT_OFFSET,
	.bar4_limit = ATOM_SBAR4LMT_OFFSET,
#endif

	.bar2_xlat = ATOM_SBAR2XLAT_OFFSET,
	.bar4_xlat = ATOM_SBAR4XLAT_OFFSET,
};

/* Xeon register layout: 2-byte doorbells and up to three memory-window BARs. */
static const struct ntb_reg xeon_reg = {
	.ntb_ctl = XEON_NTBCNTL_OFFSET,
	.lnk_sta = XEON_LINK_STATUS_OFFSET,
	.db_size = sizeof(uint16_t),
	.mw_bar = { NTB_B2B_BAR_1, NTB_B2B_BAR_2, NTB_B2B_BAR_3 },
};

static const struct ntb_alt_reg xeon_pri_reg = {
	.db_bell = XEON_PDOORBELL_OFFSET,
	.db_mask = XEON_PDBMSK_OFFSET,
	.spad = XEON_SPAD_OFFSET,
};

/* No .db_mask here, so that member is zero-initialized. */
static const struct ntb_alt_reg xeon_b2b_reg = {
	.db_bell = XEON_B2B_DOORBELL_OFFSET,
	.spad = XEON_B2B_SPAD_OFFSET,
};

static const struct ntb_xlat_reg xeon_sec_xlat = {
	.bar0_base = XEON_SBAR0BASE_OFFSET,
	.bar2_base = XEON_SBAR2BASE_OFFSET,
	.bar4_base = XEON_SBAR4BASE_OFFSET,
	.bar5_base = XEON_SBAR5BASE_OFFSET,

	.bar2_limit = XEON_SBAR2LMT_OFFSET,
	.bar4_limit = XEON_SBAR4LMT_OFFSET,
	.bar5_limit = XEON_SBAR5LMT_OFFSET,

	.bar2_xlat = XEON_SBAR2XLAT_OFFSET,
	.bar4_xlat = XEON_SBAR4XLAT_OFFSET,
	.bar5_xlat = XEON_SBAR5XLAT_OFFSET,
};

/*
 * Default B2B bus addresses for the upstream (usd) and downstream (dsd)
 * sides. Both tables start out identical; they are not const because the
 * hw.ntb.xeon_b2b tunables point into them.
 */
static struct ntb_b2b_addr xeon_b2b_usd_addr = {
	.bar0_addr = XEON_B2B_BAR0_ADDR,
	.bar2_addr64 = XEON_B2B_BAR2_ADDR64,
	.bar4_addr64 = XEON_B2B_BAR4_ADDR64,
	.bar4_addr32 = XEON_B2B_BAR4_ADDR32,
	.bar5_addr32 = XEON_B2B_BAR5_ADDR32,
};

static struct ntb_b2b_addr xeon_b2b_dsd_addr = {
	.bar0_addr = XEON_B2B_BAR0_ADDR,
	.bar2_addr64 = XEON_B2B_BAR2_ADDR64,
	.bar4_addr64 = XEON_B2B_BAR4_ADDR64,
	.bar4_addr32 = XEON_B2B_BAR4_ADDR32,
	.bar5_addr32 = XEON_B2B_BAR5_ADDR32,
};

SYSCTL_NODE(_hw_ntb, OID_AUTO, xeon_b2b, CTLFLAG_RW, 0,
    "B2B MW segment overrides -- MUST be the same on both sides");

SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, usd_bar2_addr64, CTLFLAG_RDTUN, 586 &xeon_b2b_usd_addr.bar2_addr64, 0, "If using B2B topology on Xeon " 587 "hardware, use this 64-bit address on the bus between the NTB devices for " 588 "the window at BAR2, on the upstream side of the link. MUST be the same " 589 "address on both sides."); 590 SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, usd_bar4_addr64, CTLFLAG_RDTUN, 591 &xeon_b2b_usd_addr.bar4_addr64, 0, "See usd_bar2_addr64, but BAR4."); 592 SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, usd_bar4_addr32, CTLFLAG_RDTUN, 593 &xeon_b2b_usd_addr.bar4_addr32, 0, "See usd_bar2_addr64, but BAR4 " 594 "(split-BAR mode)."); 595 SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, usd_bar5_addr32, CTLFLAG_RDTUN, 596 &xeon_b2b_usd_addr.bar5_addr32, 0, "See usd_bar2_addr64, but BAR5 " 597 "(split-BAR mode)."); 598 599 SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, dsd_bar2_addr64, CTLFLAG_RDTUN, 600 &xeon_b2b_dsd_addr.bar2_addr64, 0, "If using B2B topology on Xeon " 601 "hardware, use this 64-bit address on the bus between the NTB devices for " 602 "the window at BAR2, on the downstream side of the link. 
MUST be the same" 603 " address on both sides."); 604 SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, dsd_bar4_addr64, CTLFLAG_RDTUN, 605 &xeon_b2b_dsd_addr.bar4_addr64, 0, "See dsd_bar2_addr64, but BAR4."); 606 SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, dsd_bar4_addr32, CTLFLAG_RDTUN, 607 &xeon_b2b_dsd_addr.bar4_addr32, 0, "See dsd_bar2_addr64, but BAR4 " 608 "(split-BAR mode)."); 609 SYSCTL_UQUAD(_hw_ntb_xeon_b2b, OID_AUTO, dsd_bar5_addr32, CTLFLAG_RDTUN, 610 &xeon_b2b_dsd_addr.bar5_addr32, 0, "See dsd_bar2_addr64, but BAR5 " 611 "(split-BAR mode)."); 612 613 /* 614 * OS <-> Driver interface structures 615 */ 616 MALLOC_DEFINE(M_NTB, "ntb_hw", "ntb_hw driver memory allocations"); 617 618 /* 619 * OS <-> Driver linkage functions 620 */ 621 static int 622 intel_ntb_probe(device_t device) 623 { 624 struct ntb_hw_info *p; 625 626 p = intel_ntb_get_device_info(pci_get_devid(device)); 627 if (p == NULL) 628 return (ENXIO); 629 630 device_set_desc(device, p->desc); 631 return (0); 632 } 633 634 static int 635 intel_ntb_attach(device_t device) 636 { 637 struct ntb_softc *ntb; 638 struct ntb_hw_info *p; 639 int error; 640 641 ntb = device_get_softc(device); 642 p = intel_ntb_get_device_info(pci_get_devid(device)); 643 644 ntb->device = device; 645 ntb->type = p->type; 646 ntb->features = p->features; 647 ntb->b2b_mw_idx = B2B_MW_DISABLED; 648 ntb->msix_mw_idx = B2B_MW_DISABLED; 649 650 /* Heartbeat timer for NTB_ATOM since there is no link interrupt */ 651 callout_init(&ntb->heartbeat_timer, 1); 652 callout_init(&ntb->lr_timer, 1); 653 callout_init(&ntb->peer_msix_work, 1); 654 mtx_init(&ntb->db_mask_lock, "ntb hw bits", NULL, MTX_SPIN); 655 656 if (ntb->type == NTB_ATOM) 657 error = intel_ntb_detect_atom(ntb); 658 else 659 error = intel_ntb_detect_xeon(ntb); 660 if (error != 0) 661 goto out; 662 663 intel_ntb_detect_max_mw(ntb); 664 665 pci_enable_busmaster(ntb->device); 666 667 error = intel_ntb_map_pci_bars(ntb); 668 if (error != 0) 669 goto out; 670 if (ntb->type == NTB_ATOM) 
671 error = intel_ntb_atom_init_dev(ntb); 672 else 673 error = intel_ntb_xeon_init_dev(ntb); 674 if (error != 0) 675 goto out; 676 677 intel_ntb_spad_clear(device); 678 679 intel_ntb_poll_link(ntb); 680 681 intel_ntb_sysctl_init(ntb); 682 683 /* Attach children to this controller */ 684 error = ntb_register_device(device); 685 686 out: 687 if (error != 0) 688 intel_ntb_detach(device); 689 return (error); 690 } 691 692 static int 693 intel_ntb_detach(device_t device) 694 { 695 struct ntb_softc *ntb; 696 697 ntb = device_get_softc(device); 698 699 /* Detach & delete all children */ 700 ntb_unregister_device(device); 701 702 if (ntb->self_reg != NULL) { 703 DB_MASK_LOCK(ntb); 704 db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_valid_mask); 705 DB_MASK_UNLOCK(ntb); 706 } 707 callout_drain(&ntb->heartbeat_timer); 708 callout_drain(&ntb->lr_timer); 709 callout_drain(&ntb->peer_msix_work); 710 pci_disable_busmaster(ntb->device); 711 if (ntb->type == NTB_XEON) 712 intel_ntb_teardown_xeon(ntb); 713 intel_ntb_teardown_interrupts(ntb); 714 715 mtx_destroy(&ntb->db_mask_lock); 716 717 intel_ntb_unmap_pci_bar(ntb); 718 719 return (0); 720 } 721 722 /* 723 * Driver internal routines 724 */ 725 static inline enum ntb_bar 726 intel_ntb_mw_to_bar(struct ntb_softc *ntb, unsigned mw) 727 { 728 729 KASSERT(mw < ntb->mw_count, 730 ("%s: mw:%u > count:%u", __func__, mw, (unsigned)ntb->mw_count)); 731 KASSERT(ntb->reg->mw_bar[mw] != 0, ("invalid mw")); 732 733 return (ntb->reg->mw_bar[mw]); 734 } 735 736 static inline bool 737 bar_is_64bit(struct ntb_softc *ntb, enum ntb_bar bar) 738 { 739 /* XXX This assertion could be stronger. 
*/ 740 KASSERT(bar < NTB_MAX_BARS, ("bogus bar")); 741 return (bar < NTB_B2B_BAR_2 || !HAS_FEATURE(ntb, NTB_SPLIT_BAR)); 742 } 743 744 static inline void 745 bar_get_xlat_params(struct ntb_softc *ntb, enum ntb_bar bar, uint32_t *base, 746 uint32_t *xlat, uint32_t *lmt) 747 { 748 uint32_t basev, lmtv, xlatv; 749 750 switch (bar) { 751 case NTB_B2B_BAR_1: 752 basev = ntb->xlat_reg->bar2_base; 753 lmtv = ntb->xlat_reg->bar2_limit; 754 xlatv = ntb->xlat_reg->bar2_xlat; 755 break; 756 case NTB_B2B_BAR_2: 757 basev = ntb->xlat_reg->bar4_base; 758 lmtv = ntb->xlat_reg->bar4_limit; 759 xlatv = ntb->xlat_reg->bar4_xlat; 760 break; 761 case NTB_B2B_BAR_3: 762 basev = ntb->xlat_reg->bar5_base; 763 lmtv = ntb->xlat_reg->bar5_limit; 764 xlatv = ntb->xlat_reg->bar5_xlat; 765 break; 766 default: 767 KASSERT(bar >= NTB_B2B_BAR_1 && bar < NTB_MAX_BARS, 768 ("bad bar")); 769 basev = lmtv = xlatv = 0; 770 break; 771 } 772 773 if (base != NULL) 774 *base = basev; 775 if (xlat != NULL) 776 *xlat = xlatv; 777 if (lmt != NULL) 778 *lmt = lmtv; 779 } 780 781 static int 782 intel_ntb_map_pci_bars(struct ntb_softc *ntb) 783 { 784 int rc; 785 786 ntb->bar_info[NTB_CONFIG_BAR].pci_resource_id = PCIR_BAR(0); 787 rc = map_mmr_bar(ntb, &ntb->bar_info[NTB_CONFIG_BAR]); 788 if (rc != 0) 789 goto out; 790 791 ntb->bar_info[NTB_B2B_BAR_1].pci_resource_id = PCIR_BAR(2); 792 rc = map_memory_window_bar(ntb, &ntb->bar_info[NTB_B2B_BAR_1]); 793 if (rc != 0) 794 goto out; 795 ntb->bar_info[NTB_B2B_BAR_1].psz_off = XEON_PBAR23SZ_OFFSET; 796 ntb->bar_info[NTB_B2B_BAR_1].ssz_off = XEON_SBAR23SZ_OFFSET; 797 ntb->bar_info[NTB_B2B_BAR_1].pbarxlat_off = XEON_PBAR2XLAT_OFFSET; 798 799 ntb->bar_info[NTB_B2B_BAR_2].pci_resource_id = PCIR_BAR(4); 800 rc = map_memory_window_bar(ntb, &ntb->bar_info[NTB_B2B_BAR_2]); 801 if (rc != 0) 802 goto out; 803 ntb->bar_info[NTB_B2B_BAR_2].psz_off = XEON_PBAR4SZ_OFFSET; 804 ntb->bar_info[NTB_B2B_BAR_2].ssz_off = XEON_SBAR4SZ_OFFSET; 805 ntb->bar_info[NTB_B2B_BAR_2].pbarxlat_off = 
XEON_PBAR4XLAT_OFFSET; 806 807 if (!HAS_FEATURE(ntb, NTB_SPLIT_BAR)) 808 goto out; 809 810 ntb->bar_info[NTB_B2B_BAR_3].pci_resource_id = PCIR_BAR(5); 811 rc = map_memory_window_bar(ntb, &ntb->bar_info[NTB_B2B_BAR_3]); 812 ntb->bar_info[NTB_B2B_BAR_3].psz_off = XEON_PBAR5SZ_OFFSET; 813 ntb->bar_info[NTB_B2B_BAR_3].ssz_off = XEON_SBAR5SZ_OFFSET; 814 ntb->bar_info[NTB_B2B_BAR_3].pbarxlat_off = XEON_PBAR5XLAT_OFFSET; 815 816 out: 817 if (rc != 0) 818 device_printf(ntb->device, 819 "unable to allocate pci resource\n"); 820 return (rc); 821 } 822 823 static void 824 print_map_success(struct ntb_softc *ntb, struct ntb_pci_bar_info *bar, 825 const char *kind) 826 { 827 828 device_printf(ntb->device, 829 "Mapped BAR%d v:[%p-%p] p:[%p-%p] (0x%jx bytes) (%s)\n", 830 PCI_RID2BAR(bar->pci_resource_id), bar->vbase, 831 (char *)bar->vbase + bar->size - 1, 832 (void *)bar->pbase, (void *)(bar->pbase + bar->size - 1), 833 (uintmax_t)bar->size, kind); 834 } 835 836 static int 837 map_mmr_bar(struct ntb_softc *ntb, struct ntb_pci_bar_info *bar) 838 { 839 840 bar->pci_resource = bus_alloc_resource_any(ntb->device, SYS_RES_MEMORY, 841 &bar->pci_resource_id, RF_ACTIVE); 842 if (bar->pci_resource == NULL) 843 return (ENXIO); 844 845 save_bar_parameters(bar); 846 bar->map_mode = VM_MEMATTR_UNCACHEABLE; 847 print_map_success(ntb, bar, "mmr"); 848 return (0); 849 } 850 851 static int 852 map_memory_window_bar(struct ntb_softc *ntb, struct ntb_pci_bar_info *bar) 853 { 854 int rc; 855 vm_memattr_t mapmode; 856 uint8_t bar_size_bits = 0; 857 858 bar->pci_resource = bus_alloc_resource_any(ntb->device, SYS_RES_MEMORY, 859 &bar->pci_resource_id, RF_ACTIVE); 860 861 if (bar->pci_resource == NULL) 862 return (ENXIO); 863 864 save_bar_parameters(bar); 865 /* 866 * Ivytown NTB BAR sizes are misreported by the hardware due to a 867 * hardware issue. To work around this, query the size it should be 868 * configured to by the device and modify the resource to correspond to 869 * this new size. 
The BIOS on systems with this problem is required to 870 * provide enough address space to allow the driver to make this change 871 * safely. 872 * 873 * Ideally I could have just specified the size when I allocated the 874 * resource like: 875 * bus_alloc_resource(ntb->device, 876 * SYS_RES_MEMORY, &bar->pci_resource_id, 0ul, ~0ul, 877 * 1ul << bar_size_bits, RF_ACTIVE); 878 * but the PCI driver does not honor the size in this call, so we have 879 * to modify it after the fact. 880 */ 881 if (HAS_FEATURE(ntb, NTB_BAR_SIZE_4K)) { 882 if (bar->pci_resource_id == PCIR_BAR(2)) 883 bar_size_bits = pci_read_config(ntb->device, 884 XEON_PBAR23SZ_OFFSET, 1); 885 else 886 bar_size_bits = pci_read_config(ntb->device, 887 XEON_PBAR45SZ_OFFSET, 1); 888 889 rc = bus_adjust_resource(ntb->device, SYS_RES_MEMORY, 890 bar->pci_resource, bar->pbase, 891 bar->pbase + (1ul << bar_size_bits) - 1); 892 if (rc != 0) { 893 device_printf(ntb->device, 894 "unable to resize bar\n"); 895 return (rc); 896 } 897 898 save_bar_parameters(bar); 899 } 900 901 bar->map_mode = VM_MEMATTR_UNCACHEABLE; 902 print_map_success(ntb, bar, "mw"); 903 904 /* 905 * Optionally, mark MW BARs as anything other than UC to improve 906 * performance. 
907 */ 908 mapmode = intel_ntb_pat_flags(); 909 if (mapmode == bar->map_mode) 910 return (0); 911 912 rc = pmap_change_attr((vm_offset_t)bar->vbase, bar->size, mapmode); 913 if (rc == 0) { 914 bar->map_mode = mapmode; 915 device_printf(ntb->device, 916 "Marked BAR%d v:[%p-%p] p:[%p-%p] as " 917 "%s.\n", 918 PCI_RID2BAR(bar->pci_resource_id), bar->vbase, 919 (char *)bar->vbase + bar->size - 1, 920 (void *)bar->pbase, (void *)(bar->pbase + bar->size - 1), 921 intel_ntb_vm_memattr_to_str(mapmode)); 922 } else 923 device_printf(ntb->device, 924 "Unable to mark BAR%d v:[%p-%p] p:[%p-%p] as " 925 "%s: %d\n", 926 PCI_RID2BAR(bar->pci_resource_id), bar->vbase, 927 (char *)bar->vbase + bar->size - 1, 928 (void *)bar->pbase, (void *)(bar->pbase + bar->size - 1), 929 intel_ntb_vm_memattr_to_str(mapmode), rc); 930 /* Proceed anyway */ 931 return (0); 932 } 933 934 static void 935 intel_ntb_unmap_pci_bar(struct ntb_softc *ntb) 936 { 937 struct ntb_pci_bar_info *current_bar; 938 int i; 939 940 for (i = 0; i < NTB_MAX_BARS; i++) { 941 current_bar = &ntb->bar_info[i]; 942 if (current_bar->pci_resource != NULL) 943 bus_release_resource(ntb->device, SYS_RES_MEMORY, 944 current_bar->pci_resource_id, 945 current_bar->pci_resource); 946 } 947 } 948 949 static int 950 intel_ntb_setup_msix(struct ntb_softc *ntb, uint32_t num_vectors) 951 { 952 uint32_t i; 953 int rc; 954 955 for (i = 0; i < num_vectors; i++) { 956 ntb->int_info[i].rid = i + 1; 957 ntb->int_info[i].res = bus_alloc_resource_any(ntb->device, 958 SYS_RES_IRQ, &ntb->int_info[i].rid, RF_ACTIVE); 959 if (ntb->int_info[i].res == NULL) { 960 device_printf(ntb->device, 961 "bus_alloc_resource failed\n"); 962 return (ENOMEM); 963 } 964 ntb->int_info[i].tag = NULL; 965 ntb->allocated_interrupts++; 966 rc = bus_setup_intr(ntb->device, ntb->int_info[i].res, 967 INTR_MPSAFE | INTR_TYPE_MISC, NULL, ndev_vec_isr, 968 &ntb->msix_vec[i], &ntb->int_info[i].tag); 969 if (rc != 0) { 970 device_printf(ntb->device, "bus_setup_intr failed\n"); 
971 return (ENXIO); 972 } 973 } 974 return (0); 975 } 976 977 /* 978 * The Linux NTB driver drops from MSI-X to legacy INTx if a unique vector 979 * cannot be allocated for each MSI-X message. JHB seems to think remapping 980 * should be okay. This tunable should enable us to test that hypothesis 981 * when someone gets their hands on some Xeon hardware. 982 */ 983 static int ntb_force_remap_mode; 984 SYSCTL_INT(_hw_ntb, OID_AUTO, force_remap_mode, CTLFLAG_RDTUN, 985 &ntb_force_remap_mode, 0, "If enabled, force MSI-X messages to be remapped" 986 " to a smaller number of ithreads, even if the desired number are " 987 "available"); 988 989 /* 990 * In case it is NOT ok, give consumers an abort button. 991 */ 992 static int ntb_prefer_intx; 993 SYSCTL_INT(_hw_ntb, OID_AUTO, prefer_intx_to_remap, CTLFLAG_RDTUN, 994 &ntb_prefer_intx, 0, "If enabled, prefer to use legacy INTx mode rather " 995 "than remapping MSI-X messages over available slots (match Linux driver " 996 "behavior)"); 997 998 /* 999 * Remap the desired number of MSI-X messages to available ithreads in a simple 1000 * round-robin fashion. 1001 */ 1002 static int 1003 intel_ntb_remap_msix(device_t dev, uint32_t desired, uint32_t avail) 1004 { 1005 u_int *vectors; 1006 uint32_t i; 1007 int rc; 1008 1009 if (ntb_prefer_intx != 0) 1010 return (ENXIO); 1011 1012 vectors = malloc(desired * sizeof(*vectors), M_NTB, M_ZERO | M_WAITOK); 1013 1014 for (i = 0; i < desired; i++) 1015 vectors[i] = (i % avail) + 1; 1016 1017 rc = pci_remap_msix(dev, desired, vectors); 1018 free(vectors, M_NTB); 1019 return (rc); 1020 } 1021 1022 static int 1023 intel_ntb_init_isr(struct ntb_softc *ntb) 1024 { 1025 uint32_t desired_vectors, num_vectors; 1026 int rc; 1027 1028 ntb->allocated_interrupts = 0; 1029 ntb->last_ts = ticks; 1030 1031 /* 1032 * Mask all doorbell interrupts. (Except link events!) 
1033 */ 1034 DB_MASK_LOCK(ntb); 1035 ntb->db_mask = ntb->db_valid_mask; 1036 db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask); 1037 DB_MASK_UNLOCK(ntb); 1038 1039 num_vectors = desired_vectors = MIN(pci_msix_count(ntb->device), 1040 ntb->db_count); 1041 if (desired_vectors >= 1) { 1042 rc = pci_alloc_msix(ntb->device, &num_vectors); 1043 1044 if (ntb_force_remap_mode != 0 && rc == 0 && 1045 num_vectors == desired_vectors) 1046 num_vectors--; 1047 1048 if (rc == 0 && num_vectors < desired_vectors) { 1049 rc = intel_ntb_remap_msix(ntb->device, desired_vectors, 1050 num_vectors); 1051 if (rc == 0) 1052 num_vectors = desired_vectors; 1053 else 1054 pci_release_msi(ntb->device); 1055 } 1056 if (rc != 0) 1057 num_vectors = 1; 1058 } else 1059 num_vectors = 1; 1060 1061 if (ntb->type == NTB_XEON && num_vectors < ntb->db_vec_count) { 1062 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 1063 device_printf(ntb->device, 1064 "Errata workaround does not support MSI or INTX\n"); 1065 return (EINVAL); 1066 } 1067 1068 ntb->db_vec_count = 1; 1069 ntb->db_vec_shift = XEON_DB_TOTAL_SHIFT; 1070 rc = intel_ntb_setup_legacy_interrupt(ntb); 1071 } else { 1072 if (num_vectors - 1 != XEON_NONLINK_DB_MSIX_BITS && 1073 HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 1074 device_printf(ntb->device, 1075 "Errata workaround expects %d doorbell bits\n", 1076 XEON_NONLINK_DB_MSIX_BITS); 1077 return (EINVAL); 1078 } 1079 1080 intel_ntb_create_msix_vec(ntb, num_vectors); 1081 rc = intel_ntb_setup_msix(ntb, num_vectors); 1082 } 1083 if (rc != 0) { 1084 device_printf(ntb->device, 1085 "Error allocating interrupts: %d\n", rc); 1086 intel_ntb_free_msix_vec(ntb); 1087 } 1088 1089 return (rc); 1090 } 1091 1092 static int 1093 intel_ntb_setup_legacy_interrupt(struct ntb_softc *ntb) 1094 { 1095 int rc; 1096 1097 ntb->int_info[0].rid = 0; 1098 ntb->int_info[0].res = bus_alloc_resource_any(ntb->device, SYS_RES_IRQ, 1099 &ntb->int_info[0].rid, RF_SHAREABLE|RF_ACTIVE); 1100 if (ntb->int_info[0].res == NULL) { 
1101 device_printf(ntb->device, "bus_alloc_resource failed\n"); 1102 return (ENOMEM); 1103 } 1104 1105 ntb->int_info[0].tag = NULL; 1106 ntb->allocated_interrupts = 1; 1107 1108 rc = bus_setup_intr(ntb->device, ntb->int_info[0].res, 1109 INTR_MPSAFE | INTR_TYPE_MISC, NULL, ndev_irq_isr, 1110 ntb, &ntb->int_info[0].tag); 1111 if (rc != 0) { 1112 device_printf(ntb->device, "bus_setup_intr failed\n"); 1113 return (ENXIO); 1114 } 1115 1116 return (0); 1117 } 1118 1119 static void 1120 intel_ntb_teardown_interrupts(struct ntb_softc *ntb) 1121 { 1122 struct ntb_int_info *current_int; 1123 int i; 1124 1125 for (i = 0; i < ntb->allocated_interrupts; i++) { 1126 current_int = &ntb->int_info[i]; 1127 if (current_int->tag != NULL) 1128 bus_teardown_intr(ntb->device, current_int->res, 1129 current_int->tag); 1130 1131 if (current_int->res != NULL) 1132 bus_release_resource(ntb->device, SYS_RES_IRQ, 1133 rman_get_rid(current_int->res), current_int->res); 1134 } 1135 1136 intel_ntb_free_msix_vec(ntb); 1137 pci_release_msi(ntb->device); 1138 } 1139 1140 /* 1141 * Doorbell register and mask are 64-bit on Atom, 16-bit on Xeon. Abstract it 1142 * out to make code clearer. 
1143 */ 1144 static inline uint64_t 1145 db_ioread(struct ntb_softc *ntb, uint64_t regoff) 1146 { 1147 1148 if (ntb->type == NTB_ATOM) 1149 return (intel_ntb_reg_read(8, regoff)); 1150 1151 KASSERT(ntb->type == NTB_XEON, ("bad ntb type")); 1152 1153 return (intel_ntb_reg_read(2, regoff)); 1154 } 1155 1156 static inline void 1157 db_iowrite(struct ntb_softc *ntb, uint64_t regoff, uint64_t val) 1158 { 1159 1160 KASSERT((val & ~ntb->db_valid_mask) == 0, 1161 ("%s: Invalid bits 0x%jx (valid: 0x%jx)", __func__, 1162 (uintmax_t)(val & ~ntb->db_valid_mask), 1163 (uintmax_t)ntb->db_valid_mask)); 1164 1165 if (regoff == ntb->self_reg->db_mask) 1166 DB_MASK_ASSERT(ntb, MA_OWNED); 1167 db_iowrite_raw(ntb, regoff, val); 1168 } 1169 1170 static inline void 1171 db_iowrite_raw(struct ntb_softc *ntb, uint64_t regoff, uint64_t val) 1172 { 1173 1174 if (ntb->type == NTB_ATOM) { 1175 intel_ntb_reg_write(8, regoff, val); 1176 return; 1177 } 1178 1179 KASSERT(ntb->type == NTB_XEON, ("bad ntb type")); 1180 intel_ntb_reg_write(2, regoff, (uint16_t)val); 1181 } 1182 1183 static void 1184 intel_ntb_db_set_mask(device_t dev, uint64_t bits) 1185 { 1186 struct ntb_softc *ntb = device_get_softc(dev); 1187 1188 DB_MASK_LOCK(ntb); 1189 ntb->db_mask |= bits; 1190 if (!HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) 1191 db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask); 1192 DB_MASK_UNLOCK(ntb); 1193 } 1194 1195 static void 1196 intel_ntb_db_clear_mask(device_t dev, uint64_t bits) 1197 { 1198 struct ntb_softc *ntb = device_get_softc(dev); 1199 uint64_t ibits; 1200 int i; 1201 1202 KASSERT((bits & ~ntb->db_valid_mask) == 0, 1203 ("%s: Invalid bits 0x%jx (valid: 0x%jx)", __func__, 1204 (uintmax_t)(bits & ~ntb->db_valid_mask), 1205 (uintmax_t)ntb->db_valid_mask)); 1206 1207 DB_MASK_LOCK(ntb); 1208 ibits = ntb->fake_db & ntb->db_mask & bits; 1209 ntb->db_mask &= ~bits; 1210 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 1211 /* Simulate fake interrupts if unmasked DB bits are set. 
*/ 1212 ntb->force_db |= ibits; 1213 for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) { 1214 if ((ibits & intel_ntb_db_vector_mask(dev, i)) != 0) 1215 swi_sched(ntb->int_info[i].tag, 0); 1216 } 1217 } else { 1218 db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask); 1219 } 1220 DB_MASK_UNLOCK(ntb); 1221 } 1222 1223 static uint64_t 1224 intel_ntb_db_read(device_t dev) 1225 { 1226 struct ntb_softc *ntb = device_get_softc(dev); 1227 1228 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) 1229 return (ntb->fake_db); 1230 1231 return (db_ioread(ntb, ntb->self_reg->db_bell)); 1232 } 1233 1234 static void 1235 intel_ntb_db_clear(device_t dev, uint64_t bits) 1236 { 1237 struct ntb_softc *ntb = device_get_softc(dev); 1238 1239 KASSERT((bits & ~ntb->db_valid_mask) == 0, 1240 ("%s: Invalid bits 0x%jx (valid: 0x%jx)", __func__, 1241 (uintmax_t)(bits & ~ntb->db_valid_mask), 1242 (uintmax_t)ntb->db_valid_mask)); 1243 1244 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 1245 DB_MASK_LOCK(ntb); 1246 ntb->fake_db &= ~bits; 1247 DB_MASK_UNLOCK(ntb); 1248 return; 1249 } 1250 1251 db_iowrite(ntb, ntb->self_reg->db_bell, bits); 1252 } 1253 1254 static inline uint64_t 1255 intel_ntb_vec_mask(struct ntb_softc *ntb, uint64_t db_vector) 1256 { 1257 uint64_t shift, mask; 1258 1259 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 1260 /* 1261 * Remap vectors in custom way to make at least first 1262 * three doorbells to not generate stray events. 1263 * This breaks Linux compatibility (if one existed) 1264 * when more then one DB is used (not by if_ntb). 
1265 */ 1266 if (db_vector < XEON_NONLINK_DB_MSIX_BITS - 1) 1267 return (1 << db_vector); 1268 if (db_vector == XEON_NONLINK_DB_MSIX_BITS - 1) 1269 return (0x7ffc); 1270 } 1271 1272 shift = ntb->db_vec_shift; 1273 mask = (1ull << shift) - 1; 1274 return (mask << (shift * db_vector)); 1275 } 1276 1277 static void 1278 intel_ntb_interrupt(struct ntb_softc *ntb, uint32_t vec) 1279 { 1280 uint64_t vec_mask; 1281 1282 ntb->last_ts = ticks; 1283 vec_mask = intel_ntb_vec_mask(ntb, vec); 1284 1285 if ((vec_mask & ntb->db_link_mask) != 0) { 1286 if (intel_ntb_poll_link(ntb)) 1287 ntb_link_event(ntb->device); 1288 } 1289 1290 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP) && 1291 (vec_mask & ntb->db_link_mask) == 0) { 1292 DB_MASK_LOCK(ntb); 1293 1294 /* 1295 * Do not report same DB events again if not cleared yet, 1296 * unless the mask was just cleared for them and this 1297 * interrupt handler call can be the consequence of it. 1298 */ 1299 vec_mask &= ~ntb->fake_db | ntb->force_db; 1300 ntb->force_db &= ~vec_mask; 1301 1302 /* Update our internal doorbell register. */ 1303 ntb->fake_db |= vec_mask; 1304 1305 /* Do not report masked DB events. */ 1306 vec_mask &= ~ntb->db_mask; 1307 1308 DB_MASK_UNLOCK(ntb); 1309 } 1310 1311 if ((vec_mask & ntb->db_valid_mask) != 0) 1312 ntb_db_event(ntb->device, vec); 1313 } 1314 1315 static void 1316 ndev_vec_isr(void *arg) 1317 { 1318 struct ntb_vec *nvec = arg; 1319 1320 intel_ntb_interrupt(nvec->ntb, nvec->num); 1321 } 1322 1323 static void 1324 ndev_irq_isr(void *arg) 1325 { 1326 /* If we couldn't set up MSI-X, we only have the one vector. 
*/ 1327 intel_ntb_interrupt(arg, 0); 1328 } 1329 1330 static int 1331 intel_ntb_create_msix_vec(struct ntb_softc *ntb, uint32_t num_vectors) 1332 { 1333 uint32_t i; 1334 1335 ntb->msix_vec = malloc(num_vectors * sizeof(*ntb->msix_vec), M_NTB, 1336 M_ZERO | M_WAITOK); 1337 for (i = 0; i < num_vectors; i++) { 1338 ntb->msix_vec[i].num = i; 1339 ntb->msix_vec[i].ntb = ntb; 1340 } 1341 1342 return (0); 1343 } 1344 1345 static void 1346 intel_ntb_free_msix_vec(struct ntb_softc *ntb) 1347 { 1348 1349 if (ntb->msix_vec == NULL) 1350 return; 1351 1352 free(ntb->msix_vec, M_NTB); 1353 ntb->msix_vec = NULL; 1354 } 1355 1356 static void 1357 intel_ntb_get_msix_info(struct ntb_softc *ntb) 1358 { 1359 struct pci_devinfo *dinfo; 1360 struct pcicfg_msix *msix; 1361 uint32_t laddr, data, i, offset; 1362 1363 dinfo = device_get_ivars(ntb->device); 1364 msix = &dinfo->cfg.msix; 1365 1366 CTASSERT(XEON_NONLINK_DB_MSIX_BITS == nitems(ntb->msix_data)); 1367 1368 for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) { 1369 offset = msix->msix_table_offset + i * PCI_MSIX_ENTRY_SIZE; 1370 1371 laddr = bus_read_4(msix->msix_table_res, offset + 1372 PCI_MSIX_ENTRY_LOWER_ADDR); 1373 intel_ntb_printf(2, "local MSIX addr(%u): 0x%x\n", i, laddr); 1374 1375 KASSERT((laddr & MSI_INTEL_ADDR_BASE) == MSI_INTEL_ADDR_BASE, 1376 ("local MSIX addr 0x%x not in MSI base 0x%x", laddr, 1377 MSI_INTEL_ADDR_BASE)); 1378 ntb->msix_data[i].nmd_ofs = laddr; 1379 1380 data = bus_read_4(msix->msix_table_res, offset + 1381 PCI_MSIX_ENTRY_DATA); 1382 intel_ntb_printf(2, "local MSIX data(%u): 0x%x\n", i, data); 1383 1384 ntb->msix_data[i].nmd_data = data; 1385 } 1386 } 1387 1388 static struct ntb_hw_info * 1389 intel_ntb_get_device_info(uint32_t device_id) 1390 { 1391 struct ntb_hw_info *ep; 1392 1393 for (ep = pci_ids; ep < &pci_ids[nitems(pci_ids)]; ep++) { 1394 if (ep->device_id == device_id) 1395 return (ep); 1396 } 1397 return (NULL); 1398 } 1399 1400 static void 1401 intel_ntb_teardown_xeon(struct ntb_softc *ntb) 
1402 { 1403 1404 if (ntb->reg != NULL) 1405 intel_ntb_link_disable(ntb->device); 1406 } 1407 1408 static void 1409 intel_ntb_detect_max_mw(struct ntb_softc *ntb) 1410 { 1411 1412 if (ntb->type == NTB_ATOM) { 1413 ntb->mw_count = ATOM_MW_COUNT; 1414 return; 1415 } 1416 1417 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) 1418 ntb->mw_count = XEON_HSX_SPLIT_MW_COUNT; 1419 else 1420 ntb->mw_count = XEON_SNB_MW_COUNT; 1421 } 1422 1423 static int 1424 intel_ntb_detect_xeon(struct ntb_softc *ntb) 1425 { 1426 uint8_t ppd, conn_type; 1427 1428 ppd = pci_read_config(ntb->device, NTB_PPD_OFFSET, 1); 1429 ntb->ppd = ppd; 1430 1431 if ((ppd & XEON_PPD_DEV_TYPE) != 0) 1432 ntb->dev_type = NTB_DEV_DSD; 1433 else 1434 ntb->dev_type = NTB_DEV_USD; 1435 1436 if ((ppd & XEON_PPD_SPLIT_BAR) != 0) 1437 ntb->features |= NTB_SPLIT_BAR; 1438 1439 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP) && 1440 !HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 1441 device_printf(ntb->device, 1442 "Can not apply SB01BASE_LOCKUP workaround " 1443 "with split BARs disabled!\n"); 1444 device_printf(ntb->device, 1445 "Expect system hangs under heavy NTB traffic!\n"); 1446 ntb->features &= ~NTB_SB01BASE_LOCKUP; 1447 } 1448 1449 /* 1450 * SDOORBELL errata workaround gets in the way of SB01BASE_LOCKUP 1451 * errata workaround; only do one at a time. 
1452 */ 1453 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) 1454 ntb->features &= ~NTB_SDOORBELL_LOCKUP; 1455 1456 conn_type = ppd & XEON_PPD_CONN_TYPE; 1457 switch (conn_type) { 1458 case NTB_CONN_B2B: 1459 ntb->conn_type = conn_type; 1460 break; 1461 case NTB_CONN_RP: 1462 case NTB_CONN_TRANSPARENT: 1463 default: 1464 device_printf(ntb->device, "Unsupported connection type: %u\n", 1465 (unsigned)conn_type); 1466 return (ENXIO); 1467 } 1468 return (0); 1469 } 1470 1471 static int 1472 intel_ntb_detect_atom(struct ntb_softc *ntb) 1473 { 1474 uint32_t ppd, conn_type; 1475 1476 ppd = pci_read_config(ntb->device, NTB_PPD_OFFSET, 4); 1477 ntb->ppd = ppd; 1478 1479 if ((ppd & ATOM_PPD_DEV_TYPE) != 0) 1480 ntb->dev_type = NTB_DEV_DSD; 1481 else 1482 ntb->dev_type = NTB_DEV_USD; 1483 1484 conn_type = (ppd & ATOM_PPD_CONN_TYPE) >> 8; 1485 switch (conn_type) { 1486 case NTB_CONN_B2B: 1487 ntb->conn_type = conn_type; 1488 break; 1489 default: 1490 device_printf(ntb->device, "Unsupported NTB configuration\n"); 1491 return (ENXIO); 1492 } 1493 return (0); 1494 } 1495 1496 static int 1497 intel_ntb_xeon_init_dev(struct ntb_softc *ntb) 1498 { 1499 int rc; 1500 1501 ntb->spad_count = XEON_SPAD_COUNT; 1502 ntb->db_count = XEON_DB_COUNT; 1503 ntb->db_link_mask = XEON_DB_LINK_BIT; 1504 ntb->db_vec_count = XEON_DB_MSIX_VECTOR_COUNT; 1505 ntb->db_vec_shift = XEON_DB_MSIX_VECTOR_SHIFT; 1506 1507 if (ntb->conn_type != NTB_CONN_B2B) { 1508 device_printf(ntb->device, "Connection type %d not supported\n", 1509 ntb->conn_type); 1510 return (ENXIO); 1511 } 1512 1513 ntb->reg = &xeon_reg; 1514 ntb->self_reg = &xeon_pri_reg; 1515 ntb->peer_reg = &xeon_b2b_reg; 1516 ntb->xlat_reg = &xeon_sec_xlat; 1517 1518 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 1519 ntb->force_db = ntb->fake_db = 0; 1520 ntb->msix_mw_idx = (ntb->mw_count + g_ntb_msix_idx) % 1521 ntb->mw_count; 1522 intel_ntb_printf(2, "Setting up MSIX mw idx %d means %u\n", 1523 g_ntb_msix_idx, ntb->msix_mw_idx); 1524 rc = 
intel_ntb_mw_set_wc_internal(ntb, ntb->msix_mw_idx, 1525 VM_MEMATTR_UNCACHEABLE); 1526 KASSERT(rc == 0, ("shouldn't fail")); 1527 } else if (HAS_FEATURE(ntb, NTB_SDOORBELL_LOCKUP)) { 1528 /* 1529 * There is a Xeon hardware errata related to writes to SDOORBELL or 1530 * B2BDOORBELL in conjunction with inbound access to NTB MMIO space, 1531 * which may hang the system. To workaround this, use a memory 1532 * window to access the interrupt and scratch pad registers on the 1533 * remote system. 1534 */ 1535 ntb->b2b_mw_idx = (ntb->mw_count + g_ntb_mw_idx) % 1536 ntb->mw_count; 1537 intel_ntb_printf(2, "Setting up b2b mw idx %d means %u\n", 1538 g_ntb_mw_idx, ntb->b2b_mw_idx); 1539 rc = intel_ntb_mw_set_wc_internal(ntb, ntb->b2b_mw_idx, 1540 VM_MEMATTR_UNCACHEABLE); 1541 KASSERT(rc == 0, ("shouldn't fail")); 1542 } else if (HAS_FEATURE(ntb, NTB_B2BDOORBELL_BIT14)) 1543 /* 1544 * HW Errata on bit 14 of b2bdoorbell register. Writes will not be 1545 * mirrored to the remote system. Shrink the number of bits by one, 1546 * since bit 14 is the last bit. 1547 * 1548 * On REGS_THRU_MW errata mode, we don't use the b2bdoorbell register 1549 * anyway. Nor for non-B2B connection types. 1550 */ 1551 ntb->db_count = XEON_DB_COUNT - 1; 1552 1553 ntb->db_valid_mask = (1ull << ntb->db_count) - 1; 1554 1555 if (ntb->dev_type == NTB_DEV_USD) 1556 rc = xeon_setup_b2b_mw(ntb, &xeon_b2b_dsd_addr, 1557 &xeon_b2b_usd_addr); 1558 else 1559 rc = xeon_setup_b2b_mw(ntb, &xeon_b2b_usd_addr, 1560 &xeon_b2b_dsd_addr); 1561 if (rc != 0) 1562 return (rc); 1563 1564 /* Enable Bus Master and Memory Space on the secondary side */ 1565 intel_ntb_reg_write(2, XEON_SPCICMD_OFFSET, 1566 PCIM_CMD_MEMEN | PCIM_CMD_BUSMASTEREN); 1567 1568 /* 1569 * Mask all doorbell interrupts. 
1570 */ 1571 DB_MASK_LOCK(ntb); 1572 ntb->db_mask = ntb->db_valid_mask; 1573 db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask); 1574 DB_MASK_UNLOCK(ntb); 1575 1576 rc = intel_ntb_init_isr(ntb); 1577 return (rc); 1578 } 1579 1580 static int 1581 intel_ntb_atom_init_dev(struct ntb_softc *ntb) 1582 { 1583 int error; 1584 1585 KASSERT(ntb->conn_type == NTB_CONN_B2B, 1586 ("Unsupported NTB configuration (%d)\n", ntb->conn_type)); 1587 1588 ntb->spad_count = ATOM_SPAD_COUNT; 1589 ntb->db_count = ATOM_DB_COUNT; 1590 ntb->db_vec_count = ATOM_DB_MSIX_VECTOR_COUNT; 1591 ntb->db_vec_shift = ATOM_DB_MSIX_VECTOR_SHIFT; 1592 ntb->db_valid_mask = (1ull << ntb->db_count) - 1; 1593 1594 ntb->reg = &atom_reg; 1595 ntb->self_reg = &atom_pri_reg; 1596 ntb->peer_reg = &atom_b2b_reg; 1597 ntb->xlat_reg = &atom_sec_xlat; 1598 1599 /* 1600 * FIXME - MSI-X bug on early Atom HW, remove once internal issue is 1601 * resolved. Mask transaction layer internal parity errors. 1602 */ 1603 pci_write_config(ntb->device, 0xFC, 0x4, 4); 1604 1605 configure_atom_secondary_side_bars(ntb); 1606 1607 /* Enable Bus Master and Memory Space on the secondary side */ 1608 intel_ntb_reg_write(2, ATOM_SPCICMD_OFFSET, 1609 PCIM_CMD_MEMEN | PCIM_CMD_BUSMASTEREN); 1610 1611 error = intel_ntb_init_isr(ntb); 1612 if (error != 0) 1613 return (error); 1614 1615 /* Initiate PCI-E link training */ 1616 intel_ntb_link_enable(ntb->device, NTB_SPEED_AUTO, NTB_WIDTH_AUTO); 1617 1618 callout_reset(&ntb->heartbeat_timer, 0, atom_link_hb, ntb); 1619 1620 return (0); 1621 } 1622 1623 /* XXX: Linux driver doesn't seem to do any of this for Atom. 
*/ 1624 static void 1625 configure_atom_secondary_side_bars(struct ntb_softc *ntb) 1626 { 1627 1628 if (ntb->dev_type == NTB_DEV_USD) { 1629 intel_ntb_reg_write(8, ATOM_PBAR2XLAT_OFFSET, 1630 XEON_B2B_BAR2_ADDR64); 1631 intel_ntb_reg_write(8, ATOM_PBAR4XLAT_OFFSET, 1632 XEON_B2B_BAR4_ADDR64); 1633 intel_ntb_reg_write(8, ATOM_MBAR23_OFFSET, XEON_B2B_BAR2_ADDR64); 1634 intel_ntb_reg_write(8, ATOM_MBAR45_OFFSET, XEON_B2B_BAR4_ADDR64); 1635 } else { 1636 intel_ntb_reg_write(8, ATOM_PBAR2XLAT_OFFSET, 1637 XEON_B2B_BAR2_ADDR64); 1638 intel_ntb_reg_write(8, ATOM_PBAR4XLAT_OFFSET, 1639 XEON_B2B_BAR4_ADDR64); 1640 intel_ntb_reg_write(8, ATOM_MBAR23_OFFSET, XEON_B2B_BAR2_ADDR64); 1641 intel_ntb_reg_write(8, ATOM_MBAR45_OFFSET, XEON_B2B_BAR4_ADDR64); 1642 } 1643 } 1644 1645 1646 /* 1647 * When working around Xeon SDOORBELL errata by remapping remote registers in a 1648 * MW, limit the B2B MW to half a MW. By sharing a MW, half the shared MW 1649 * remains for use by a higher layer. 1650 * 1651 * Will only be used if working around SDOORBELL errata and the BIOS-configured 1652 * MW size is sufficiently large. 1653 */ 1654 static unsigned int ntb_b2b_mw_share; 1655 SYSCTL_UINT(_hw_ntb, OID_AUTO, b2b_mw_share, CTLFLAG_RDTUN, &ntb_b2b_mw_share, 1656 0, "If enabled (non-zero), prefer to share half of the B2B peer register " 1657 "MW with higher level consumers. 
Both sides of the NTB MUST set the same " 1658 "value here."); 1659 1660 static void 1661 xeon_reset_sbar_size(struct ntb_softc *ntb, enum ntb_bar idx, 1662 enum ntb_bar regbar) 1663 { 1664 struct ntb_pci_bar_info *bar; 1665 uint8_t bar_sz; 1666 1667 if (!HAS_FEATURE(ntb, NTB_SPLIT_BAR) && idx >= NTB_B2B_BAR_3) 1668 return; 1669 1670 bar = &ntb->bar_info[idx]; 1671 bar_sz = pci_read_config(ntb->device, bar->psz_off, 1); 1672 if (idx == regbar) { 1673 if (ntb->b2b_off != 0) 1674 bar_sz--; 1675 else 1676 bar_sz = 0; 1677 } 1678 pci_write_config(ntb->device, bar->ssz_off, bar_sz, 1); 1679 bar_sz = pci_read_config(ntb->device, bar->ssz_off, 1); 1680 (void)bar_sz; 1681 } 1682 1683 static void 1684 xeon_set_sbar_base_and_limit(struct ntb_softc *ntb, uint64_t bar_addr, 1685 enum ntb_bar idx, enum ntb_bar regbar) 1686 { 1687 uint64_t reg_val; 1688 uint32_t base_reg, lmt_reg; 1689 1690 bar_get_xlat_params(ntb, idx, &base_reg, NULL, &lmt_reg); 1691 if (idx == regbar) { 1692 if (ntb->b2b_off) 1693 bar_addr += ntb->b2b_off; 1694 else 1695 bar_addr = 0; 1696 } 1697 1698 if (!bar_is_64bit(ntb, idx)) { 1699 intel_ntb_reg_write(4, base_reg, bar_addr); 1700 reg_val = intel_ntb_reg_read(4, base_reg); 1701 (void)reg_val; 1702 1703 intel_ntb_reg_write(4, lmt_reg, bar_addr); 1704 reg_val = intel_ntb_reg_read(4, lmt_reg); 1705 (void)reg_val; 1706 } else { 1707 intel_ntb_reg_write(8, base_reg, bar_addr); 1708 reg_val = intel_ntb_reg_read(8, base_reg); 1709 (void)reg_val; 1710 1711 intel_ntb_reg_write(8, lmt_reg, bar_addr); 1712 reg_val = intel_ntb_reg_read(8, lmt_reg); 1713 (void)reg_val; 1714 } 1715 } 1716 1717 static void 1718 xeon_set_pbar_xlat(struct ntb_softc *ntb, uint64_t base_addr, enum ntb_bar idx) 1719 { 1720 struct ntb_pci_bar_info *bar; 1721 1722 bar = &ntb->bar_info[idx]; 1723 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR) && idx >= NTB_B2B_BAR_2) { 1724 intel_ntb_reg_write(4, bar->pbarxlat_off, base_addr); 1725 base_addr = intel_ntb_reg_read(4, bar->pbarxlat_off); 1726 } else { 1727 
intel_ntb_reg_write(8, bar->pbarxlat_off, base_addr); 1728 base_addr = intel_ntb_reg_read(8, bar->pbarxlat_off); 1729 } 1730 (void)base_addr; 1731 } 1732 1733 static int 1734 xeon_setup_b2b_mw(struct ntb_softc *ntb, const struct ntb_b2b_addr *addr, 1735 const struct ntb_b2b_addr *peer_addr) 1736 { 1737 struct ntb_pci_bar_info *b2b_bar; 1738 vm_size_t bar_size; 1739 uint64_t bar_addr; 1740 enum ntb_bar b2b_bar_num, i; 1741 1742 if (ntb->b2b_mw_idx == B2B_MW_DISABLED) { 1743 b2b_bar = NULL; 1744 b2b_bar_num = NTB_CONFIG_BAR; 1745 ntb->b2b_off = 0; 1746 } else { 1747 b2b_bar_num = intel_ntb_mw_to_bar(ntb, ntb->b2b_mw_idx); 1748 KASSERT(b2b_bar_num > 0 && b2b_bar_num < NTB_MAX_BARS, 1749 ("invalid b2b mw bar")); 1750 1751 b2b_bar = &ntb->bar_info[b2b_bar_num]; 1752 bar_size = b2b_bar->size; 1753 1754 if (ntb_b2b_mw_share != 0 && 1755 (bar_size >> 1) >= XEON_B2B_MIN_SIZE) 1756 ntb->b2b_off = bar_size >> 1; 1757 else if (bar_size >= XEON_B2B_MIN_SIZE) { 1758 ntb->b2b_off = 0; 1759 } else { 1760 device_printf(ntb->device, 1761 "B2B bar size is too small!\n"); 1762 return (EIO); 1763 } 1764 } 1765 1766 /* 1767 * Reset the secondary bar sizes to match the primary bar sizes. 1768 * (Except, disable or halve the size of the B2B secondary bar.) 
1769 */ 1770 for (i = NTB_B2B_BAR_1; i < NTB_MAX_BARS; i++) 1771 xeon_reset_sbar_size(ntb, i, b2b_bar_num); 1772 1773 bar_addr = 0; 1774 if (b2b_bar_num == NTB_CONFIG_BAR) 1775 bar_addr = addr->bar0_addr; 1776 else if (b2b_bar_num == NTB_B2B_BAR_1) 1777 bar_addr = addr->bar2_addr64; 1778 else if (b2b_bar_num == NTB_B2B_BAR_2 && !HAS_FEATURE(ntb, NTB_SPLIT_BAR)) 1779 bar_addr = addr->bar4_addr64; 1780 else if (b2b_bar_num == NTB_B2B_BAR_2) 1781 bar_addr = addr->bar4_addr32; 1782 else if (b2b_bar_num == NTB_B2B_BAR_3) 1783 bar_addr = addr->bar5_addr32; 1784 else 1785 KASSERT(false, ("invalid bar")); 1786 1787 intel_ntb_reg_write(8, XEON_SBAR0BASE_OFFSET, bar_addr); 1788 1789 /* 1790 * Other SBARs are normally hit by the PBAR xlat, except for the b2b 1791 * register BAR. The B2B BAR is either disabled above or configured 1792 * half-size. It starts at PBAR xlat + offset. 1793 * 1794 * Also set up incoming BAR limits == base (zero length window). 1795 */ 1796 xeon_set_sbar_base_and_limit(ntb, addr->bar2_addr64, NTB_B2B_BAR_1, 1797 b2b_bar_num); 1798 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 1799 xeon_set_sbar_base_and_limit(ntb, addr->bar4_addr32, 1800 NTB_B2B_BAR_2, b2b_bar_num); 1801 xeon_set_sbar_base_and_limit(ntb, addr->bar5_addr32, 1802 NTB_B2B_BAR_3, b2b_bar_num); 1803 } else 1804 xeon_set_sbar_base_and_limit(ntb, addr->bar4_addr64, 1805 NTB_B2B_BAR_2, b2b_bar_num); 1806 1807 /* Zero incoming translation addrs */ 1808 intel_ntb_reg_write(8, XEON_SBAR2XLAT_OFFSET, 0); 1809 intel_ntb_reg_write(8, XEON_SBAR4XLAT_OFFSET, 0); 1810 1811 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 1812 uint32_t xlat_reg, lmt_reg; 1813 enum ntb_bar bar_num; 1814 1815 /* 1816 * We point the chosen MSIX MW BAR xlat to remote LAPIC for 1817 * workaround 1818 */ 1819 bar_num = intel_ntb_mw_to_bar(ntb, ntb->msix_mw_idx); 1820 bar_get_xlat_params(ntb, bar_num, NULL, &xlat_reg, &lmt_reg); 1821 if (bar_is_64bit(ntb, bar_num)) { 1822 intel_ntb_reg_write(8, xlat_reg, MSI_INTEL_ADDR_BASE); 1823 
ntb->msix_xlat = intel_ntb_reg_read(8, xlat_reg); 1824 intel_ntb_reg_write(8, lmt_reg, 0); 1825 } else { 1826 intel_ntb_reg_write(4, xlat_reg, MSI_INTEL_ADDR_BASE); 1827 ntb->msix_xlat = intel_ntb_reg_read(4, xlat_reg); 1828 intel_ntb_reg_write(4, lmt_reg, 0); 1829 } 1830 1831 ntb->peer_lapic_bar = &ntb->bar_info[bar_num]; 1832 } 1833 (void)intel_ntb_reg_read(8, XEON_SBAR2XLAT_OFFSET); 1834 (void)intel_ntb_reg_read(8, XEON_SBAR4XLAT_OFFSET); 1835 1836 /* Zero outgoing translation limits (whole bar size windows) */ 1837 intel_ntb_reg_write(8, XEON_PBAR2LMT_OFFSET, 0); 1838 intel_ntb_reg_write(8, XEON_PBAR4LMT_OFFSET, 0); 1839 1840 /* Set outgoing translation offsets */ 1841 xeon_set_pbar_xlat(ntb, peer_addr->bar2_addr64, NTB_B2B_BAR_1); 1842 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 1843 xeon_set_pbar_xlat(ntb, peer_addr->bar4_addr32, NTB_B2B_BAR_2); 1844 xeon_set_pbar_xlat(ntb, peer_addr->bar5_addr32, NTB_B2B_BAR_3); 1845 } else 1846 xeon_set_pbar_xlat(ntb, peer_addr->bar4_addr64, NTB_B2B_BAR_2); 1847 1848 /* Set the translation offset for B2B registers */ 1849 bar_addr = 0; 1850 if (b2b_bar_num == NTB_CONFIG_BAR) 1851 bar_addr = peer_addr->bar0_addr; 1852 else if (b2b_bar_num == NTB_B2B_BAR_1) 1853 bar_addr = peer_addr->bar2_addr64; 1854 else if (b2b_bar_num == NTB_B2B_BAR_2 && !HAS_FEATURE(ntb, NTB_SPLIT_BAR)) 1855 bar_addr = peer_addr->bar4_addr64; 1856 else if (b2b_bar_num == NTB_B2B_BAR_2) 1857 bar_addr = peer_addr->bar4_addr32; 1858 else if (b2b_bar_num == NTB_B2B_BAR_3) 1859 bar_addr = peer_addr->bar5_addr32; 1860 else 1861 KASSERT(false, ("invalid bar")); 1862 1863 /* 1864 * B2B_XLAT_OFFSET is a 64-bit register but can only be written 32 bits 1865 * at a time. 
1866 */ 1867 intel_ntb_reg_write(4, XEON_B2B_XLAT_OFFSETL, bar_addr & 0xffffffff); 1868 intel_ntb_reg_write(4, XEON_B2B_XLAT_OFFSETU, bar_addr >> 32); 1869 return (0); 1870 } 1871 1872 static inline bool 1873 _xeon_link_is_up(struct ntb_softc *ntb) 1874 { 1875 1876 if (ntb->conn_type == NTB_CONN_TRANSPARENT) 1877 return (true); 1878 return ((ntb->lnk_sta & NTB_LINK_STATUS_ACTIVE) != 0); 1879 } 1880 1881 static inline bool 1882 link_is_up(struct ntb_softc *ntb) 1883 { 1884 1885 if (ntb->type == NTB_XEON) 1886 return (_xeon_link_is_up(ntb) && (ntb->peer_msix_good || 1887 !HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP))); 1888 1889 KASSERT(ntb->type == NTB_ATOM, ("ntb type")); 1890 return ((ntb->ntb_ctl & ATOM_CNTL_LINK_DOWN) == 0); 1891 } 1892 1893 static inline bool 1894 atom_link_is_err(struct ntb_softc *ntb) 1895 { 1896 uint32_t status; 1897 1898 KASSERT(ntb->type == NTB_ATOM, ("ntb type")); 1899 1900 status = intel_ntb_reg_read(4, ATOM_LTSSMSTATEJMP_OFFSET); 1901 if ((status & ATOM_LTSSMSTATEJMP_FORCEDETECT) != 0) 1902 return (true); 1903 1904 status = intel_ntb_reg_read(4, ATOM_IBSTERRRCRVSTS0_OFFSET); 1905 return ((status & ATOM_IBIST_ERR_OFLOW) != 0); 1906 } 1907 1908 /* Atom does not have link status interrupt, poll on that platform */ 1909 static void 1910 atom_link_hb(void *arg) 1911 { 1912 struct ntb_softc *ntb = arg; 1913 sbintime_t timo, poll_ts; 1914 1915 timo = NTB_HB_TIMEOUT * hz; 1916 poll_ts = ntb->last_ts + timo; 1917 1918 /* 1919 * Delay polling the link status if an interrupt was received, unless 1920 * the cached link status says the link is down. 
1921 */ 1922 if ((sbintime_t)ticks - poll_ts < 0 && link_is_up(ntb)) { 1923 timo = poll_ts - ticks; 1924 goto out; 1925 } 1926 1927 if (intel_ntb_poll_link(ntb)) 1928 ntb_link_event(ntb->device); 1929 1930 if (!link_is_up(ntb) && atom_link_is_err(ntb)) { 1931 /* Link is down with error, proceed with recovery */ 1932 callout_reset(&ntb->lr_timer, 0, recover_atom_link, ntb); 1933 return; 1934 } 1935 1936 out: 1937 callout_reset(&ntb->heartbeat_timer, timo, atom_link_hb, ntb); 1938 } 1939 1940 static void 1941 atom_perform_link_restart(struct ntb_softc *ntb) 1942 { 1943 uint32_t status; 1944 1945 /* Driver resets the NTB ModPhy lanes - magic! */ 1946 intel_ntb_reg_write(1, ATOM_MODPHY_PCSREG6, 0xe0); 1947 intel_ntb_reg_write(1, ATOM_MODPHY_PCSREG4, 0x40); 1948 intel_ntb_reg_write(1, ATOM_MODPHY_PCSREG4, 0x60); 1949 intel_ntb_reg_write(1, ATOM_MODPHY_PCSREG6, 0x60); 1950 1951 /* Driver waits 100ms to allow the NTB ModPhy to settle */ 1952 pause("ModPhy", hz / 10); 1953 1954 /* Clear AER Errors, write to clear */ 1955 status = intel_ntb_reg_read(4, ATOM_ERRCORSTS_OFFSET); 1956 status &= PCIM_AER_COR_REPLAY_ROLLOVER; 1957 intel_ntb_reg_write(4, ATOM_ERRCORSTS_OFFSET, status); 1958 1959 /* Clear unexpected electrical idle event in LTSSM, write to clear */ 1960 status = intel_ntb_reg_read(4, ATOM_LTSSMERRSTS0_OFFSET); 1961 status |= ATOM_LTSSMERRSTS0_UNEXPECTEDEI; 1962 intel_ntb_reg_write(4, ATOM_LTSSMERRSTS0_OFFSET, status); 1963 1964 /* Clear DeSkew Buffer error, write to clear */ 1965 status = intel_ntb_reg_read(4, ATOM_DESKEWSTS_OFFSET); 1966 status |= ATOM_DESKEWSTS_DBERR; 1967 intel_ntb_reg_write(4, ATOM_DESKEWSTS_OFFSET, status); 1968 1969 status = intel_ntb_reg_read(4, ATOM_IBSTERRRCRVSTS0_OFFSET); 1970 status &= ATOM_IBIST_ERR_OFLOW; 1971 intel_ntb_reg_write(4, ATOM_IBSTERRRCRVSTS0_OFFSET, status); 1972 1973 /* Releases the NTB state machine to allow the link to retrain */ 1974 status = intel_ntb_reg_read(4, ATOM_LTSSMSTATEJMP_OFFSET); 1975 status &= 
~ATOM_LTSSMSTATEJMP_FORCEDETECT; 1976 intel_ntb_reg_write(4, ATOM_LTSSMSTATEJMP_OFFSET, status); 1977 } 1978 1979 static int 1980 intel_ntb_link_enable(device_t dev, enum ntb_speed speed __unused, 1981 enum ntb_width width __unused) 1982 { 1983 struct ntb_softc *ntb = device_get_softc(dev); 1984 uint32_t cntl; 1985 1986 intel_ntb_printf(2, "%s\n", __func__); 1987 1988 if (ntb->type == NTB_ATOM) { 1989 pci_write_config(ntb->device, NTB_PPD_OFFSET, 1990 ntb->ppd | ATOM_PPD_INIT_LINK, 4); 1991 return (0); 1992 } 1993 1994 if (ntb->conn_type == NTB_CONN_TRANSPARENT) { 1995 ntb_link_event(dev); 1996 return (0); 1997 } 1998 1999 cntl = intel_ntb_reg_read(4, ntb->reg->ntb_ctl); 2000 cntl &= ~(NTB_CNTL_LINK_DISABLE | NTB_CNTL_CFG_LOCK); 2001 cntl |= NTB_CNTL_P2S_BAR23_SNOOP | NTB_CNTL_S2P_BAR23_SNOOP; 2002 cntl |= NTB_CNTL_P2S_BAR4_SNOOP | NTB_CNTL_S2P_BAR4_SNOOP; 2003 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) 2004 cntl |= NTB_CNTL_P2S_BAR5_SNOOP | NTB_CNTL_S2P_BAR5_SNOOP; 2005 intel_ntb_reg_write(4, ntb->reg->ntb_ctl, cntl); 2006 return (0); 2007 } 2008 2009 static int 2010 intel_ntb_link_disable(device_t dev) 2011 { 2012 struct ntb_softc *ntb = device_get_softc(dev); 2013 uint32_t cntl; 2014 2015 intel_ntb_printf(2, "%s\n", __func__); 2016 2017 if (ntb->conn_type == NTB_CONN_TRANSPARENT) { 2018 ntb_link_event(dev); 2019 return (0); 2020 } 2021 2022 cntl = intel_ntb_reg_read(4, ntb->reg->ntb_ctl); 2023 cntl &= ~(NTB_CNTL_P2S_BAR23_SNOOP | NTB_CNTL_S2P_BAR23_SNOOP); 2024 cntl &= ~(NTB_CNTL_P2S_BAR4_SNOOP | NTB_CNTL_S2P_BAR4_SNOOP); 2025 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) 2026 cntl &= ~(NTB_CNTL_P2S_BAR5_SNOOP | NTB_CNTL_S2P_BAR5_SNOOP); 2027 cntl |= NTB_CNTL_LINK_DISABLE | NTB_CNTL_CFG_LOCK; 2028 intel_ntb_reg_write(4, ntb->reg->ntb_ctl, cntl); 2029 return (0); 2030 } 2031 2032 static bool 2033 intel_ntb_link_enabled(device_t dev) 2034 { 2035 struct ntb_softc *ntb = device_get_softc(dev); 2036 uint32_t cntl; 2037 2038 if (ntb->type == NTB_ATOM) { 2039 cntl = 
pci_read_config(ntb->device, NTB_PPD_OFFSET, 4); 2040 return ((cntl & ATOM_PPD_INIT_LINK) != 0); 2041 } 2042 2043 if (ntb->conn_type == NTB_CONN_TRANSPARENT) 2044 return (true); 2045 2046 cntl = intel_ntb_reg_read(4, ntb->reg->ntb_ctl); 2047 return ((cntl & NTB_CNTL_LINK_DISABLE) == 0); 2048 } 2049 2050 static void 2051 recover_atom_link(void *arg) 2052 { 2053 struct ntb_softc *ntb = arg; 2054 unsigned speed, width, oldspeed, oldwidth; 2055 uint32_t status32; 2056 2057 atom_perform_link_restart(ntb); 2058 2059 /* 2060 * There is a potential race between the 2 NTB devices recovering at 2061 * the same time. If the times are the same, the link will not recover 2062 * and the driver will be stuck in this loop forever. Add a random 2063 * interval to the recovery time to prevent this race. 2064 */ 2065 status32 = arc4random() % ATOM_LINK_RECOVERY_TIME; 2066 pause("Link", (ATOM_LINK_RECOVERY_TIME + status32) * hz / 1000); 2067 2068 if (atom_link_is_err(ntb)) 2069 goto retry; 2070 2071 status32 = intel_ntb_reg_read(4, ntb->reg->ntb_ctl); 2072 if ((status32 & ATOM_CNTL_LINK_DOWN) != 0) 2073 goto out; 2074 2075 status32 = intel_ntb_reg_read(4, ntb->reg->lnk_sta); 2076 width = NTB_LNK_STA_WIDTH(status32); 2077 speed = status32 & NTB_LINK_SPEED_MASK; 2078 2079 oldwidth = NTB_LNK_STA_WIDTH(ntb->lnk_sta); 2080 oldspeed = ntb->lnk_sta & NTB_LINK_SPEED_MASK; 2081 if (oldwidth != width || oldspeed != speed) 2082 goto retry; 2083 2084 out: 2085 callout_reset(&ntb->heartbeat_timer, NTB_HB_TIMEOUT * hz, atom_link_hb, 2086 ntb); 2087 return; 2088 2089 retry: 2090 callout_reset(&ntb->lr_timer, NTB_HB_TIMEOUT * hz, recover_atom_link, 2091 ntb); 2092 } 2093 2094 /* 2095 * Polls the HW link status register(s); returns true if something has changed. 
2096 */ 2097 static bool 2098 intel_ntb_poll_link(struct ntb_softc *ntb) 2099 { 2100 uint32_t ntb_cntl; 2101 uint16_t reg_val; 2102 2103 if (ntb->type == NTB_ATOM) { 2104 ntb_cntl = intel_ntb_reg_read(4, ntb->reg->ntb_ctl); 2105 if (ntb_cntl == ntb->ntb_ctl) 2106 return (false); 2107 2108 ntb->ntb_ctl = ntb_cntl; 2109 ntb->lnk_sta = intel_ntb_reg_read(4, ntb->reg->lnk_sta); 2110 } else { 2111 db_iowrite_raw(ntb, ntb->self_reg->db_bell, ntb->db_link_mask); 2112 2113 reg_val = pci_read_config(ntb->device, ntb->reg->lnk_sta, 2); 2114 if (reg_val == ntb->lnk_sta) 2115 return (false); 2116 2117 ntb->lnk_sta = reg_val; 2118 2119 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 2120 if (_xeon_link_is_up(ntb)) { 2121 if (!ntb->peer_msix_good) { 2122 callout_reset(&ntb->peer_msix_work, 0, 2123 intel_ntb_exchange_msix, ntb); 2124 return (false); 2125 } 2126 } else { 2127 ntb->peer_msix_good = false; 2128 ntb->peer_msix_done = false; 2129 } 2130 } 2131 } 2132 return (true); 2133 } 2134 2135 static inline enum ntb_speed 2136 intel_ntb_link_sta_speed(struct ntb_softc *ntb) 2137 { 2138 2139 if (!link_is_up(ntb)) 2140 return (NTB_SPEED_NONE); 2141 return (ntb->lnk_sta & NTB_LINK_SPEED_MASK); 2142 } 2143 2144 static inline enum ntb_width 2145 intel_ntb_link_sta_width(struct ntb_softc *ntb) 2146 { 2147 2148 if (!link_is_up(ntb)) 2149 return (NTB_WIDTH_NONE); 2150 return (NTB_LNK_STA_WIDTH(ntb->lnk_sta)); 2151 } 2152 2153 SYSCTL_NODE(_hw_ntb, OID_AUTO, debug_info, CTLFLAG_RW, 0, 2154 "Driver state, statistics, and HW registers"); 2155 2156 #define NTB_REGSZ_MASK (3ul << 30) 2157 #define NTB_REG_64 (1ul << 30) 2158 #define NTB_REG_32 (2ul << 30) 2159 #define NTB_REG_16 (3ul << 30) 2160 #define NTB_REG_8 (0ul << 30) 2161 2162 #define NTB_DB_READ (1ul << 29) 2163 #define NTB_PCI_REG (1ul << 28) 2164 #define NTB_REGFLAGS_MASK (NTB_REGSZ_MASK | NTB_DB_READ | NTB_PCI_REG) 2165 2166 static void 2167 intel_ntb_sysctl_init(struct ntb_softc *ntb) 2168 { 2169 struct sysctl_oid_list *globals, 
*tree_par, *regpar, *statpar, *errpar; 2170 struct sysctl_ctx_list *ctx; 2171 struct sysctl_oid *tree, *tmptree; 2172 2173 ctx = device_get_sysctl_ctx(ntb->device); 2174 globals = SYSCTL_CHILDREN(device_get_sysctl_tree(ntb->device)); 2175 2176 SYSCTL_ADD_PROC(ctx, globals, OID_AUTO, "link_status", 2177 CTLFLAG_RD | CTLTYPE_STRING, ntb, 0, 2178 sysctl_handle_link_status_human, "A", 2179 "Link status (human readable)"); 2180 SYSCTL_ADD_PROC(ctx, globals, OID_AUTO, "active", 2181 CTLFLAG_RD | CTLTYPE_UINT, ntb, 0, sysctl_handle_link_status, 2182 "IU", "Link status (1=active, 0=inactive)"); 2183 SYSCTL_ADD_PROC(ctx, globals, OID_AUTO, "admin_up", 2184 CTLFLAG_RW | CTLTYPE_UINT, ntb, 0, sysctl_handle_link_admin, 2185 "IU", "Set/get interface status (1=UP, 0=DOWN)"); 2186 2187 tree = SYSCTL_ADD_NODE(ctx, globals, OID_AUTO, "debug_info", 2188 CTLFLAG_RD, NULL, "Driver state, statistics, and HW registers"); 2189 tree_par = SYSCTL_CHILDREN(tree); 2190 2191 SYSCTL_ADD_UINT(ctx, tree_par, OID_AUTO, "conn_type", CTLFLAG_RD, 2192 &ntb->conn_type, 0, "0 - Transparent; 1 - B2B; 2 - Root Port"); 2193 SYSCTL_ADD_UINT(ctx, tree_par, OID_AUTO, "dev_type", CTLFLAG_RD, 2194 &ntb->dev_type, 0, "0 - USD; 1 - DSD"); 2195 SYSCTL_ADD_UINT(ctx, tree_par, OID_AUTO, "ppd", CTLFLAG_RD, 2196 &ntb->ppd, 0, "Raw PPD register (cached)"); 2197 2198 if (ntb->b2b_mw_idx != B2B_MW_DISABLED) { 2199 SYSCTL_ADD_U8(ctx, tree_par, OID_AUTO, "b2b_idx", CTLFLAG_RD, 2200 &ntb->b2b_mw_idx, 0, 2201 "Index of the MW used for B2B remote register access"); 2202 SYSCTL_ADD_UQUAD(ctx, tree_par, OID_AUTO, "b2b_off", 2203 CTLFLAG_RD, &ntb->b2b_off, 2204 "If non-zero, offset of B2B register region in shared MW"); 2205 } 2206 2207 SYSCTL_ADD_PROC(ctx, tree_par, OID_AUTO, "features", 2208 CTLFLAG_RD | CTLTYPE_STRING, ntb, 0, sysctl_handle_features, "A", 2209 "Features/errata of this NTB device"); 2210 2211 SYSCTL_ADD_UINT(ctx, tree_par, OID_AUTO, "ntb_ctl", CTLFLAG_RD, 2212 __DEVOLATILE(uint32_t *, &ntb->ntb_ctl), 0, 2213 
"NTB CTL register (cached)"); 2214 SYSCTL_ADD_UINT(ctx, tree_par, OID_AUTO, "lnk_sta", CTLFLAG_RD, 2215 __DEVOLATILE(uint32_t *, &ntb->lnk_sta), 0, 2216 "LNK STA register (cached)"); 2217 2218 SYSCTL_ADD_U8(ctx, tree_par, OID_AUTO, "mw_count", CTLFLAG_RD, 2219 &ntb->mw_count, 0, "MW count"); 2220 SYSCTL_ADD_U8(ctx, tree_par, OID_AUTO, "spad_count", CTLFLAG_RD, 2221 &ntb->spad_count, 0, "Scratchpad count"); 2222 SYSCTL_ADD_U8(ctx, tree_par, OID_AUTO, "db_count", CTLFLAG_RD, 2223 &ntb->db_count, 0, "Doorbell count"); 2224 SYSCTL_ADD_U8(ctx, tree_par, OID_AUTO, "db_vec_count", CTLFLAG_RD, 2225 &ntb->db_vec_count, 0, "Doorbell vector count"); 2226 SYSCTL_ADD_U8(ctx, tree_par, OID_AUTO, "db_vec_shift", CTLFLAG_RD, 2227 &ntb->db_vec_shift, 0, "Doorbell vector shift"); 2228 2229 SYSCTL_ADD_UQUAD(ctx, tree_par, OID_AUTO, "db_valid_mask", CTLFLAG_RD, 2230 &ntb->db_valid_mask, "Doorbell valid mask"); 2231 SYSCTL_ADD_UQUAD(ctx, tree_par, OID_AUTO, "db_link_mask", CTLFLAG_RD, 2232 &ntb->db_link_mask, "Doorbell link mask"); 2233 SYSCTL_ADD_UQUAD(ctx, tree_par, OID_AUTO, "db_mask", CTLFLAG_RD, 2234 &ntb->db_mask, "Doorbell mask (cached)"); 2235 2236 tmptree = SYSCTL_ADD_NODE(ctx, tree_par, OID_AUTO, "registers", 2237 CTLFLAG_RD, NULL, "Raw HW registers (big-endian)"); 2238 regpar = SYSCTL_CHILDREN(tmptree); 2239 2240 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "ntbcntl", 2241 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, NTB_REG_32 | 2242 ntb->reg->ntb_ctl, sysctl_handle_register, "IU", 2243 "NTB Control register"); 2244 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "lnkcap", 2245 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, NTB_REG_32 | 2246 0x19c, sysctl_handle_register, "IU", 2247 "NTB Link Capabilities"); 2248 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "lnkcon", 2249 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, NTB_REG_32 | 2250 0x1a0, sysctl_handle_register, "IU", 2251 "NTB Link Control register"); 2252 2253 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "db_mask", 2254 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2255 NTB_REG_64 | 
NTB_DB_READ | ntb->self_reg->db_mask, 2256 sysctl_handle_register, "QU", "Doorbell mask register"); 2257 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "db_bell", 2258 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2259 NTB_REG_64 | NTB_DB_READ | ntb->self_reg->db_bell, 2260 sysctl_handle_register, "QU", "Doorbell register"); 2261 2262 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_xlat23", 2263 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2264 NTB_REG_64 | ntb->xlat_reg->bar2_xlat, 2265 sysctl_handle_register, "QU", "Incoming XLAT23 register"); 2266 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 2267 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_xlat4", 2268 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2269 NTB_REG_32 | ntb->xlat_reg->bar4_xlat, 2270 sysctl_handle_register, "IU", "Incoming XLAT4 register"); 2271 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_xlat5", 2272 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2273 NTB_REG_32 | ntb->xlat_reg->bar5_xlat, 2274 sysctl_handle_register, "IU", "Incoming XLAT5 register"); 2275 } else { 2276 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_xlat45", 2277 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2278 NTB_REG_64 | ntb->xlat_reg->bar4_xlat, 2279 sysctl_handle_register, "QU", "Incoming XLAT45 register"); 2280 } 2281 2282 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_lmt23", 2283 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2284 NTB_REG_64 | ntb->xlat_reg->bar2_limit, 2285 sysctl_handle_register, "QU", "Incoming LMT23 register"); 2286 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 2287 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_lmt4", 2288 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2289 NTB_REG_32 | ntb->xlat_reg->bar4_limit, 2290 sysctl_handle_register, "IU", "Incoming LMT4 register"); 2291 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_lmt5", 2292 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2293 NTB_REG_32 | ntb->xlat_reg->bar5_limit, 2294 sysctl_handle_register, "IU", "Incoming LMT5 register"); 2295 } else { 2296 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "incoming_lmt45", 2297 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 
2298 NTB_REG_64 | ntb->xlat_reg->bar4_limit, 2299 sysctl_handle_register, "QU", "Incoming LMT45 register"); 2300 } 2301 2302 if (ntb->type == NTB_ATOM) 2303 return; 2304 2305 tmptree = SYSCTL_ADD_NODE(ctx, regpar, OID_AUTO, "xeon_stats", 2306 CTLFLAG_RD, NULL, "Xeon HW statistics"); 2307 statpar = SYSCTL_CHILDREN(tmptree); 2308 SYSCTL_ADD_PROC(ctx, statpar, OID_AUTO, "upstream_mem_miss", 2309 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2310 NTB_REG_16 | XEON_USMEMMISS_OFFSET, 2311 sysctl_handle_register, "SU", "Upstream Memory Miss"); 2312 2313 tmptree = SYSCTL_ADD_NODE(ctx, regpar, OID_AUTO, "xeon_hw_err", 2314 CTLFLAG_RD, NULL, "Xeon HW errors"); 2315 errpar = SYSCTL_CHILDREN(tmptree); 2316 2317 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "ppd", 2318 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2319 NTB_REG_8 | NTB_PCI_REG | NTB_PPD_OFFSET, 2320 sysctl_handle_register, "CU", "PPD"); 2321 2322 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "pbar23_sz", 2323 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2324 NTB_REG_8 | NTB_PCI_REG | XEON_PBAR23SZ_OFFSET, 2325 sysctl_handle_register, "CU", "PBAR23 SZ (log2)"); 2326 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "pbar4_sz", 2327 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2328 NTB_REG_8 | NTB_PCI_REG | XEON_PBAR4SZ_OFFSET, 2329 sysctl_handle_register, "CU", "PBAR4 SZ (log2)"); 2330 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "pbar5_sz", 2331 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2332 NTB_REG_8 | NTB_PCI_REG | XEON_PBAR5SZ_OFFSET, 2333 sysctl_handle_register, "CU", "PBAR5 SZ (log2)"); 2334 2335 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar23_sz", 2336 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2337 NTB_REG_8 | NTB_PCI_REG | XEON_SBAR23SZ_OFFSET, 2338 sysctl_handle_register, "CU", "SBAR23 SZ (log2)"); 2339 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar4_sz", 2340 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2341 NTB_REG_8 | NTB_PCI_REG | XEON_SBAR4SZ_OFFSET, 2342 sysctl_handle_register, "CU", "SBAR4 SZ (log2)"); 2343 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar5_sz", 2344 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2345 
NTB_REG_8 | NTB_PCI_REG | XEON_SBAR5SZ_OFFSET, 2346 sysctl_handle_register, "CU", "SBAR5 SZ (log2)"); 2347 2348 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "devsts", 2349 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2350 NTB_REG_16 | NTB_PCI_REG | XEON_DEVSTS_OFFSET, 2351 sysctl_handle_register, "SU", "DEVSTS"); 2352 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "lnksts", 2353 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2354 NTB_REG_16 | NTB_PCI_REG | XEON_LINK_STATUS_OFFSET, 2355 sysctl_handle_register, "SU", "LNKSTS"); 2356 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "slnksts", 2357 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2358 NTB_REG_16 | NTB_PCI_REG | XEON_SLINK_STATUS_OFFSET, 2359 sysctl_handle_register, "SU", "SLNKSTS"); 2360 2361 SYSCTL_ADD_PROC(ctx, errpar, OID_AUTO, "uncerrsts", 2362 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2363 NTB_REG_32 | NTB_PCI_REG | XEON_UNCERRSTS_OFFSET, 2364 sysctl_handle_register, "IU", "UNCERRSTS"); 2365 SYSCTL_ADD_PROC(ctx, errpar, OID_AUTO, "corerrsts", 2366 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2367 NTB_REG_32 | NTB_PCI_REG | XEON_CORERRSTS_OFFSET, 2368 sysctl_handle_register, "IU", "CORERRSTS"); 2369 2370 if (ntb->conn_type != NTB_CONN_B2B) 2371 return; 2372 2373 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_xlat23", 2374 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2375 NTB_REG_64 | ntb->bar_info[NTB_B2B_BAR_1].pbarxlat_off, 2376 sysctl_handle_register, "QU", "Outgoing XLAT23 register"); 2377 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 2378 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_xlat4", 2379 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2380 NTB_REG_32 | ntb->bar_info[NTB_B2B_BAR_2].pbarxlat_off, 2381 sysctl_handle_register, "IU", "Outgoing XLAT4 register"); 2382 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_xlat5", 2383 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2384 NTB_REG_32 | ntb->bar_info[NTB_B2B_BAR_3].pbarxlat_off, 2385 sysctl_handle_register, "IU", "Outgoing XLAT5 register"); 2386 } else { 2387 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_xlat45", 2388 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 
2389 NTB_REG_64 | ntb->bar_info[NTB_B2B_BAR_2].pbarxlat_off, 2390 sysctl_handle_register, "QU", "Outgoing XLAT45 register"); 2391 } 2392 2393 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_lmt23", 2394 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2395 NTB_REG_64 | XEON_PBAR2LMT_OFFSET, 2396 sysctl_handle_register, "QU", "Outgoing LMT23 register"); 2397 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 2398 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_lmt4", 2399 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2400 NTB_REG_32 | XEON_PBAR4LMT_OFFSET, 2401 sysctl_handle_register, "IU", "Outgoing LMT4 register"); 2402 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_lmt5", 2403 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2404 NTB_REG_32 | XEON_PBAR5LMT_OFFSET, 2405 sysctl_handle_register, "IU", "Outgoing LMT5 register"); 2406 } else { 2407 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "outgoing_lmt45", 2408 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2409 NTB_REG_64 | XEON_PBAR4LMT_OFFSET, 2410 sysctl_handle_register, "QU", "Outgoing LMT45 register"); 2411 } 2412 2413 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar01_base", 2414 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2415 NTB_REG_64 | ntb->xlat_reg->bar0_base, 2416 sysctl_handle_register, "QU", "Secondary BAR01 base register"); 2417 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar23_base", 2418 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2419 NTB_REG_64 | ntb->xlat_reg->bar2_base, 2420 sysctl_handle_register, "QU", "Secondary BAR23 base register"); 2421 if (HAS_FEATURE(ntb, NTB_SPLIT_BAR)) { 2422 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar4_base", 2423 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2424 NTB_REG_32 | ntb->xlat_reg->bar4_base, 2425 sysctl_handle_register, "IU", 2426 "Secondary BAR4 base register"); 2427 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar5_base", 2428 CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2429 NTB_REG_32 | ntb->xlat_reg->bar5_base, 2430 sysctl_handle_register, "IU", 2431 "Secondary BAR5 base register"); 2432 } else { 2433 SYSCTL_ADD_PROC(ctx, regpar, OID_AUTO, "sbar45_base", 2434 
CTLFLAG_RD | CTLTYPE_OPAQUE, ntb, 2435 NTB_REG_64 | ntb->xlat_reg->bar4_base, 2436 sysctl_handle_register, "QU", 2437 "Secondary BAR45 base register"); 2438 } 2439 } 2440 2441 static int 2442 sysctl_handle_features(SYSCTL_HANDLER_ARGS) 2443 { 2444 struct ntb_softc *ntb = arg1; 2445 struct sbuf sb; 2446 int error; 2447 2448 sbuf_new_for_sysctl(&sb, NULL, 256, req); 2449 2450 sbuf_printf(&sb, "%b", ntb->features, NTB_FEATURES_STR); 2451 error = sbuf_finish(&sb); 2452 sbuf_delete(&sb); 2453 2454 if (error || !req->newptr) 2455 return (error); 2456 return (EINVAL); 2457 } 2458 2459 static int 2460 sysctl_handle_link_admin(SYSCTL_HANDLER_ARGS) 2461 { 2462 struct ntb_softc *ntb = arg1; 2463 unsigned old, new; 2464 int error; 2465 2466 old = intel_ntb_link_enabled(ntb->device); 2467 2468 error = SYSCTL_OUT(req, &old, sizeof(old)); 2469 if (error != 0 || req->newptr == NULL) 2470 return (error); 2471 2472 error = SYSCTL_IN(req, &new, sizeof(new)); 2473 if (error != 0) 2474 return (error); 2475 2476 intel_ntb_printf(0, "Admin set interface state to '%sabled'\n", 2477 (new != 0)? 
"en" : "dis"); 2478 2479 if (new != 0) 2480 error = intel_ntb_link_enable(ntb->device, NTB_SPEED_AUTO, NTB_WIDTH_AUTO); 2481 else 2482 error = intel_ntb_link_disable(ntb->device); 2483 return (error); 2484 } 2485 2486 static int 2487 sysctl_handle_link_status_human(SYSCTL_HANDLER_ARGS) 2488 { 2489 struct ntb_softc *ntb = arg1; 2490 struct sbuf sb; 2491 enum ntb_speed speed; 2492 enum ntb_width width; 2493 int error; 2494 2495 sbuf_new_for_sysctl(&sb, NULL, 32, req); 2496 2497 if (intel_ntb_link_is_up(ntb->device, &speed, &width)) 2498 sbuf_printf(&sb, "up / PCIe Gen %u / Width x%u", 2499 (unsigned)speed, (unsigned)width); 2500 else 2501 sbuf_printf(&sb, "down"); 2502 2503 error = sbuf_finish(&sb); 2504 sbuf_delete(&sb); 2505 2506 if (error || !req->newptr) 2507 return (error); 2508 return (EINVAL); 2509 } 2510 2511 static int 2512 sysctl_handle_link_status(SYSCTL_HANDLER_ARGS) 2513 { 2514 struct ntb_softc *ntb = arg1; 2515 unsigned res; 2516 int error; 2517 2518 res = intel_ntb_link_is_up(ntb->device, NULL, NULL); 2519 2520 error = SYSCTL_OUT(req, &res, sizeof(res)); 2521 if (error || !req->newptr) 2522 return (error); 2523 return (EINVAL); 2524 } 2525 2526 static int 2527 sysctl_handle_register(SYSCTL_HANDLER_ARGS) 2528 { 2529 struct ntb_softc *ntb; 2530 const void *outp; 2531 uintptr_t sz; 2532 uint64_t umv; 2533 char be[sizeof(umv)]; 2534 size_t outsz; 2535 uint32_t reg; 2536 bool db, pci; 2537 int error; 2538 2539 ntb = arg1; 2540 reg = arg2 & ~NTB_REGFLAGS_MASK; 2541 sz = arg2 & NTB_REGSZ_MASK; 2542 db = (arg2 & NTB_DB_READ) != 0; 2543 pci = (arg2 & NTB_PCI_REG) != 0; 2544 2545 KASSERT(!(db && pci), ("bogus")); 2546 2547 if (db) { 2548 KASSERT(sz == NTB_REG_64, ("bogus")); 2549 umv = db_ioread(ntb, reg); 2550 outsz = sizeof(uint64_t); 2551 } else { 2552 switch (sz) { 2553 case NTB_REG_64: 2554 if (pci) 2555 umv = pci_read_config(ntb->device, reg, 8); 2556 else 2557 umv = intel_ntb_reg_read(8, reg); 2558 outsz = sizeof(uint64_t); 2559 break; 2560 case 
NTB_REG_32: 2561 if (pci) 2562 umv = pci_read_config(ntb->device, reg, 4); 2563 else 2564 umv = intel_ntb_reg_read(4, reg); 2565 outsz = sizeof(uint32_t); 2566 break; 2567 case NTB_REG_16: 2568 if (pci) 2569 umv = pci_read_config(ntb->device, reg, 2); 2570 else 2571 umv = intel_ntb_reg_read(2, reg); 2572 outsz = sizeof(uint16_t); 2573 break; 2574 case NTB_REG_8: 2575 if (pci) 2576 umv = pci_read_config(ntb->device, reg, 1); 2577 else 2578 umv = intel_ntb_reg_read(1, reg); 2579 outsz = sizeof(uint8_t); 2580 break; 2581 default: 2582 panic("bogus"); 2583 break; 2584 } 2585 } 2586 2587 /* Encode bigendian so that sysctl -x is legible. */ 2588 be64enc(be, umv); 2589 outp = ((char *)be) + sizeof(umv) - outsz; 2590 2591 error = SYSCTL_OUT(req, outp, outsz); 2592 if (error || !req->newptr) 2593 return (error); 2594 return (EINVAL); 2595 } 2596 2597 static unsigned 2598 intel_ntb_user_mw_to_idx(struct ntb_softc *ntb, unsigned uidx) 2599 { 2600 2601 if ((ntb->b2b_mw_idx != B2B_MW_DISABLED && ntb->b2b_off == 0 && 2602 uidx >= ntb->b2b_mw_idx) || 2603 (ntb->msix_mw_idx != B2B_MW_DISABLED && uidx >= ntb->msix_mw_idx)) 2604 uidx++; 2605 if ((ntb->b2b_mw_idx != B2B_MW_DISABLED && ntb->b2b_off == 0 && 2606 uidx >= ntb->b2b_mw_idx) && 2607 (ntb->msix_mw_idx != B2B_MW_DISABLED && uidx >= ntb->msix_mw_idx)) 2608 uidx++; 2609 return (uidx); 2610 } 2611 2612 #ifndef EARLY_AP_STARTUP 2613 static int msix_ready; 2614 2615 static void 2616 intel_ntb_msix_ready(void *arg __unused) 2617 { 2618 2619 msix_ready = 1; 2620 } 2621 SYSINIT(intel_ntb_msix_ready, SI_SUB_SMP, SI_ORDER_ANY, 2622 intel_ntb_msix_ready, NULL); 2623 #endif 2624 2625 static void 2626 intel_ntb_exchange_msix(void *ctx) 2627 { 2628 struct ntb_softc *ntb; 2629 uint32_t val; 2630 unsigned i; 2631 2632 ntb = ctx; 2633 2634 if (ntb->peer_msix_good) 2635 goto msix_good; 2636 if (ntb->peer_msix_done) 2637 goto msix_done; 2638 2639 #ifndef EARLY_AP_STARTUP 2640 /* Block MSIX negotiation until SMP started and IRQ reshuffled. 
*/ 2641 if (!msix_ready) 2642 goto reschedule; 2643 #endif 2644 2645 intel_ntb_get_msix_info(ntb); 2646 for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) { 2647 intel_ntb_peer_spad_write(ntb->device, NTB_MSIX_DATA0 + i, 2648 ntb->msix_data[i].nmd_data); 2649 intel_ntb_peer_spad_write(ntb->device, NTB_MSIX_OFS0 + i, 2650 ntb->msix_data[i].nmd_ofs - ntb->msix_xlat); 2651 } 2652 intel_ntb_peer_spad_write(ntb->device, NTB_MSIX_GUARD, NTB_MSIX_VER_GUARD); 2653 2654 intel_ntb_spad_read(ntb->device, NTB_MSIX_GUARD, &val); 2655 if (val != NTB_MSIX_VER_GUARD) 2656 goto reschedule; 2657 2658 for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) { 2659 intel_ntb_spad_read(ntb->device, NTB_MSIX_DATA0 + i, &val); 2660 intel_ntb_printf(2, "remote MSIX data(%u): 0x%x\n", i, val); 2661 ntb->peer_msix_data[i].nmd_data = val; 2662 intel_ntb_spad_read(ntb->device, NTB_MSIX_OFS0 + i, &val); 2663 intel_ntb_printf(2, "remote MSIX addr(%u): 0x%x\n", i, val); 2664 ntb->peer_msix_data[i].nmd_ofs = val; 2665 } 2666 2667 ntb->peer_msix_done = true; 2668 2669 msix_done: 2670 intel_ntb_peer_spad_write(ntb->device, NTB_MSIX_DONE, NTB_MSIX_RECEIVED); 2671 intel_ntb_spad_read(ntb->device, NTB_MSIX_DONE, &val); 2672 if (val != NTB_MSIX_RECEIVED) 2673 goto reschedule; 2674 2675 intel_ntb_spad_clear(ntb->device); 2676 ntb->peer_msix_good = true; 2677 /* Give peer time to see our NTB_MSIX_RECEIVED. */ 2678 goto reschedule; 2679 2680 msix_good: 2681 intel_ntb_poll_link(ntb); 2682 ntb_link_event(ntb->device); 2683 return; 2684 2685 reschedule: 2686 ntb->lnk_sta = pci_read_config(ntb->device, ntb->reg->lnk_sta, 2); 2687 if (_xeon_link_is_up(ntb)) { 2688 callout_reset(&ntb->peer_msix_work, 2689 hz * (ntb->peer_msix_good ? 
2 : 1) / 10, 2690 intel_ntb_exchange_msix, ntb); 2691 } else 2692 intel_ntb_spad_clear(ntb->device); 2693 } 2694 2695 /* 2696 * Public API to the rest of the OS 2697 */ 2698 2699 static uint8_t 2700 intel_ntb_spad_count(device_t dev) 2701 { 2702 struct ntb_softc *ntb = device_get_softc(dev); 2703 2704 return (ntb->spad_count); 2705 } 2706 2707 static uint8_t 2708 intel_ntb_mw_count(device_t dev) 2709 { 2710 struct ntb_softc *ntb = device_get_softc(dev); 2711 uint8_t res; 2712 2713 res = ntb->mw_count; 2714 if (ntb->b2b_mw_idx != B2B_MW_DISABLED && ntb->b2b_off == 0) 2715 res--; 2716 if (ntb->msix_mw_idx != B2B_MW_DISABLED) 2717 res--; 2718 return (res); 2719 } 2720 2721 static int 2722 intel_ntb_spad_write(device_t dev, unsigned int idx, uint32_t val) 2723 { 2724 struct ntb_softc *ntb = device_get_softc(dev); 2725 2726 if (idx >= ntb->spad_count) 2727 return (EINVAL); 2728 2729 intel_ntb_reg_write(4, ntb->self_reg->spad + idx * 4, val); 2730 2731 return (0); 2732 } 2733 2734 /* 2735 * Zeros the local scratchpad. 
2736 */ 2737 static void 2738 intel_ntb_spad_clear(device_t dev) 2739 { 2740 struct ntb_softc *ntb = device_get_softc(dev); 2741 unsigned i; 2742 2743 for (i = 0; i < ntb->spad_count; i++) 2744 intel_ntb_spad_write(dev, i, 0); 2745 } 2746 2747 static int 2748 intel_ntb_spad_read(device_t dev, unsigned int idx, uint32_t *val) 2749 { 2750 struct ntb_softc *ntb = device_get_softc(dev); 2751 2752 if (idx >= ntb->spad_count) 2753 return (EINVAL); 2754 2755 *val = intel_ntb_reg_read(4, ntb->self_reg->spad + idx * 4); 2756 2757 return (0); 2758 } 2759 2760 static int 2761 intel_ntb_peer_spad_write(device_t dev, unsigned int idx, uint32_t val) 2762 { 2763 struct ntb_softc *ntb = device_get_softc(dev); 2764 2765 if (idx >= ntb->spad_count) 2766 return (EINVAL); 2767 2768 if (HAS_FEATURE(ntb, NTB_SDOORBELL_LOCKUP)) 2769 intel_ntb_mw_write(4, XEON_SPAD_OFFSET + idx * 4, val); 2770 else 2771 intel_ntb_reg_write(4, ntb->peer_reg->spad + idx * 4, val); 2772 2773 return (0); 2774 } 2775 2776 static int 2777 intel_ntb_peer_spad_read(device_t dev, unsigned int idx, uint32_t *val) 2778 { 2779 struct ntb_softc *ntb = device_get_softc(dev); 2780 2781 if (idx >= ntb->spad_count) 2782 return (EINVAL); 2783 2784 if (HAS_FEATURE(ntb, NTB_SDOORBELL_LOCKUP)) 2785 *val = intel_ntb_mw_read(4, XEON_SPAD_OFFSET + idx * 4); 2786 else 2787 *val = intel_ntb_reg_read(4, ntb->peer_reg->spad + idx * 4); 2788 2789 return (0); 2790 } 2791 2792 static int 2793 intel_ntb_mw_get_range(device_t dev, unsigned mw_idx, vm_paddr_t *base, 2794 caddr_t *vbase, size_t *size, size_t *align, size_t *align_size, 2795 bus_addr_t *plimit) 2796 { 2797 struct ntb_softc *ntb = device_get_softc(dev); 2798 struct ntb_pci_bar_info *bar; 2799 bus_addr_t limit; 2800 size_t bar_b2b_off; 2801 enum ntb_bar bar_num; 2802 2803 if (mw_idx >= intel_ntb_mw_count(dev)) 2804 return (EINVAL); 2805 mw_idx = intel_ntb_user_mw_to_idx(ntb, mw_idx); 2806 2807 bar_num = intel_ntb_mw_to_bar(ntb, mw_idx); 2808 bar = &ntb->bar_info[bar_num]; 
2809 bar_b2b_off = 0; 2810 if (mw_idx == ntb->b2b_mw_idx) { 2811 KASSERT(ntb->b2b_off != 0, 2812 ("user shouldn't get non-shared b2b mw")); 2813 bar_b2b_off = ntb->b2b_off; 2814 } 2815 2816 if (bar_is_64bit(ntb, bar_num)) 2817 limit = BUS_SPACE_MAXADDR; 2818 else 2819 limit = BUS_SPACE_MAXADDR_32BIT; 2820 2821 if (base != NULL) 2822 *base = bar->pbase + bar_b2b_off; 2823 if (vbase != NULL) 2824 *vbase = bar->vbase + bar_b2b_off; 2825 if (size != NULL) 2826 *size = bar->size - bar_b2b_off; 2827 if (align != NULL) 2828 *align = bar->size; 2829 if (align_size != NULL) 2830 *align_size = 1; 2831 if (plimit != NULL) 2832 *plimit = limit; 2833 return (0); 2834 } 2835 2836 static int 2837 intel_ntb_mw_set_trans(device_t dev, unsigned idx, bus_addr_t addr, size_t size) 2838 { 2839 struct ntb_softc *ntb = device_get_softc(dev); 2840 struct ntb_pci_bar_info *bar; 2841 uint64_t base, limit, reg_val; 2842 size_t bar_size, mw_size; 2843 uint32_t base_reg, xlat_reg, limit_reg; 2844 enum ntb_bar bar_num; 2845 2846 if (idx >= intel_ntb_mw_count(dev)) 2847 return (EINVAL); 2848 idx = intel_ntb_user_mw_to_idx(ntb, idx); 2849 2850 bar_num = intel_ntb_mw_to_bar(ntb, idx); 2851 bar = &ntb->bar_info[bar_num]; 2852 2853 bar_size = bar->size; 2854 if (idx == ntb->b2b_mw_idx) 2855 mw_size = bar_size - ntb->b2b_off; 2856 else 2857 mw_size = bar_size; 2858 2859 /* Hardware requires that addr is aligned to bar size */ 2860 if ((addr & (bar_size - 1)) != 0) 2861 return (EINVAL); 2862 2863 if (size > mw_size) 2864 return (EINVAL); 2865 2866 bar_get_xlat_params(ntb, bar_num, &base_reg, &xlat_reg, &limit_reg); 2867 2868 limit = 0; 2869 if (bar_is_64bit(ntb, bar_num)) { 2870 base = intel_ntb_reg_read(8, base_reg) & BAR_HIGH_MASK; 2871 2872 if (limit_reg != 0 && size != mw_size) 2873 limit = base + size; 2874 2875 /* Set and verify translation address */ 2876 intel_ntb_reg_write(8, xlat_reg, addr); 2877 reg_val = intel_ntb_reg_read(8, xlat_reg) & BAR_HIGH_MASK; 2878 if (reg_val != addr) { 2879 
intel_ntb_reg_write(8, xlat_reg, 0); 2880 return (EIO); 2881 } 2882 2883 /* Set and verify the limit */ 2884 intel_ntb_reg_write(8, limit_reg, limit); 2885 reg_val = intel_ntb_reg_read(8, limit_reg) & BAR_HIGH_MASK; 2886 if (reg_val != limit) { 2887 intel_ntb_reg_write(8, limit_reg, base); 2888 intel_ntb_reg_write(8, xlat_reg, 0); 2889 return (EIO); 2890 } 2891 } else { 2892 /* Configure 32-bit (split) BAR MW */ 2893 2894 if ((addr & UINT32_MAX) != addr) 2895 return (ERANGE); 2896 if (((addr + size) & UINT32_MAX) != (addr + size)) 2897 return (ERANGE); 2898 2899 base = intel_ntb_reg_read(4, base_reg) & BAR_HIGH_MASK; 2900 2901 if (limit_reg != 0 && size != mw_size) 2902 limit = base + size; 2903 2904 /* Set and verify translation address */ 2905 intel_ntb_reg_write(4, xlat_reg, addr); 2906 reg_val = intel_ntb_reg_read(4, xlat_reg) & BAR_HIGH_MASK; 2907 if (reg_val != addr) { 2908 intel_ntb_reg_write(4, xlat_reg, 0); 2909 return (EIO); 2910 } 2911 2912 /* Set and verify the limit */ 2913 intel_ntb_reg_write(4, limit_reg, limit); 2914 reg_val = intel_ntb_reg_read(4, limit_reg) & BAR_HIGH_MASK; 2915 if (reg_val != limit) { 2916 intel_ntb_reg_write(4, limit_reg, base); 2917 intel_ntb_reg_write(4, xlat_reg, 0); 2918 return (EIO); 2919 } 2920 } 2921 return (0); 2922 } 2923 2924 static int 2925 intel_ntb_mw_clear_trans(device_t dev, unsigned mw_idx) 2926 { 2927 2928 return (intel_ntb_mw_set_trans(dev, mw_idx, 0, 0)); 2929 } 2930 2931 static int 2932 intel_ntb_mw_get_wc(device_t dev, unsigned idx, vm_memattr_t *mode) 2933 { 2934 struct ntb_softc *ntb = device_get_softc(dev); 2935 struct ntb_pci_bar_info *bar; 2936 2937 if (idx >= intel_ntb_mw_count(dev)) 2938 return (EINVAL); 2939 idx = intel_ntb_user_mw_to_idx(ntb, idx); 2940 2941 bar = &ntb->bar_info[intel_ntb_mw_to_bar(ntb, idx)]; 2942 *mode = bar->map_mode; 2943 return (0); 2944 } 2945 2946 static int 2947 intel_ntb_mw_set_wc(device_t dev, unsigned idx, vm_memattr_t mode) 2948 { 2949 struct ntb_softc *ntb = 
device_get_softc(dev); 2950 2951 if (idx >= intel_ntb_mw_count(dev)) 2952 return (EINVAL); 2953 2954 idx = intel_ntb_user_mw_to_idx(ntb, idx); 2955 return (intel_ntb_mw_set_wc_internal(ntb, idx, mode)); 2956 } 2957 2958 static int 2959 intel_ntb_mw_set_wc_internal(struct ntb_softc *ntb, unsigned idx, vm_memattr_t mode) 2960 { 2961 struct ntb_pci_bar_info *bar; 2962 int rc; 2963 2964 bar = &ntb->bar_info[intel_ntb_mw_to_bar(ntb, idx)]; 2965 if (bar->map_mode == mode) 2966 return (0); 2967 2968 rc = pmap_change_attr((vm_offset_t)bar->vbase, bar->size, mode); 2969 if (rc == 0) 2970 bar->map_mode = mode; 2971 2972 return (rc); 2973 } 2974 2975 static void 2976 intel_ntb_peer_db_set(device_t dev, uint64_t bit) 2977 { 2978 struct ntb_softc *ntb = device_get_softc(dev); 2979 2980 if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { 2981 struct ntb_pci_bar_info *lapic; 2982 unsigned i; 2983 2984 lapic = ntb->peer_lapic_bar; 2985 2986 for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) { 2987 if ((bit & intel_ntb_db_vector_mask(dev, i)) != 0) 2988 bus_space_write_4(lapic->pci_bus_tag, 2989 lapic->pci_bus_handle, 2990 ntb->peer_msix_data[i].nmd_ofs, 2991 ntb->peer_msix_data[i].nmd_data); 2992 } 2993 return; 2994 } 2995 2996 if (HAS_FEATURE(ntb, NTB_SDOORBELL_LOCKUP)) { 2997 intel_ntb_mw_write(2, XEON_PDOORBELL_OFFSET, bit); 2998 return; 2999 } 3000 3001 db_iowrite(ntb, ntb->peer_reg->db_bell, bit); 3002 } 3003 3004 static int 3005 intel_ntb_peer_db_addr(device_t dev, bus_addr_t *db_addr, vm_size_t *db_size) 3006 { 3007 struct ntb_softc *ntb = device_get_softc(dev); 3008 struct ntb_pci_bar_info *bar; 3009 uint64_t regoff; 3010 3011 KASSERT((db_addr != NULL && db_size != NULL), ("must be non-NULL")); 3012 3013 if (!HAS_FEATURE(ntb, NTB_SDOORBELL_LOCKUP)) { 3014 bar = &ntb->bar_info[NTB_CONFIG_BAR]; 3015 regoff = ntb->peer_reg->db_bell; 3016 } else { 3017 KASSERT(ntb->b2b_mw_idx != B2B_MW_DISABLED, 3018 ("invalid b2b idx")); 3019 3020 bar = &ntb->bar_info[intel_ntb_mw_to_bar(ntb, 
ntb->b2b_mw_idx)]; 3021 regoff = XEON_PDOORBELL_OFFSET; 3022 } 3023 KASSERT(bar->pci_bus_tag != X86_BUS_SPACE_IO, ("uh oh")); 3024 3025 /* HACK: Specific to current x86 bus implementation. */ 3026 *db_addr = ((uint64_t)bar->pci_bus_handle + regoff); 3027 *db_size = ntb->reg->db_size; 3028 return (0); 3029 } 3030 3031 static uint64_t 3032 intel_ntb_db_valid_mask(device_t dev) 3033 { 3034 struct ntb_softc *ntb = device_get_softc(dev); 3035 3036 return (ntb->db_valid_mask); 3037 } 3038 3039 static int 3040 intel_ntb_db_vector_count(device_t dev) 3041 { 3042 struct ntb_softc *ntb = device_get_softc(dev); 3043 3044 return (ntb->db_vec_count); 3045 } 3046 3047 static uint64_t 3048 intel_ntb_db_vector_mask(device_t dev, uint32_t vector) 3049 { 3050 struct ntb_softc *ntb = device_get_softc(dev); 3051 3052 if (vector > ntb->db_vec_count) 3053 return (0); 3054 return (ntb->db_valid_mask & intel_ntb_vec_mask(ntb, vector)); 3055 } 3056 3057 static bool 3058 intel_ntb_link_is_up(device_t dev, enum ntb_speed *speed, enum ntb_width *width) 3059 { 3060 struct ntb_softc *ntb = device_get_softc(dev); 3061 3062 if (speed != NULL) 3063 *speed = intel_ntb_link_sta_speed(ntb); 3064 if (width != NULL) 3065 *width = intel_ntb_link_sta_width(ntb); 3066 return (link_is_up(ntb)); 3067 } 3068 3069 static void 3070 save_bar_parameters(struct ntb_pci_bar_info *bar) 3071 { 3072 3073 bar->pci_bus_tag = rman_get_bustag(bar->pci_resource); 3074 bar->pci_bus_handle = rman_get_bushandle(bar->pci_resource); 3075 bar->pbase = rman_get_start(bar->pci_resource); 3076 bar->size = rman_get_size(bar->pci_resource); 3077 bar->vbase = rman_get_virtual(bar->pci_resource); 3078 } 3079 3080 static device_method_t ntb_intel_methods[] = { 3081 /* Device interface */ 3082 DEVMETHOD(device_probe, intel_ntb_probe), 3083 DEVMETHOD(device_attach, intel_ntb_attach), 3084 DEVMETHOD(device_detach, intel_ntb_detach), 3085 /* Bus interface */ 3086 DEVMETHOD(bus_child_location_str, ntb_child_location_str), 3087 
DEVMETHOD(bus_print_child, ntb_print_child), 3088 /* NTB interface */ 3089 DEVMETHOD(ntb_link_is_up, intel_ntb_link_is_up), 3090 DEVMETHOD(ntb_link_enable, intel_ntb_link_enable), 3091 DEVMETHOD(ntb_link_disable, intel_ntb_link_disable), 3092 DEVMETHOD(ntb_link_enabled, intel_ntb_link_enabled), 3093 DEVMETHOD(ntb_mw_count, intel_ntb_mw_count), 3094 DEVMETHOD(ntb_mw_get_range, intel_ntb_mw_get_range), 3095 DEVMETHOD(ntb_mw_set_trans, intel_ntb_mw_set_trans), 3096 DEVMETHOD(ntb_mw_clear_trans, intel_ntb_mw_clear_trans), 3097 DEVMETHOD(ntb_mw_get_wc, intel_ntb_mw_get_wc), 3098 DEVMETHOD(ntb_mw_set_wc, intel_ntb_mw_set_wc), 3099 DEVMETHOD(ntb_spad_count, intel_ntb_spad_count), 3100 DEVMETHOD(ntb_spad_clear, intel_ntb_spad_clear), 3101 DEVMETHOD(ntb_spad_write, intel_ntb_spad_write), 3102 DEVMETHOD(ntb_spad_read, intel_ntb_spad_read), 3103 DEVMETHOD(ntb_peer_spad_write, intel_ntb_peer_spad_write), 3104 DEVMETHOD(ntb_peer_spad_read, intel_ntb_peer_spad_read), 3105 DEVMETHOD(ntb_db_valid_mask, intel_ntb_db_valid_mask), 3106 DEVMETHOD(ntb_db_vector_count, intel_ntb_db_vector_count), 3107 DEVMETHOD(ntb_db_vector_mask, intel_ntb_db_vector_mask), 3108 DEVMETHOD(ntb_db_clear, intel_ntb_db_clear), 3109 DEVMETHOD(ntb_db_clear_mask, intel_ntb_db_clear_mask), 3110 DEVMETHOD(ntb_db_read, intel_ntb_db_read), 3111 DEVMETHOD(ntb_db_set_mask, intel_ntb_db_set_mask), 3112 DEVMETHOD(ntb_peer_db_addr, intel_ntb_peer_db_addr), 3113 DEVMETHOD(ntb_peer_db_set, intel_ntb_peer_db_set), 3114 DEVMETHOD_END 3115 }; 3116 3117 static DEFINE_CLASS_0(ntb_hw, ntb_intel_driver, ntb_intel_methods, 3118 sizeof(struct ntb_softc)); 3119 DRIVER_MODULE(ntb_hw_intel, pci, ntb_intel_driver, ntb_hw_devclass, NULL, NULL); 3120 MODULE_DEPEND(ntb_hw_intel, ntb, 1, 1, 1); 3121 MODULE_VERSION(ntb_hw_intel, 1); 3122 MODULE_PNP_INFO("W32:vendor/device;D:#", pci, ntb_hw_intel, pci_ids, 3123 sizeof(pci_ids[0]), nitems(pci_ids)); 3124