1 /* 2 * IBM Power Virtual Ethernet Device Driver 3 * 4 * This program is free software; you can redistribute it and/or modify 5 * it under the terms of the GNU General Public License as published by 6 * the Free Software Foundation; either version 2 of the License, or 7 * (at your option) any later version. 8 * 9 * This program is distributed in the hope that it will be useful, 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of 11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 12 * GNU General Public License for more details. 13 * 14 * You should have received a copy of the GNU General Public License 15 * along with this program; if not, see <http://www.gnu.org/licenses/>. 16 * 17 * Copyright (C) IBM Corporation, 2003, 2010 18 * 19 * Authors: Dave Larson <larson1@us.ibm.com> 20 * Santiago Leon <santil@linux.vnet.ibm.com> 21 * Brian King <brking@linux.vnet.ibm.com> 22 * Robert Jennings <rcj@linux.vnet.ibm.com> 23 * Anton Blanchard <anton@au.ibm.com> 24 */ 25 26 #include <linux/module.h> 27 #include <linux/moduleparam.h> 28 #include <linux/types.h> 29 #include <linux/errno.h> 30 #include <linux/dma-mapping.h> 31 #include <linux/kernel.h> 32 #include <linux/netdevice.h> 33 #include <linux/etherdevice.h> 34 #include <linux/skbuff.h> 35 #include <linux/init.h> 36 #include <linux/interrupt.h> 37 #include <linux/mm.h> 38 #include <linux/pm.h> 39 #include <linux/ethtool.h> 40 #include <linux/in.h> 41 #include <linux/ip.h> 42 #include <linux/ipv6.h> 43 #include <linux/slab.h> 44 #include <asm/hvcall.h> 45 #include <linux/atomic.h> 46 #include <asm/vio.h> 47 #include <asm/iommu.h> 48 #include <asm/firmware.h> 49 50 #include "ibmveth.h" 51 52 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance); 53 static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter); 54 static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev); 55 56 static struct kobj_type ktype_veth_pool; 57 58 59 static const char ibmveth_driver_name[] = "ibmveth"; 60 static const char ibmveth_driver_string[] = "IBM Power Virtual Ethernet Driver"; 61 #define ibmveth_driver_version "1.06" 62 63 MODULE_AUTHOR("Santiago Leon <santil@linux.vnet.ibm.com>"); 64 MODULE_DESCRIPTION("IBM Power Virtual Ethernet Driver"); 65 MODULE_LICENSE("GPL"); 66 MODULE_VERSION(ibmveth_driver_version); 67 68 static unsigned int tx_copybreak __read_mostly = 128; 69 module_param(tx_copybreak, uint, 0644); 70 MODULE_PARM_DESC(tx_copybreak, 71 "Maximum size of packet that is copied to a new buffer on transmit"); 72 73 static unsigned int rx_copybreak __read_mostly = 128; 74 module_param(rx_copybreak, uint, 0644); 75 MODULE_PARM_DESC(rx_copybreak, 76 "Maximum size of packet that is copied to a new buffer on receive"); 77 78 static unsigned int rx_flush __read_mostly = 0; 79 module_param(rx_flush, uint, 0644); 80 MODULE_PARM_DESC(rx_flush, "Flush receive buffers before use"); 81 82 static bool old_large_send __read_mostly; 83 module_param(old_large_send, bool, S_IRUGO); 84 MODULE_PARM_DESC(old_large_send, 85 "Use old large send method on firmware that supports the new method"); 86 87 struct ibmveth_stat { 88 char name[ETH_GSTRING_LEN]; 89 int offset; 90 }; 91 92 #define IBMVETH_STAT_OFF(stat) offsetof(struct ibmveth_adapter, stat) 93 #define IBMVETH_GET_STAT(a, off) *((u64 *)(((unsigned long)(a)) + off)) 94 95 struct ibmveth_stat ibmveth_stats[] = { 96 { "replenish_task_cycles", IBMVETH_STAT_OFF(replenish_task_cycles) }, 97 { "replenish_no_mem", IBMVETH_STAT_OFF(replenish_no_mem) }, 98 { "replenish_add_buff_failure", 99 IBMVETH_STAT_OFF(replenish_add_buff_failure) }, 100 { "replenish_add_buff_success", 101 IBMVETH_STAT_OFF(replenish_add_buff_success) }, 102 { "rx_invalid_buffer", IBMVETH_STAT_OFF(rx_invalid_buffer) }, 103 { "rx_no_buffer", IBMVETH_STAT_OFF(rx_no_buffer) }, 104 { "tx_map_failed", IBMVETH_STAT_OFF(tx_map_failed) }, 105 { "tx_send_failed", IBMVETH_STAT_OFF(tx_send_failed) }, 106 { "fw_enabled_ipv4_csum", IBMVETH_STAT_OFF(fw_ipv4_csum_support) }, 107 { "fw_enabled_ipv6_csum", IBMVETH_STAT_OFF(fw_ipv6_csum_support) }, 108 { "tx_large_packets", IBMVETH_STAT_OFF(tx_large_packets) }, 109 { "rx_large_packets", IBMVETH_STAT_OFF(rx_large_packets) }, 110 { "fw_enabled_large_send", IBMVETH_STAT_OFF(fw_large_send_support) } 111 }; 112 113 /* simple methods of getting data from the current rxq entry */ 114 static inline u32 ibmveth_rxq_flags(struct ibmveth_adapter *adapter) 115 { 116 return be32_to_cpu(adapter->rx_queue.queue_addr[adapter->rx_queue.index].flags_off); 117 } 118 119 static inline int ibmveth_rxq_toggle(struct ibmveth_adapter *adapter) 120 { 121 return (ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_TOGGLE) >> 122 IBMVETH_RXQ_TOGGLE_SHIFT; 123 } 124 125 static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter) 126 { 127 return ibmveth_rxq_toggle(adapter) == adapter->rx_queue.toggle; 128 } 129 130 static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter) 131 { 132 return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_VALID; 133 } 134 135 static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter) 136 { 137 return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_OFF_MASK; 138 } 139 140 static inline int ibmveth_rxq_large_packet(struct ibmveth_adapter *adapter) 141 { 142 return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_LRG_PKT; 143 } 144 145 static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter) 146 { 147 return be32_to_cpu(adapter->rx_queue.queue_addr[adapter->rx_queue.index].length); 148 } 149 150 static inline int ibmveth_rxq_csum_good(struct ibmveth_adapter *adapter) 151 { 152 return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_CSUM_GOOD; 153 } 154 155 /* setup the initial settings for a buffer pool */ 156 static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool, 157 u32 pool_index, u32 pool_size, 158 u32 buff_size, u32 pool_active) 159 { 160 pool->size = pool_size; 161 pool->index = pool_index; 162 pool->buff_size = buff_size; 163 pool->threshold = pool_size * 7 / 8; 164 pool->active = pool_active; 165 } 166 167 /* allocate and setup an buffer pool - called during open */ 168 static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool) 169 { 170 int i; 171 172 pool->free_map = kmalloc(sizeof(u16) * pool->size, GFP_KERNEL); 173 174 if (!pool->free_map) 175 return -1; 176 177 pool->dma_addr = kcalloc(pool->size, sizeof(dma_addr_t), GFP_KERNEL); 178 if (!pool->dma_addr) { 179 kfree(pool->free_map); 180 pool->free_map = NULL; 181 return -1; 182 } 183 184 pool->skbuff = kcalloc(pool->size, sizeof(void *), GFP_KERNEL); 185 186 if (!pool->skbuff) { 187 kfree(pool->dma_addr); 188 pool->dma_addr = NULL; 189 190 kfree(pool->free_map); 191 pool->free_map = NULL; 192 return -1; 193 } 194 195 for (i = 0; i < pool->size; ++i) 196 pool->free_map[i] = i; 197 198 atomic_set(&pool->available, 0); 199 pool->producer_index = 0; 200 pool->consumer_index = 0; 201 202 return 0; 203 } 204 205 static inline void ibmveth_flush_buffer(void *addr, unsigned long length) 206 { 207 unsigned long offset; 208 209 for (offset = 0; offset < length; offset += SMP_CACHE_BYTES) 210 asm("dcbfl %0,%1" :: "b" (addr), "r" (offset)); 211 } 212 213 /* replenish the buffers for a pool. note that we don't need to 214 * skb_reserve these since they are used for incoming... 215 */ 216 static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter, 217 struct ibmveth_buff_pool *pool) 218 { 219 u32 i; 220 u32 count = pool->size - atomic_read(&pool->available); 221 u32 buffers_added = 0; 222 struct sk_buff *skb; 223 unsigned int free_index, index; 224 u64 correlator; 225 unsigned long lpar_rc; 226 dma_addr_t dma_addr; 227 228 mb(); 229 230 for (i = 0; i < count; ++i) { 231 union ibmveth_buf_desc desc; 232 233 skb = netdev_alloc_skb(adapter->netdev, pool->buff_size); 234 235 if (!skb) { 236 netdev_dbg(adapter->netdev, 237 "replenish: unable to allocate skb\n"); 238 adapter->replenish_no_mem++; 239 break; 240 } 241 242 free_index = pool->consumer_index; 243 pool->consumer_index++; 244 if (pool->consumer_index >= pool->size) 245 pool->consumer_index = 0; 246 index = pool->free_map[free_index]; 247 248 BUG_ON(index == IBM_VETH_INVALID_MAP); 249 BUG_ON(pool->skbuff[index] != NULL); 250 251 dma_addr = dma_map_single(&adapter->vdev->dev, skb->data, 252 pool->buff_size, DMA_FROM_DEVICE); 253 254 if (dma_mapping_error(&adapter->vdev->dev, dma_addr)) 255 goto failure; 256 257 pool->free_map[free_index] = IBM_VETH_INVALID_MAP; 258 pool->dma_addr[index] = dma_addr; 259 pool->skbuff[index] = skb; 260 261 correlator = ((u64)pool->index << 32) | index; 262 *(u64 *)skb->data = correlator; 263 264 desc.fields.flags_len = IBMVETH_BUF_VALID | pool->buff_size; 265 desc.fields.address = dma_addr; 266 267 if (rx_flush) { 268 unsigned int len = min(pool->buff_size, 269 adapter->netdev->mtu + 270 IBMVETH_BUFF_OH); 271 ibmveth_flush_buffer(skb->data, len); 272 } 273 lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, 274 desc.desc); 275 276 if (lpar_rc != H_SUCCESS) { 277 goto failure; 278 } else { 279 buffers_added++; 280 adapter->replenish_add_buff_success++; 281 } 282 } 283 284 mb(); 285 atomic_add(buffers_added, &(pool->available)); 286 return; 287 288 failure: 289 pool->free_map[free_index] = index; 290 pool->skbuff[index] = NULL; 291 if (pool->consumer_index == 0) 292 pool->consumer_index = pool->size - 1; 293 else 294 pool->consumer_index--; 295 if (!dma_mapping_error(&adapter->vdev->dev, dma_addr)) 296 dma_unmap_single(&adapter->vdev->dev, 297 pool->dma_addr[index], pool->buff_size, 298 DMA_FROM_DEVICE); 299 dev_kfree_skb_any(skb); 300 adapter->replenish_add_buff_failure++; 301 302 mb(); 303 atomic_add(buffers_added, &(pool->available)); 304 } 305 306 /* 307 * The final 8 bytes of the buffer list is a counter of frames dropped 308 * because there was not a buffer in the buffer list capable of holding 309 * the frame. 310 */ 311 static void ibmveth_update_rx_no_buffer(struct ibmveth_adapter *adapter) 312 { 313 __be64 *p = adapter->buffer_list_addr + 4096 - 8; 314 315 adapter->rx_no_buffer = be64_to_cpup(p); 316 } 317 318 /* replenish routine */ 319 static void ibmveth_replenish_task(struct ibmveth_adapter *adapter) 320 { 321 int i; 322 323 adapter->replenish_task_cycles++; 324 325 for (i = (IBMVETH_NUM_BUFF_POOLS - 1); i >= 0; i--) { 326 struct ibmveth_buff_pool *pool = &adapter->rx_buff_pool[i]; 327 328 if (pool->active && 329 (atomic_read(&pool->available) < pool->threshold)) 330 ibmveth_replenish_buffer_pool(adapter, pool); 331 } 332 333 ibmveth_update_rx_no_buffer(adapter); 334 } 335 336 /* empty and free ana buffer pool - also used to do cleanup in error paths */ 337 static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter, 338 struct ibmveth_buff_pool *pool) 339 { 340 int i; 341 342 kfree(pool->free_map); 343 pool->free_map = NULL; 344 345 if (pool->skbuff && pool->dma_addr) { 346 for (i = 0; i < pool->size; ++i) { 347 struct sk_buff *skb = pool->skbuff[i]; 348 if (skb) { 349 dma_unmap_single(&adapter->vdev->dev, 350 pool->dma_addr[i], 351 pool->buff_size, 352 DMA_FROM_DEVICE); 353 dev_kfree_skb_any(skb); 354 pool->skbuff[i] = NULL; 355 } 356 } 357 } 358 359 if (pool->dma_addr) { 360 kfree(pool->dma_addr); 361 pool->dma_addr = NULL; 362 } 363 364 if (pool->skbuff) { 365 kfree(pool->skbuff); 366 pool->skbuff = NULL; 367 } 368 } 369 370 /* remove a buffer from a pool */ 371 static void ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter, 372 u64 correlator) 373 { 374 unsigned int pool = correlator >> 32; 375 unsigned int index = correlator & 0xffffffffUL; 376 unsigned int free_index; 377 struct sk_buff *skb; 378 379 BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS); 380 BUG_ON(index >= adapter->rx_buff_pool[pool].size); 381 382 skb = adapter->rx_buff_pool[pool].skbuff[index]; 383 384 BUG_ON(skb == NULL); 385 386 adapter->rx_buff_pool[pool].skbuff[index] = NULL; 387 388 dma_unmap_single(&adapter->vdev->dev, 389 adapter->rx_buff_pool[pool].dma_addr[index], 390 adapter->rx_buff_pool[pool].buff_size, 391 DMA_FROM_DEVICE); 392 393 free_index = adapter->rx_buff_pool[pool].producer_index; 394 adapter->rx_buff_pool[pool].producer_index++; 395 if (adapter->rx_buff_pool[pool].producer_index >= 396 adapter->rx_buff_pool[pool].size) 397 adapter->rx_buff_pool[pool].producer_index = 0; 398 adapter->rx_buff_pool[pool].free_map[free_index] = index; 399 400 mb(); 401 402 atomic_dec(&(adapter->rx_buff_pool[pool].available)); 403 } 404 405 /* get the current buffer on the rx queue */ 406 static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter) 407 { 408 u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator; 409 unsigned int pool = correlator >> 32; 410 unsigned int index = correlator & 0xffffffffUL; 411 412 BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS); 413 BUG_ON(index >= adapter->rx_buff_pool[pool].size); 414 415 return adapter->rx_buff_pool[pool].skbuff[index]; 416 } 417 418 /* recycle the current buffer on the rx queue */ 419 static int ibmveth_rxq_recycle_buffer(struct ibmveth_adapter *adapter) 420 { 421 u32 q_index = adapter->rx_queue.index; 422 u64 correlator = adapter->rx_queue.queue_addr[q_index].correlator; 423 unsigned int pool = correlator >> 32; 424 unsigned int index = correlator & 0xffffffffUL; 425 union ibmveth_buf_desc desc; 426 unsigned long lpar_rc; 427 int ret = 1; 428 429 BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS); 430 BUG_ON(index >= adapter->rx_buff_pool[pool].size); 431 432 if (!adapter->rx_buff_pool[pool].active) { 433 ibmveth_rxq_harvest_buffer(adapter); 434 ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[pool]); 435 goto out; 436 } 437 438 desc.fields.flags_len = IBMVETH_BUF_VALID | 439 adapter->rx_buff_pool[pool].buff_size; 440 desc.fields.address = adapter->rx_buff_pool[pool].dma_addr[index]; 441 442 lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc); 443 444 if (lpar_rc != H_SUCCESS) { 445 netdev_dbg(adapter->netdev, "h_add_logical_lan_buffer failed " 446 "during recycle rc=%ld", lpar_rc); 447 ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator); 448 ret = 0; 449 } 450 451 if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) { 452 adapter->rx_queue.index = 0; 453 adapter->rx_queue.toggle = !adapter->rx_queue.toggle; 454 } 455 456 out: 457 return ret; 458 } 459 460 static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter) 461 { 462 ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator); 463 464 if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) { 465 adapter->rx_queue.index = 0; 466 adapter->rx_queue.toggle = !adapter->rx_queue.toggle; 467 } 468 } 469 470 static void ibmveth_cleanup(struct ibmveth_adapter *adapter) 471 { 472 int i; 473 struct device *dev = &adapter->vdev->dev; 474 475 if (adapter->buffer_list_addr != NULL) { 476 if (!dma_mapping_error(dev, adapter->buffer_list_dma)) { 477 dma_unmap_single(dev, adapter->buffer_list_dma, 4096, 478 DMA_BIDIRECTIONAL); 479 adapter->buffer_list_dma = DMA_ERROR_CODE; 480 } 481 free_page((unsigned long)adapter->buffer_list_addr); 482 adapter->buffer_list_addr = NULL; 483 } 484 485 if (adapter->filter_list_addr != NULL) { 486 if (!dma_mapping_error(dev, adapter->filter_list_dma)) { 487 dma_unmap_single(dev, adapter->filter_list_dma, 4096, 488 DMA_BIDIRECTIONAL); 489 adapter->filter_list_dma = DMA_ERROR_CODE; 490 } 491 free_page((unsigned long)adapter->filter_list_addr); 492 adapter->filter_list_addr = NULL; 493 } 494 495 if (adapter->rx_queue.queue_addr != NULL) { 496 dma_free_coherent(dev, adapter->rx_queue.queue_len, 497 adapter->rx_queue.queue_addr, 498 adapter->rx_queue.queue_dma); 499 adapter->rx_queue.queue_addr = NULL; 500 } 501 502 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) 503 if (adapter->rx_buff_pool[i].active) 504 ibmveth_free_buffer_pool(adapter, 505 &adapter->rx_buff_pool[i]); 506 507 if (adapter->bounce_buffer != NULL) { 508 if (!dma_mapping_error(dev, adapter->bounce_buffer_dma)) { 509 dma_unmap_single(&adapter->vdev->dev, 510 adapter->bounce_buffer_dma, 511 adapter->netdev->mtu + IBMVETH_BUFF_OH, 512 DMA_BIDIRECTIONAL); 513 adapter->bounce_buffer_dma = DMA_ERROR_CODE; 514 } 515 kfree(adapter->bounce_buffer); 516 adapter->bounce_buffer = NULL; 517 } 518 } 519 520 static int ibmveth_register_logical_lan(struct ibmveth_adapter *adapter, 521 union ibmveth_buf_desc rxq_desc, u64 mac_address) 522 { 523 int rc, try_again = 1; 524 525 /* 526 * After a kexec the adapter will still be open, so our attempt to 527 * open it will fail. So if we get a failure we free the adapter and 528 * try again, but only once. 529 */ 530 retry: 531 rc = h_register_logical_lan(adapter->vdev->unit_address, 532 adapter->buffer_list_dma, rxq_desc.desc, 533 adapter->filter_list_dma, mac_address); 534 535 if (rc != H_SUCCESS && try_again) { 536 do { 537 rc = h_free_logical_lan(adapter->vdev->unit_address); 538 } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY)); 539 540 try_again = 0; 541 goto retry; 542 } 543 544 return rc; 545 } 546 547 static u64 ibmveth_encode_mac_addr(u8 *mac) 548 { 549 int i; 550 u64 encoded = 0; 551 552 for (i = 0; i < ETH_ALEN; i++) 553 encoded = (encoded << 8) | mac[i]; 554 555 return encoded; 556 } 557 558 static int ibmveth_open(struct net_device *netdev) 559 { 560 struct ibmveth_adapter *adapter = netdev_priv(netdev); 561 u64 mac_address; 562 int rxq_entries = 1; 563 unsigned long lpar_rc; 564 int rc; 565 union ibmveth_buf_desc rxq_desc; 566 int i; 567 struct device *dev; 568 569 netdev_dbg(netdev, "open starting\n"); 570 571 napi_enable(&adapter->napi); 572 573 for(i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) 574 rxq_entries += adapter->rx_buff_pool[i].size; 575 576 adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL); 577 adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL); 578 579 if (!adapter->buffer_list_addr || !adapter->filter_list_addr) { 580 netdev_err(netdev, "unable to allocate filter or buffer list " 581 "pages\n"); 582 rc = -ENOMEM; 583 goto err_out; 584 } 585 586 dev = &adapter->vdev->dev; 587 588 adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) * 589 rxq_entries; 590 adapter->rx_queue.queue_addr = 591 dma_alloc_coherent(dev, adapter->rx_queue.queue_len, 592 &adapter->rx_queue.queue_dma, GFP_KERNEL); 593 if (!adapter->rx_queue.queue_addr) { 594 rc = -ENOMEM; 595 goto err_out; 596 } 597 598 adapter->buffer_list_dma = dma_map_single(dev, 599 adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL); 600 adapter->filter_list_dma = dma_map_single(dev, 601 adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL); 602 603 if ((dma_mapping_error(dev, adapter->buffer_list_dma)) || 604 (dma_mapping_error(dev, adapter->filter_list_dma))) { 605 netdev_err(netdev, "unable to map filter or buffer list " 606 "pages\n"); 607 rc = -ENOMEM; 608 goto err_out; 609 } 610 611 adapter->rx_queue.index = 0; 612 adapter->rx_queue.num_slots = rxq_entries; 613 adapter->rx_queue.toggle = 1; 614 615 mac_address = ibmveth_encode_mac_addr(netdev->dev_addr); 616 617 rxq_desc.fields.flags_len = IBMVETH_BUF_VALID | 618 adapter->rx_queue.queue_len; 619 rxq_desc.fields.address = adapter->rx_queue.queue_dma; 620 621 netdev_dbg(netdev, "buffer list @ 0x%p\n", adapter->buffer_list_addr); 622 netdev_dbg(netdev, "filter list @ 0x%p\n", adapter->filter_list_addr); 623 netdev_dbg(netdev, "receive q @ 0x%p\n", adapter->rx_queue.queue_addr); 624 625 h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE); 626 627 lpar_rc = ibmveth_register_logical_lan(adapter, rxq_desc, mac_address); 628 629 if (lpar_rc != H_SUCCESS) { 630 netdev_err(netdev, "h_register_logical_lan failed with %ld\n", 631 lpar_rc); 632 netdev_err(netdev, "buffer TCE:0x%llx filter TCE:0x%llx rxq " 633 "desc:0x%llx MAC:0x%llx\n", 634 adapter->buffer_list_dma, 635 adapter->filter_list_dma, 636 rxq_desc.desc, 637 mac_address); 638 rc = -ENONET; 639 goto err_out; 640 } 641 642 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) { 643 if (!adapter->rx_buff_pool[i].active) 644 continue; 645 if (ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[i])) { 646 netdev_err(netdev, "unable to alloc pool\n"); 647 adapter->rx_buff_pool[i].active = 0; 648 rc = -ENOMEM; 649 goto err_out; 650 } 651 } 652 653 netdev_dbg(netdev, "registering irq 0x%x\n", netdev->irq); 654 rc = request_irq(netdev->irq, ibmveth_interrupt, 0, netdev->name, 655 netdev); 656 if (rc != 0) { 657 netdev_err(netdev, "unable to request irq 0x%x, rc %d\n", 658 netdev->irq, rc); 659 do { 660 lpar_rc = h_free_logical_lan(adapter->vdev->unit_address); 661 } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY)); 662 663 goto err_out; 664 } 665 666 adapter->bounce_buffer = 667 kmalloc(netdev->mtu + IBMVETH_BUFF_OH, GFP_KERNEL); 668 if (!adapter->bounce_buffer) { 669 rc = -ENOMEM; 670 goto err_out_free_irq; 671 } 672 adapter->bounce_buffer_dma = 673 dma_map_single(&adapter->vdev->dev, adapter->bounce_buffer, 674 netdev->mtu + IBMVETH_BUFF_OH, DMA_BIDIRECTIONAL); 675 if (dma_mapping_error(dev, adapter->bounce_buffer_dma)) { 676 netdev_err(netdev, "unable to map bounce buffer\n"); 677 rc = -ENOMEM; 678 goto err_out_free_irq; 679 } 680 681 netdev_dbg(netdev, "initial replenish cycle\n"); 682 ibmveth_interrupt(netdev->irq, netdev); 683 684 netif_start_queue(netdev); 685 686 netdev_dbg(netdev, "open complete\n"); 687 688 return 0; 689 690 err_out_free_irq: 691 free_irq(netdev->irq, netdev); 692 err_out: 693 ibmveth_cleanup(adapter); 694 napi_disable(&adapter->napi); 695 return rc; 696 } 697 698 static int ibmveth_close(struct net_device *netdev) 699 { 700 struct ibmveth_adapter *adapter = netdev_priv(netdev); 701 long lpar_rc; 702 703 netdev_dbg(netdev, "close starting\n"); 704 705 napi_disable(&adapter->napi); 706 707 if (!adapter->pool_config) 708 netif_stop_queue(netdev); 709 710 h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE); 711 712 do { 713 lpar_rc = h_free_logical_lan(adapter->vdev->unit_address); 714 } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY)); 715 716 if (lpar_rc != H_SUCCESS) { 717 netdev_err(netdev, "h_free_logical_lan failed with %lx, " 718 "continuing with close\n", lpar_rc); 719 } 720 721 free_irq(netdev->irq, netdev); 722 723 ibmveth_update_rx_no_buffer(adapter); 724 725 ibmveth_cleanup(adapter); 726 727 netdev_dbg(netdev, "close complete\n"); 728 729 return 0; 730 } 731 732 static int netdev_get_settings(struct net_device *dev, struct ethtool_cmd *cmd) 733 { 734 cmd->supported = (SUPPORTED_1000baseT_Full | SUPPORTED_Autoneg | 735 SUPPORTED_FIBRE); 736 cmd->advertising = (ADVERTISED_1000baseT_Full | ADVERTISED_Autoneg | 737 ADVERTISED_FIBRE); 738 ethtool_cmd_speed_set(cmd, SPEED_1000); 739 cmd->duplex = DUPLEX_FULL; 740 cmd->port = PORT_FIBRE; 741 cmd->phy_address = 0; 742 cmd->transceiver = XCVR_INTERNAL; 743 cmd->autoneg = AUTONEG_ENABLE; 744 cmd->maxtxpkt = 0; 745 cmd->maxrxpkt = 1; 746 return 0; 747 } 748 749 static void netdev_get_drvinfo(struct net_device *dev, 750 struct ethtool_drvinfo *info) 751 { 752 strlcpy(info->driver, ibmveth_driver_name, sizeof(info->driver)); 753 strlcpy(info->version, ibmveth_driver_version, sizeof(info->version)); 754 } 755 756 static netdev_features_t ibmveth_fix_features(struct net_device *dev, 757 netdev_features_t features) 758 { 759 /* 760 * Since the ibmveth firmware interface does not have the 761 * concept of separate tx/rx checksum offload enable, if rx 762 * checksum is disabled we also have to disable tx checksum 763 * offload. Once we disable rx checksum offload, we are no 764 * longer allowed to send tx buffers that are not properly 765 * checksummed. 766 */ 767 768 if (!(features & NETIF_F_RXCSUM)) 769 features &= ~NETIF_F_CSUM_MASK; 770 771 return features; 772 } 773 774 static int ibmveth_set_csum_offload(struct net_device *dev, u32 data) 775 { 776 struct ibmveth_adapter *adapter = netdev_priv(dev); 777 unsigned long set_attr, clr_attr, ret_attr; 778 unsigned long set_attr6, clr_attr6; 779 long ret, ret4, ret6; 780 int rc1 = 0, rc2 = 0; 781 int restart = 0; 782 783 if (netif_running(dev)) { 784 restart = 1; 785 adapter->pool_config = 1; 786 ibmveth_close(dev); 787 adapter->pool_config = 0; 788 } 789 790 set_attr = 0; 791 clr_attr = 0; 792 set_attr6 = 0; 793 clr_attr6 = 0; 794 795 if (data) { 796 set_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM; 797 set_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM; 798 } else { 799 clr_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM; 800 clr_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM; 801 } 802 803 ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr); 804 805 if (ret == H_SUCCESS && !(ret_attr & IBMVETH_ILLAN_ACTIVE_TRUNK) && 806 !(ret_attr & IBMVETH_ILLAN_TRUNK_PRI_MASK) && 807 (ret_attr & IBMVETH_ILLAN_PADDED_PKT_CSUM)) { 808 ret4 = h_illan_attributes(adapter->vdev->unit_address, clr_attr, 809 set_attr, &ret_attr); 810 811 if (ret4 != H_SUCCESS) { 812 netdev_err(dev, "unable to change IPv4 checksum " 813 "offload settings. %d rc=%ld\n", 814 data, ret4); 815 816 h_illan_attributes(adapter->vdev->unit_address, 817 set_attr, clr_attr, &ret_attr); 818 819 if (data == 1) 820 dev->features &= ~NETIF_F_IP_CSUM; 821 822 } else { 823 adapter->fw_ipv4_csum_support = data; 824 } 825 826 ret6 = h_illan_attributes(adapter->vdev->unit_address, 827 clr_attr6, set_attr6, &ret_attr); 828 829 if (ret6 != H_SUCCESS) { 830 netdev_err(dev, "unable to change IPv6 checksum " 831 "offload settings. %d rc=%ld\n", 832 data, ret6); 833 834 h_illan_attributes(adapter->vdev->unit_address, 835 set_attr6, clr_attr6, &ret_attr); 836 837 if (data == 1) 838 dev->features &= ~NETIF_F_IPV6_CSUM; 839 840 } else 841 adapter->fw_ipv6_csum_support = data; 842 843 if (ret4 == H_SUCCESS || ret6 == H_SUCCESS) 844 adapter->rx_csum = data; 845 else 846 rc1 = -EIO; 847 } else { 848 rc1 = -EIO; 849 netdev_err(dev, "unable to change checksum offload settings." 850 " %d rc=%ld ret_attr=%lx\n", data, ret, 851 ret_attr); 852 } 853 854 if (restart) 855 rc2 = ibmveth_open(dev); 856 857 return rc1 ? rc1 : rc2; 858 } 859 860 static int ibmveth_set_tso(struct net_device *dev, u32 data) 861 { 862 struct ibmveth_adapter *adapter = netdev_priv(dev); 863 unsigned long set_attr, clr_attr, ret_attr; 864 long ret1, ret2; 865 int rc1 = 0, rc2 = 0; 866 int restart = 0; 867 868 if (netif_running(dev)) { 869 restart = 1; 870 adapter->pool_config = 1; 871 ibmveth_close(dev); 872 adapter->pool_config = 0; 873 } 874 875 set_attr = 0; 876 clr_attr = 0; 877 878 if (data) 879 set_attr = IBMVETH_ILLAN_LRG_SR_ENABLED; 880 else 881 clr_attr = IBMVETH_ILLAN_LRG_SR_ENABLED; 882 883 ret1 = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr); 884 885 if (ret1 == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_LRG_SND_SUPPORT) && 886 !old_large_send) { 887 ret2 = h_illan_attributes(adapter->vdev->unit_address, clr_attr, 888 set_attr, &ret_attr); 889 890 if (ret2 != H_SUCCESS) { 891 netdev_err(dev, "unable to change tso settings. %d rc=%ld\n", 892 data, ret2); 893 894 h_illan_attributes(adapter->vdev->unit_address, 895 set_attr, clr_attr, &ret_attr); 896 897 if (data == 1) 898 dev->features &= ~(NETIF_F_TSO | NETIF_F_TSO6); 899 rc1 = -EIO; 900 901 } else { 902 adapter->fw_large_send_support = data; 903 adapter->large_send = data; 904 } 905 } else { 906 /* Older firmware version of large send offload does not 907 * support tcp6/ipv6 908 */ 909 if (data == 1) { 910 dev->features &= ~NETIF_F_TSO6; 911 netdev_info(dev, "TSO feature requires all partitions to have updated driver"); 912 } 913 adapter->large_send = data; 914 } 915 916 if (restart) 917 rc2 = ibmveth_open(dev); 918 919 return rc1 ? rc1 : rc2; 920 } 921 922 static int ibmveth_set_features(struct net_device *dev, 923 netdev_features_t features) 924 { 925 struct ibmveth_adapter *adapter = netdev_priv(dev); 926 int rx_csum = !!(features & NETIF_F_RXCSUM); 927 int large_send = !!(features & (NETIF_F_TSO | NETIF_F_TSO6)); 928 int rc1 = 0, rc2 = 0; 929 930 if (rx_csum != adapter->rx_csum) { 931 rc1 = ibmveth_set_csum_offload(dev, rx_csum); 932 if (rc1 && !adapter->rx_csum) 933 dev->features = 934 features & ~(NETIF_F_CSUM_MASK | 935 NETIF_F_RXCSUM); 936 } 937 938 if (large_send != adapter->large_send) { 939 rc2 = ibmveth_set_tso(dev, large_send); 940 if (rc2 && !adapter->large_send) 941 dev->features = 942 features & ~(NETIF_F_TSO | NETIF_F_TSO6); 943 } 944 945 return rc1 ? rc1 : rc2; 946 } 947 948 static void ibmveth_get_strings(struct net_device *dev, u32 stringset, u8 *data) 949 { 950 int i; 951 952 if (stringset != ETH_SS_STATS) 953 return; 954 955 for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++, data += ETH_GSTRING_LEN) 956 memcpy(data, ibmveth_stats[i].name, ETH_GSTRING_LEN); 957 } 958 959 static int ibmveth_get_sset_count(struct net_device *dev, int sset) 960 { 961 switch (sset) { 962 case ETH_SS_STATS: 963 return ARRAY_SIZE(ibmveth_stats); 964 default: 965 return -EOPNOTSUPP; 966 } 967 } 968 969 static void ibmveth_get_ethtool_stats(struct net_device *dev, 970 struct ethtool_stats *stats, u64 *data) 971 { 972 int i; 973 struct ibmveth_adapter *adapter = netdev_priv(dev); 974 975 for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++) 976 data[i] = IBMVETH_GET_STAT(adapter, ibmveth_stats[i].offset); 977 } 978 979 static const struct ethtool_ops netdev_ethtool_ops = { 980 .get_drvinfo = netdev_get_drvinfo, 981 .get_settings = netdev_get_settings, 982 .get_link = ethtool_op_get_link, 983 .get_strings = ibmveth_get_strings, 984 .get_sset_count = ibmveth_get_sset_count, 985 .get_ethtool_stats = ibmveth_get_ethtool_stats, 986 }; 987 988 static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd) 989 { 990 return -EOPNOTSUPP; 991 } 992 993 #define page_offset(v) ((unsigned long)(v) & ((1 << 12) - 1)) 994 995 static int ibmveth_send(struct ibmveth_adapter *adapter, 996 union ibmveth_buf_desc *descs, unsigned long mss) 997 { 998 unsigned long correlator; 999 unsigned int retry_count; 1000 unsigned long ret; 1001 1002 /* 1003 * The retry count sets a maximum for the number of broadcast and 1004 * multicast destinations within the system. 1005 */ 1006 retry_count = 1024; 1007 correlator = 0; 1008 do { 1009 ret = h_send_logical_lan(adapter->vdev->unit_address, 1010 descs[0].desc, descs[1].desc, 1011 descs[2].desc, descs[3].desc, 1012 descs[4].desc, descs[5].desc, 1013 correlator, &correlator, mss, 1014 adapter->fw_large_send_support); 1015 } while ((ret == H_BUSY) && (retry_count--)); 1016 1017 if (ret != H_SUCCESS && ret != H_DROPPED) { 1018 netdev_err(adapter->netdev, "tx: h_send_logical_lan failed " 1019 "with rc=%ld\n", ret); 1020 return 1; 1021 } 1022 1023 return 0; 1024 } 1025 1026 static netdev_tx_t ibmveth_start_xmit(struct sk_buff *skb, 1027 struct net_device *netdev) 1028 { 1029 struct ibmveth_adapter *adapter = netdev_priv(netdev); 1030 unsigned int desc_flags; 1031 union ibmveth_buf_desc descs[6]; 1032 int last, i; 1033 int force_bounce = 0; 1034 dma_addr_t dma_addr; 1035 unsigned long mss = 0; 1036 1037 /* 1038 * veth handles a maximum of 6 segments including the header, so 1039 * we have to linearize the skb if there are more than this. 1040 */ 1041 if (skb_shinfo(skb)->nr_frags > 5 && __skb_linearize(skb)) { 1042 netdev->stats.tx_dropped++; 1043 goto out; 1044 } 1045 1046 /* veth can't checksum offload UDP */ 1047 if (skb->ip_summed == CHECKSUM_PARTIAL && 1048 ((skb->protocol == htons(ETH_P_IP) && 1049 ip_hdr(skb)->protocol != IPPROTO_TCP) || 1050 (skb->protocol == htons(ETH_P_IPV6) && 1051 ipv6_hdr(skb)->nexthdr != IPPROTO_TCP)) && 1052 skb_checksum_help(skb)) { 1053 1054 netdev_err(netdev, "tx: failed to checksum packet\n"); 1055 netdev->stats.tx_dropped++; 1056 goto out; 1057 } 1058 1059 desc_flags = IBMVETH_BUF_VALID; 1060 1061 if (skb_is_gso(skb) && adapter->fw_large_send_support) 1062 desc_flags |= IBMVETH_BUF_LRG_SND; 1063 1064 if (skb->ip_summed == CHECKSUM_PARTIAL) { 1065 unsigned char *buf = skb_transport_header(skb) + 1066 skb->csum_offset; 1067 1068 desc_flags |= (IBMVETH_BUF_NO_CSUM | IBMVETH_BUF_CSUM_GOOD); 1069 1070 /* Need to zero out the checksum */ 1071 buf[0] = 0; 1072 buf[1] = 0; 1073 } 1074 1075 retry_bounce: 1076 memset(descs, 0, sizeof(descs)); 1077 1078 /* 1079 * If a linear packet is below the rx threshold then 1080 * copy it into the static bounce buffer. This avoids the 1081 * cost of a TCE insert and remove. 1082 */ 1083 if (force_bounce || (!skb_is_nonlinear(skb) && 1084 (skb->len < tx_copybreak))) { 1085 skb_copy_from_linear_data(skb, adapter->bounce_buffer, 1086 skb->len); 1087 1088 descs[0].fields.flags_len = desc_flags | skb->len; 1089 descs[0].fields.address = adapter->bounce_buffer_dma; 1090 1091 if (ibmveth_send(adapter, descs, 0)) { 1092 adapter->tx_send_failed++; 1093 netdev->stats.tx_dropped++; 1094 } else { 1095 netdev->stats.tx_packets++; 1096 netdev->stats.tx_bytes += skb->len; 1097 } 1098 1099 goto out; 1100 } 1101 1102 /* Map the header */ 1103 dma_addr = dma_map_single(&adapter->vdev->dev, skb->data, 1104 skb_headlen(skb), DMA_TO_DEVICE); 1105 if (dma_mapping_error(&adapter->vdev->dev, dma_addr)) 1106 goto map_failed; 1107 1108 descs[0].fields.flags_len = desc_flags | skb_headlen(skb); 1109 descs[0].fields.address = dma_addr; 1110 1111 /* Map the frags */ 1112 for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) { 1113 const skb_frag_t *frag = &skb_shinfo(skb)->frags[i]; 1114 1115 dma_addr = skb_frag_dma_map(&adapter->vdev->dev, frag, 0, 1116 skb_frag_size(frag), DMA_TO_DEVICE); 1117 1118 if (dma_mapping_error(&adapter->vdev->dev, dma_addr)) 1119 goto map_failed_frags; 1120 1121 descs[i+1].fields.flags_len = desc_flags | skb_frag_size(frag); 1122 descs[i+1].fields.address = dma_addr; 1123 } 1124 1125 if (skb_is_gso(skb)) { 1126 if (adapter->fw_large_send_support) { 1127 mss = (unsigned long)skb_shinfo(skb)->gso_size; 1128 adapter->tx_large_packets++; 1129 } else if (!skb_is_gso_v6(skb)) { 1130 /* Put -1 in the IP checksum to tell phyp it 1131 * is a largesend packet. Put the mss in 1132 * the TCP checksum. 1133 */ 1134 ip_hdr(skb)->check = 0xffff; 1135 tcp_hdr(skb)->check = 1136 cpu_to_be16(skb_shinfo(skb)->gso_size); 1137 adapter->tx_large_packets++; 1138 } 1139 } 1140 1141 if (ibmveth_send(adapter, descs, mss)) { 1142 adapter->tx_send_failed++; 1143 netdev->stats.tx_dropped++; 1144 } else { 1145 netdev->stats.tx_packets++; 1146 netdev->stats.tx_bytes += skb->len; 1147 } 1148 1149 dma_unmap_single(&adapter->vdev->dev, 1150 descs[0].fields.address, 1151 descs[0].fields.flags_len & IBMVETH_BUF_LEN_MASK, 1152 DMA_TO_DEVICE); 1153 1154 for (i = 1; i < skb_shinfo(skb)->nr_frags + 1; i++) 1155 dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address, 1156 descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK, 1157 DMA_TO_DEVICE); 1158 1159 out: 1160 dev_consume_skb_any(skb); 1161 return NETDEV_TX_OK; 1162 1163 map_failed_frags: 1164 last = i+1; 1165 for (i = 0; i < last; i++) 1166 dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address, 1167 descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK, 1168 DMA_TO_DEVICE); 1169 1170 map_failed: 1171 if (!firmware_has_feature(FW_FEATURE_CMO)) 1172 netdev_err(netdev, "tx: unable to map xmit buffer\n"); 1173 adapter->tx_map_failed++; 1174 if (skb_linearize(skb)) { 1175 netdev->stats.tx_dropped++; 1176 goto out; 1177 } 1178 force_bounce = 1; 1179 goto retry_bounce; 1180 } 1181 1182 static void ibmveth_rx_mss_helper(struct sk_buff *skb, u16 mss, int lrg_pkt) 1183 { 1184 int offset = 0; 1185 1186 /* only TCP packets will be aggregated */ 1187 if (skb->protocol == htons(ETH_P_IP)) { 1188 struct iphdr *iph = (struct iphdr *)skb->data; 1189 1190 if (iph->protocol == IPPROTO_TCP) { 1191 offset = iph->ihl * 4; 1192 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4; 1193 } else { 1194 return; 1195 } 1196 } else if (skb->protocol == htons(ETH_P_IPV6)) { 1197 struct ipv6hdr *iph6 = (struct ipv6hdr *)skb->data; 1198 1199 if (iph6->nexthdr == IPPROTO_TCP) { 1200 offset = sizeof(struct ipv6hdr); 1201 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6; 1202 } else { 1203 return; 1204 } 1205 } else { 1206 return; 1207 } 1208 /* if mss is not set through Large Packet bit/mss in rx buffer, 1209 * expect that the mss will be written to the tcp header checksum. 1210 */ 1211 if (lrg_pkt) { 1212 skb_shinfo(skb)->gso_size = mss; 1213 } else if (offset) { 1214 struct tcphdr *tcph = (struct tcphdr *)(skb->data + offset); 1215 1216 skb_shinfo(skb)->gso_size = ntohs(tcph->check); 1217 tcph->check = 0; 1218 } 1219 } 1220 1221 static int ibmveth_poll(struct napi_struct *napi, int budget) 1222 { 1223 struct ibmveth_adapter *adapter = 1224 container_of(napi, struct ibmveth_adapter, napi); 1225 struct net_device *netdev = adapter->netdev; 1226 int frames_processed = 0; 1227 unsigned long lpar_rc; 1228 struct iphdr *iph; 1229 u16 mss = 0; 1230 1231 restart_poll: 1232 while (frames_processed < budget) { 1233 if (!ibmveth_rxq_pending_buffer(adapter)) 1234 break; 1235 1236 smp_rmb(); 1237 if (!ibmveth_rxq_buffer_valid(adapter)) { 1238 wmb(); /* suggested by larson1 */ 1239 adapter->rx_invalid_buffer++; 1240 netdev_dbg(netdev, "recycling invalid buffer\n"); 1241 ibmveth_rxq_recycle_buffer(adapter); 1242 } else { 1243 struct sk_buff *skb, *new_skb; 1244 int length = ibmveth_rxq_frame_length(adapter); 1245 int offset = ibmveth_rxq_frame_offset(adapter); 1246 int csum_good = ibmveth_rxq_csum_good(adapter); 1247 int lrg_pkt = ibmveth_rxq_large_packet(adapter); 1248 1249 skb = ibmveth_rxq_get_buffer(adapter); 1250 1251 /* if the large packet bit is set in the rx queue 1252 * descriptor, the mss will be written by PHYP eight 1253 * bytes from the start of the rx buffer, which is 1254 * skb->data at this stage 1255 */ 1256 if (lrg_pkt) { 1257 __be64 *rxmss = (__be64 *)(skb->data + 8); 1258 1259 mss = (u16)be64_to_cpu(*rxmss); 1260 } 1261 1262 new_skb = NULL; 1263 if (length < rx_copybreak) 1264 new_skb = netdev_alloc_skb(netdev, length); 1265 1266 if (new_skb) { 1267 skb_copy_to_linear_data(new_skb, 1268 skb->data + offset, 1269 length); 1270 if (rx_flush) 1271 ibmveth_flush_buffer(skb->data, 1272 length + offset); 1273 if (!ibmveth_rxq_recycle_buffer(adapter)) 1274 kfree_skb(skb); 1275 skb = new_skb; 1276 } else { 1277 ibmveth_rxq_harvest_buffer(adapter); 1278 skb_reserve(skb, offset); 1279 } 1280 1281 skb_put(skb, length); 1282 skb->protocol = eth_type_trans(skb, netdev); 1283 1284 if (csum_good) { 1285 skb->ip_summed = CHECKSUM_UNNECESSARY; 1286 if (be16_to_cpu(skb->protocol) == ETH_P_IP) { 1287 iph = (struct iphdr *)skb->data; 1288 1289 /* If the IP checksum is not offloaded and if the packet 1290 * is large send, the checksum must be rebuilt. 1291 */ 1292 if (iph->check == 0xffff) { 1293 iph->check = 0; 1294 iph->check = ip_fast_csum((unsigned char *)iph, iph->ihl); 1295 } 1296 } 1297 } 1298 1299 if (length > netdev->mtu + ETH_HLEN) { 1300 ibmveth_rx_mss_helper(skb, mss, lrg_pkt); 1301 adapter->rx_large_packets++; 1302 } 1303 1304 napi_gro_receive(napi, skb); /* send it up */ 1305 1306 netdev->stats.rx_packets++; 1307 netdev->stats.rx_bytes += length; 1308 frames_processed++; 1309 } 1310 } 1311 1312 ibmveth_replenish_task(adapter); 1313 1314 if (frames_processed < budget) { 1315 napi_complete(napi); 1316 1317 /* We think we are done - reenable interrupts, 1318 * then check once more to make sure we are done. 1319 */ 1320 lpar_rc = h_vio_signal(adapter->vdev->unit_address, 1321 VIO_IRQ_ENABLE); 1322 1323 BUG_ON(lpar_rc != H_SUCCESS); 1324 1325 if (ibmveth_rxq_pending_buffer(adapter) && 1326 napi_reschedule(napi)) { 1327 lpar_rc = h_vio_signal(adapter->vdev->unit_address, 1328 VIO_IRQ_DISABLE); 1329 goto restart_poll; 1330 } 1331 } 1332 1333 return frames_processed; 1334 } 1335 1336 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance) 1337 { 1338 struct net_device *netdev = dev_instance; 1339 struct ibmveth_adapter *adapter = netdev_priv(netdev); 1340 unsigned long lpar_rc; 1341 1342 if (napi_schedule_prep(&adapter->napi)) { 1343 lpar_rc = h_vio_signal(adapter->vdev->unit_address, 1344 VIO_IRQ_DISABLE); 1345 BUG_ON(lpar_rc != H_SUCCESS); 1346 __napi_schedule(&adapter->napi); 1347 } 1348 return IRQ_HANDLED; 1349 } 1350 1351 static void ibmveth_set_multicast_list(struct net_device *netdev) 1352 { 1353 struct ibmveth_adapter *adapter = netdev_priv(netdev); 1354 unsigned long lpar_rc; 1355 1356 if ((netdev->flags & IFF_PROMISC) || 1357 (netdev_mc_count(netdev) > adapter->mcastFilterSize)) { 1358 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address, 1359 IbmVethMcastEnableRecv | 1360 IbmVethMcastDisableFiltering, 1361 0); 1362 if (lpar_rc != H_SUCCESS) { 1363 netdev_err(netdev, "h_multicast_ctrl rc=%ld when " 1364 "entering promisc mode\n", lpar_rc); 1365 } 1366 } else { 1367 struct netdev_hw_addr *ha; 1368 /* clear the filter table & disable filtering */ 1369 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address, 1370 IbmVethMcastEnableRecv | 1371 IbmVethMcastDisableFiltering | 1372 IbmVethMcastClearFilterTable, 1373 0); 1374 if (lpar_rc != H_SUCCESS) { 1375 netdev_err(netdev, "h_multicast_ctrl rc=%ld when " 1376 "attempting to clear filter table\n", 1377 lpar_rc); 1378 } 1379 /* add the addresses to the filter table */ 1380 netdev_for_each_mc_addr(ha, netdev) { 1381 /* add the multicast address to the filter table */ 1382 u64 mcast_addr; 1383 mcast_addr = ibmveth_encode_mac_addr(ha->addr); 1384 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address, 1385 IbmVethMcastAddFilter, 1386 mcast_addr); 1387 if (lpar_rc != H_SUCCESS) { 1388 netdev_err(netdev, "h_multicast_ctrl rc=%ld " 1389 "when adding an entry to the filter " 1390 "table\n", lpar_rc); 1391 } 1392 } 1393 1394 /* re-enable filtering */ 1395 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address, 1396 IbmVethMcastEnableFiltering, 1397 0); 1398 if (lpar_rc != H_SUCCESS) { 1399 netdev_err(netdev, "h_multicast_ctrl rc=%ld when " 1400 "enabling filtering\n", lpar_rc); 1401 } 1402 } 1403 } 1404 1405 static int ibmveth_change_mtu(struct net_device *dev, int new_mtu) 1406 { 1407 struct ibmveth_adapter *adapter = netdev_priv(dev); 1408 struct vio_dev *viodev = adapter->vdev; 1409 int new_mtu_oh = new_mtu + IBMVETH_BUFF_OH; 1410 int i, rc; 1411 int need_restart = 0; 1412 1413 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) 1414 if (new_mtu_oh <= adapter->rx_buff_pool[i].buff_size) 1415 break; 1416 1417 if (i == IBMVETH_NUM_BUFF_POOLS) 1418 return -EINVAL; 1419 1420 /* Deactivate all the buffer pools so that the next loop can activate 1421 only the buffer pools necessary to hold the new MTU */ 1422 if (netif_running(adapter->netdev)) { 1423 need_restart = 1; 1424 adapter->pool_config = 1; 1425 ibmveth_close(adapter->netdev); 1426 adapter->pool_config = 0; 1427 } 1428 1429 /* Look for an active buffer pool that can hold the new MTU */ 1430 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) { 1431 adapter->rx_buff_pool[i].active = 1; 1432 1433 if (new_mtu_oh <= adapter->rx_buff_pool[i].buff_size) { 1434 dev->mtu = new_mtu; 1435 vio_cmo_set_dev_desired(viodev, 1436 ibmveth_get_desired_dma 1437 (viodev)); 1438 if (need_restart) { 1439 return ibmveth_open(adapter->netdev); 1440 } 1441 return 0; 1442 } 1443 } 1444 1445 if (need_restart && (rc = ibmveth_open(adapter->netdev))) 1446 return rc; 1447 1448 return -EINVAL; 1449 } 1450 1451 #ifdef CONFIG_NET_POLL_CONTROLLER 1452 static void ibmveth_poll_controller(struct net_device *dev) 1453 { 1454 ibmveth_replenish_task(netdev_priv(dev)); 1455 ibmveth_interrupt(dev->irq, dev); 1456 } 1457 #endif 1458 1459 /** 1460 * ibmveth_get_desired_dma - Calculate IO memory desired by the driver 1461 * 1462 * @vdev: struct vio_dev for the device whose desired IO mem is to be returned 1463 * 1464 * Return value: 1465 * Number of bytes of IO data the driver will need to perform well. 1466 */ 1467 static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev) 1468 { 1469 struct net_device *netdev = dev_get_drvdata(&vdev->dev); 1470 struct ibmveth_adapter *adapter; 1471 struct iommu_table *tbl; 1472 unsigned long ret; 1473 int i; 1474 int rxqentries = 1; 1475 1476 tbl = get_iommu_table_base(&vdev->dev); 1477 1478 /* netdev inits at probe time along with the structures we need below*/ 1479 if (netdev == NULL) 1480 return IOMMU_PAGE_ALIGN(IBMVETH_IO_ENTITLEMENT_DEFAULT, tbl); 1481 1482 adapter = netdev_priv(netdev); 1483 1484 ret = IBMVETH_BUFF_LIST_SIZE + IBMVETH_FILT_LIST_SIZE; 1485 ret += IOMMU_PAGE_ALIGN(netdev->mtu, tbl); 1486 1487 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) { 1488 /* add the size of the active receive buffers */ 1489 if (adapter->rx_buff_pool[i].active) 1490 ret += 1491 adapter->rx_buff_pool[i].size * 1492 IOMMU_PAGE_ALIGN(adapter->rx_buff_pool[i]. 1493 buff_size, tbl); 1494 rxqentries += adapter->rx_buff_pool[i].size; 1495 } 1496 /* add the size of the receive queue entries */ 1497 ret += IOMMU_PAGE_ALIGN( 1498 rxqentries * sizeof(struct ibmveth_rx_q_entry), tbl); 1499 1500 return ret; 1501 } 1502 1503 static int ibmveth_set_mac_addr(struct net_device *dev, void *p) 1504 { 1505 struct ibmveth_adapter *adapter = netdev_priv(dev); 1506 struct sockaddr *addr = p; 1507 u64 mac_address; 1508 int rc; 1509 1510 if (!is_valid_ether_addr(addr->sa_data)) 1511 return -EADDRNOTAVAIL; 1512 1513 mac_address = ibmveth_encode_mac_addr(addr->sa_data); 1514 rc = h_change_logical_lan_mac(adapter->vdev->unit_address, mac_address); 1515 if (rc) { 1516 netdev_err(adapter->netdev, "h_change_logical_lan_mac failed with rc=%d\n", rc); 1517 return rc; 1518 } 1519 1520 ether_addr_copy(dev->dev_addr, addr->sa_data); 1521 1522 return 0; 1523 } 1524 1525 static const struct net_device_ops ibmveth_netdev_ops = { 1526 .ndo_open = ibmveth_open, 1527 .ndo_stop = ibmveth_close, 1528 .ndo_start_xmit = ibmveth_start_xmit, 1529 .ndo_set_rx_mode = ibmveth_set_multicast_list, 1530 .ndo_do_ioctl = ibmveth_ioctl, 1531 .ndo_change_mtu = ibmveth_change_mtu, 1532 .ndo_fix_features = ibmveth_fix_features, 1533 .ndo_set_features = ibmveth_set_features, 1534 .ndo_validate_addr = eth_validate_addr, 1535 .ndo_set_mac_address = ibmveth_set_mac_addr, 1536 #ifdef CONFIG_NET_POLL_CONTROLLER 1537 .ndo_poll_controller = ibmveth_poll_controller, 1538 #endif 1539 }; 1540 1541 static int ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id) 1542 { 1543 int rc, i, mac_len; 1544 struct net_device *netdev; 1545 struct ibmveth_adapter *adapter; 1546 unsigned char *mac_addr_p; 1547 unsigned int *mcastFilterSize_p; 1548 long ret; 1549 unsigned long ret_attr; 1550 1551 dev_dbg(&dev->dev, "entering ibmveth_probe for UA 0x%x\n", 1552 dev->unit_address); 1553 1554 mac_addr_p = (unsigned char *)vio_get_attribute(dev, VETH_MAC_ADDR, 1555 &mac_len); 1556 if (!mac_addr_p) { 1557 dev_err(&dev->dev, "Can't find VETH_MAC_ADDR attribute\n"); 1558 return -EINVAL; 1559 } 1560 /* Workaround for old/broken pHyp */ 1561 if (mac_len == 8) 1562 mac_addr_p += 2; 1563 else if (mac_len != 6) { 1564 dev_err(&dev->dev, "VETH_MAC_ADDR attribute wrong len %d\n", 1565 mac_len); 1566 return -EINVAL; 1567 } 1568 1569 mcastFilterSize_p = (unsigned int *)vio_get_attribute(dev, 1570 VETH_MCAST_FILTER_SIZE, NULL); 1571 if (!mcastFilterSize_p) { 1572 dev_err(&dev->dev, "Can't find VETH_MCAST_FILTER_SIZE " 1573 "attribute\n"); 1574 return -EINVAL; 1575 } 1576 1577 netdev = alloc_etherdev(sizeof(struct ibmveth_adapter)); 1578 1579 if (!netdev) 1580 return -ENOMEM; 1581 1582 adapter = netdev_priv(netdev); 1583 dev_set_drvdata(&dev->dev, netdev); 1584 1585 adapter->vdev = dev; 1586 adapter->netdev = netdev; 1587 adapter->mcastFilterSize = *mcastFilterSize_p; 1588 adapter->pool_config = 0; 1589 1590 netif_napi_add(netdev, &adapter->napi, ibmveth_poll, 16); 1591 1592 netdev->irq = dev->irq; 1593 netdev->netdev_ops = &ibmveth_netdev_ops; 1594 netdev->ethtool_ops = &netdev_ethtool_ops; 1595 SET_NETDEV_DEV(netdev, &dev->dev); 1596 netdev->hw_features = NETIF_F_SG | NETIF_F_RXCSUM | 1597 NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM; 1598 1599 netdev->features |= netdev->hw_features; 1600 1601 ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr); 1602 1603 /* If running older firmware, TSO should not be enabled by default */ 1604 if (ret == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_LRG_SND_SUPPORT) && 1605 !old_large_send) { 1606 netdev->hw_features |= NETIF_F_TSO | NETIF_F_TSO6; 1607 netdev->features |= netdev->hw_features; 1608 } else { 1609 netdev->hw_features |= NETIF_F_TSO; 1610 } 1611 1612 netdev->min_mtu = IBMVETH_MIN_MTU; 1613 netdev->max_mtu = ETH_MAX_MTU; 1614 1615 memcpy(netdev->dev_addr, mac_addr_p, ETH_ALEN); 1616 1617 if (firmware_has_feature(FW_FEATURE_CMO)) 1618 memcpy(pool_count, pool_count_cmo, sizeof(pool_count)); 1619 1620 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) { 1621 struct kobject *kobj = &adapter->rx_buff_pool[i].kobj; 1622 int error; 1623 1624 ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i, 1625 pool_count[i], pool_size[i], 1626 pool_active[i]); 1627 error = kobject_init_and_add(kobj, &ktype_veth_pool, 1628 &dev->dev.kobj, "pool%d", i); 1629 if (!error) 1630 kobject_uevent(kobj, KOBJ_ADD); 1631 } 1632 1633 netdev_dbg(netdev, "adapter @ 0x%p\n", adapter); 1634 1635 adapter->buffer_list_dma = DMA_ERROR_CODE; 1636 adapter->filter_list_dma = DMA_ERROR_CODE; 1637 adapter->rx_queue.queue_dma = DMA_ERROR_CODE; 1638 1639 netdev_dbg(netdev, "registering netdev...\n"); 1640 1641 ibmveth_set_features(netdev, netdev->features); 1642 1643 rc = register_netdev(netdev); 1644 1645 if (rc) { 1646 netdev_dbg(netdev, "failed to register netdev rc=%d\n", rc); 1647 free_netdev(netdev); 1648 return rc; 1649 } 1650 1651 netdev_dbg(netdev, "registered\n"); 1652 1653 return 0; 1654 } 1655 1656 static int ibmveth_remove(struct vio_dev *dev) 1657 { 1658 struct net_device *netdev = dev_get_drvdata(&dev->dev); 1659 struct ibmveth_adapter *adapter = netdev_priv(netdev); 1660 int i; 1661 1662 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) 1663 kobject_put(&adapter->rx_buff_pool[i].kobj); 1664 1665 unregister_netdev(netdev); 1666 1667 free_netdev(netdev); 1668 dev_set_drvdata(&dev->dev, NULL); 1669 1670 return 0; 1671 } 1672 1673 static struct attribute veth_active_attr; 1674 static struct attribute veth_num_attr; 1675 static struct attribute veth_size_attr; 1676 1677 static ssize_t veth_pool_show(struct kobject *kobj, 1678 struct attribute *attr, char *buf) 1679 { 1680 struct ibmveth_buff_pool *pool = container_of(kobj, 1681 struct ibmveth_buff_pool, 1682 kobj); 1683 1684 if (attr == &veth_active_attr) 1685 return sprintf(buf, "%d\n", pool->active); 1686 else if (attr == &veth_num_attr) 1687 return sprintf(buf, "%d\n", pool->size); 1688 else if (attr == &veth_size_attr) 1689 return sprintf(buf, "%d\n", pool->buff_size); 1690 return 0; 1691 } 1692 1693 static ssize_t veth_pool_store(struct kobject *kobj, struct attribute *attr, 1694 const char *buf, size_t count) 1695 { 1696 struct ibmveth_buff_pool *pool = container_of(kobj, 1697 struct ibmveth_buff_pool, 1698 kobj); 1699 struct net_device *netdev = dev_get_drvdata( 1700 container_of(kobj->parent, struct device, kobj)); 1701 struct ibmveth_adapter *adapter = netdev_priv(netdev); 1702 long value = simple_strtol(buf, NULL, 10); 1703 long rc; 1704 1705 if (attr == &veth_active_attr) { 1706 if (value && !pool->active) { 1707 if (netif_running(netdev)) { 1708 if (ibmveth_alloc_buffer_pool(pool)) { 1709 netdev_err(netdev, 1710 "unable to alloc pool\n"); 1711 return -ENOMEM; 1712 } 1713 pool->active = 1; 1714 adapter->pool_config = 1; 1715 ibmveth_close(netdev); 1716 adapter->pool_config = 0; 1717 if ((rc = ibmveth_open(netdev))) 1718 return rc; 1719 } else { 1720 pool->active = 1; 1721 } 1722 } else if (!value && pool->active) { 1723 int mtu = netdev->mtu + IBMVETH_BUFF_OH; 1724 int i; 1725 /* Make sure there is a buffer pool with buffers that 1726 can hold a packet of the size of the MTU */ 1727 for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) { 1728 if (pool == &adapter->rx_buff_pool[i]) 1729 continue; 1730 if (!adapter->rx_buff_pool[i].active) 1731 continue; 1732 if (mtu <= adapter->rx_buff_pool[i].buff_size) 1733 break; 1734 } 1735 1736 if (i == IBMVETH_NUM_BUFF_POOLS) { 1737 netdev_err(netdev, "no active pool >= MTU\n"); 1738 return -EPERM; 1739 } 1740 1741 if (netif_running(netdev)) { 1742 adapter->pool_config = 1; 1743 ibmveth_close(netdev); 1744 pool->active = 0; 1745 adapter->pool_config = 0; 1746 if ((rc = ibmveth_open(netdev))) 1747 return rc; 1748 } 1749 pool->active = 0; 1750 } 1751 } else if (attr == &veth_num_attr) { 1752 if (value <= 0 || value > IBMVETH_MAX_POOL_COUNT) { 1753 return -EINVAL; 1754 } else { 1755 if (netif_running(netdev)) { 1756 adapter->pool_config = 1; 1757 ibmveth_close(netdev); 1758 adapter->pool_config = 0; 1759 pool->size = value; 1760 if ((rc = ibmveth_open(netdev))) 1761 return rc; 1762 } else { 1763 pool->size = value; 1764 } 1765 } 1766 } else if (attr == &veth_size_attr) { 1767 if (value <= IBMVETH_BUFF_OH || value > IBMVETH_MAX_BUF_SIZE) { 1768 return -EINVAL; 1769 } else { 1770 if (netif_running(netdev)) { 1771 adapter->pool_config = 1; 1772 ibmveth_close(netdev); 1773 adapter->pool_config = 0; 1774 pool->buff_size = value; 1775 if ((rc = ibmveth_open(netdev))) 1776 return rc; 1777 } else { 1778 pool->buff_size = value; 1779 } 1780 } 1781 } 1782 1783 /* kick the interrupt handler to allocate/deallocate pools */ 1784 ibmveth_interrupt(netdev->irq, netdev); 1785 return count; 1786 } 1787 1788 1789 #define ATTR(_name, _mode) \ 1790 struct attribute veth_##_name##_attr = { \ 1791 .name = __stringify(_name), .mode = _mode, \ 1792 }; 1793 1794 static ATTR(active, 0644); 1795 static ATTR(num, 0644); 1796 static ATTR(size, 0644); 1797 1798 static struct attribute *veth_pool_attrs[] = { 1799 &veth_active_attr, 1800 &veth_num_attr, 1801 &veth_size_attr, 1802 NULL, 1803 }; 1804 1805 static const struct sysfs_ops veth_pool_ops = { 1806 .show = veth_pool_show, 1807 .store = veth_pool_store, 1808 }; 1809 1810 static struct kobj_type ktype_veth_pool = { 1811 .release = NULL, 1812 .sysfs_ops = &veth_pool_ops, 1813 .default_attrs = veth_pool_attrs, 1814 }; 1815 1816 static int ibmveth_resume(struct device *dev) 1817 { 1818 struct net_device *netdev = dev_get_drvdata(dev); 1819 ibmveth_interrupt(netdev->irq, netdev); 1820 return 0; 1821 } 1822 1823 static struct vio_device_id ibmveth_device_table[] = { 1824 { "network", "IBM,l-lan"}, 1825 { "", "" } 1826 }; 1827 MODULE_DEVICE_TABLE(vio, ibmveth_device_table); 1828 1829 static struct dev_pm_ops ibmveth_pm_ops = { 1830 .resume = ibmveth_resume 1831 }; 1832 1833 static struct vio_driver ibmveth_driver = { 1834 .id_table = ibmveth_device_table, 1835 .probe = ibmveth_probe, 1836 .remove = ibmveth_remove, 1837 .get_desired_dma = ibmveth_get_desired_dma, 1838 .name = ibmveth_driver_name, 1839 .pm = &ibmveth_pm_ops, 1840 }; 1841 1842 static int __init ibmveth_module_init(void) 1843 { 1844 printk(KERN_DEBUG "%s: %s %s\n", ibmveth_driver_name, 1845 ibmveth_driver_string, ibmveth_driver_version); 1846 1847 return vio_register_driver(&ibmveth_driver); 1848 } 1849 1850 static void __exit ibmveth_module_exit(void) 1851 { 1852 vio_unregister_driver(&ibmveth_driver); 1853 } 1854 1855 module_init(ibmveth_module_init); 1856 module_exit(ibmveth_module_exit); 1857