1 // SPDX-License-Identifier: GPL-2.0 2 /* 3 * Copyright (c) 2015 MediaTek Inc. 4 * Author: 5 * Zhigang.Wei <zhigang.wei@mediatek.com> 6 * Chunfeng.Yun <chunfeng.yun@mediatek.com> 7 */ 8 9 #include <linux/kernel.h> 10 #include <linux/module.h> 11 #include <linux/slab.h> 12 13 #include "xhci.h" 14 #include "xhci-mtk.h" 15 16 #define SSP_BW_BOUNDARY 130000 17 #define SS_BW_BOUNDARY 51000 18 /* table 5-5. High-speed Isoc Transaction Limits in usb_20 spec */ 19 #define HS_BW_BOUNDARY 6144 20 /* usb2 spec section11.18.1: at most 188 FS bytes per microframe */ 21 #define FS_PAYLOAD_MAX 188 22 #define LS_PAYLOAD_MAX 18 23 /* section 11.18.1, per fs frame */ 24 #define FS_BW_BOUNDARY 1157 25 #define LS_BW_BOUNDARY 144 26 27 /* 28 * max number of microframes for split transfer, assume extra-cs budget is 0 29 * for fs isoc in : 1 ss + 1 idle + 6 cs (roundup(1023/188)) 30 */ 31 #define TT_MICROFRAMES_MAX 8 32 /* offset from SS for fs/ls isoc/intr ep (ss + idle) */ 33 #define CS_OFFSET 2 34 35 #define DBG_BUF_EN 64 36 37 /* schedule error type */ 38 #define ESCH_SS_Y6 1001 39 #define ESCH_SS_OVERLAP 1002 40 #define ESCH_CS_OVERFLOW 1003 41 #define ESCH_BW_OVERFLOW 1004 42 #define ESCH_FIXME 1005 43 44 /* mtk scheduler bitmasks */ 45 #define EP_BPKTS(p) ((p) & 0x7f) 46 #define EP_BCSCOUNT(p) (((p) & 0x7) << 8) 47 #define EP_BBM(p) ((p) << 11) 48 #define EP_BOFFSET(p) ((p) & 0x3fff) 49 #define EP_BREPEAT(p) (((p) & 0x7fff) << 16) 50 51 static char *sch_error_string(int err_num) 52 { 53 switch (err_num) { 54 case ESCH_SS_Y6: 55 return "Can't schedule Start-Split in Y6"; 56 case ESCH_SS_OVERLAP: 57 return "Can't find a suitable Start-Split location"; 58 case ESCH_CS_OVERFLOW: 59 return "The last Complete-Split is greater than 7"; 60 case ESCH_BW_OVERFLOW: 61 return "Bandwidth exceeds the maximum limit"; 62 case ESCH_FIXME: 63 return "FIXME, to be resolved"; 64 default: 65 return "Unknown"; 66 } 67 } 68 69 static int is_fs_or_ls(enum usb_device_speed speed) 70 { 71 return speed == USB_SPEED_FULL || speed == USB_SPEED_LOW; 72 } 73 74 static const char * 75 decode_ep(struct usb_host_endpoint *ep, enum usb_device_speed speed) 76 { 77 static char buf[DBG_BUF_EN]; 78 struct usb_endpoint_descriptor *epd = &ep->desc; 79 unsigned int interval; 80 const char *unit; 81 82 interval = usb_decode_interval(epd, speed); 83 if (interval % 1000) { 84 unit = "us"; 85 } else { 86 unit = "ms"; 87 interval /= 1000; 88 } 89 90 snprintf(buf, DBG_BUF_EN, "%s ep%d%s %s, mpkt:%d, interval:%d/%d%s", 91 usb_speed_string(speed), usb_endpoint_num(epd), 92 usb_endpoint_dir_in(epd) ? "in" : "out", 93 usb_ep_type_string(usb_endpoint_type(epd)), 94 usb_endpoint_maxp(epd), epd->bInterval, interval, unit); 95 96 return buf; 97 } 98 99 static u32 get_bw_boundary(enum usb_device_speed speed) 100 { 101 u32 boundary; 102 103 switch (speed) { 104 case USB_SPEED_SUPER_PLUS: 105 boundary = SSP_BW_BOUNDARY; 106 break; 107 case USB_SPEED_SUPER: 108 boundary = SS_BW_BOUNDARY; 109 break; 110 default: 111 boundary = HS_BW_BOUNDARY; 112 break; 113 } 114 115 return boundary; 116 } 117 118 /* 119 * get the bandwidth domain which @ep belongs to. 120 * 121 * the bandwidth domain array is saved to @sch_array of struct xhci_hcd_mtk, 122 * each HS root port is treated as a single bandwidth domain, 123 * but each SS root port is treated as two bandwidth domains, one for IN eps, 124 * one for OUT eps. 125 * @real_port value is defined as follow according to xHCI spec: 126 * 1 for SSport0, ..., N+1 for SSportN, N+2 for HSport0, N+3 for HSport1, etc 127 * so the bandwidth domain array is organized as follow for simplification: 128 * SSport0-OUT, SSport0-IN, ..., SSportX-OUT, SSportX-IN, HSport0, ..., HSportY 129 */ 130 static struct mu3h_sch_bw_info * 131 get_bw_info(struct xhci_hcd_mtk *mtk, struct usb_device *udev, 132 struct usb_host_endpoint *ep) 133 { 134 struct xhci_hcd *xhci = hcd_to_xhci(mtk->hcd); 135 struct xhci_virt_device *virt_dev; 136 int bw_index; 137 138 virt_dev = xhci->devs[udev->slot_id]; 139 if (!virt_dev->real_port) { 140 WARN_ONCE(1, "%s invalid real_port\n", dev_name(&udev->dev)); 141 return NULL; 142 } 143 144 if (udev->speed >= USB_SPEED_SUPER) { 145 if (usb_endpoint_dir_out(&ep->desc)) 146 bw_index = (virt_dev->real_port - 1) * 2; 147 else 148 bw_index = (virt_dev->real_port - 1) * 2 + 1; 149 } else { 150 /* add one more for each SS port */ 151 bw_index = virt_dev->real_port + xhci->usb3_rhub.num_ports - 1; 152 } 153 154 return &mtk->sch_array[bw_index]; 155 } 156 157 static u32 get_esit(struct xhci_ep_ctx *ep_ctx) 158 { 159 u32 esit; 160 161 esit = 1 << CTX_TO_EP_INTERVAL(le32_to_cpu(ep_ctx->ep_info)); 162 if (esit > XHCI_MTK_MAX_ESIT) 163 esit = XHCI_MTK_MAX_ESIT; 164 165 return esit; 166 } 167 168 static struct mu3h_sch_tt *find_tt(struct usb_device *udev) 169 { 170 struct usb_tt *utt = udev->tt; 171 struct mu3h_sch_tt *tt, **tt_index, **ptt; 172 bool allocated_index = false; 173 174 if (!utt) 175 return NULL; /* Not below a TT */ 176 177 /* 178 * Find/create our data structure. 179 * For hubs with a single TT, we get it directly. 180 * For hubs with multiple TTs, there's an extra level of pointers. 181 */ 182 tt_index = NULL; 183 if (utt->multi) { 184 tt_index = utt->hcpriv; 185 if (!tt_index) { /* Create the index array */ 186 tt_index = kcalloc(utt->hub->maxchild, 187 sizeof(*tt_index), GFP_KERNEL); 188 if (!tt_index) 189 return ERR_PTR(-ENOMEM); 190 utt->hcpriv = tt_index; 191 allocated_index = true; 192 } 193 ptt = &tt_index[udev->ttport - 1]; 194 } else { 195 ptt = (struct mu3h_sch_tt **) &utt->hcpriv; 196 } 197 198 tt = *ptt; 199 if (!tt) { /* Create the mu3h_sch_tt */ 200 tt = kzalloc(sizeof(*tt), GFP_KERNEL); 201 if (!tt) { 202 if (allocated_index) { 203 utt->hcpriv = NULL; 204 kfree(tt_index); 205 } 206 return ERR_PTR(-ENOMEM); 207 } 208 INIT_LIST_HEAD(&tt->ep_list); 209 *ptt = tt; 210 } 211 212 return tt; 213 } 214 215 /* Release the TT above udev, if it's not in use */ 216 static void drop_tt(struct usb_device *udev) 217 { 218 struct usb_tt *utt = udev->tt; 219 struct mu3h_sch_tt *tt, **tt_index, **ptt; 220 int i, cnt; 221 222 if (!utt || !utt->hcpriv) 223 return; /* Not below a TT, or never allocated */ 224 225 cnt = 0; 226 if (utt->multi) { 227 tt_index = utt->hcpriv; 228 ptt = &tt_index[udev->ttport - 1]; 229 /* How many entries are left in tt_index? */ 230 for (i = 0; i < utt->hub->maxchild; ++i) 231 cnt += !!tt_index[i]; 232 } else { 233 tt_index = NULL; 234 ptt = (struct mu3h_sch_tt **)&utt->hcpriv; 235 } 236 237 tt = *ptt; 238 if (!tt || !list_empty(&tt->ep_list)) 239 return; /* never allocated , or still in use*/ 240 241 *ptt = NULL; 242 kfree(tt); 243 244 if (cnt == 1) { 245 utt->hcpriv = NULL; 246 kfree(tt_index); 247 } 248 } 249 250 static struct mu3h_sch_ep_info * 251 create_sch_ep(struct xhci_hcd_mtk *mtk, struct usb_device *udev, 252 struct usb_host_endpoint *ep, struct xhci_ep_ctx *ep_ctx) 253 { 254 struct mu3h_sch_ep_info *sch_ep; 255 struct mu3h_sch_bw_info *bw_info; 256 struct mu3h_sch_tt *tt = NULL; 257 u32 len; 258 259 bw_info = get_bw_info(mtk, udev, ep); 260 if (!bw_info) 261 return ERR_PTR(-ENODEV); 262 263 if (is_fs_or_ls(udev->speed)) 264 len = TT_MICROFRAMES_MAX; 265 else if ((udev->speed >= USB_SPEED_SUPER) && 266 usb_endpoint_xfer_isoc(&ep->desc)) 267 len = get_esit(ep_ctx); 268 else 269 len = 1; 270 271 sch_ep = kzalloc(struct_size(sch_ep, bw_budget_table, len), GFP_KERNEL); 272 if (!sch_ep) 273 return ERR_PTR(-ENOMEM); 274 275 if (is_fs_or_ls(udev->speed)) { 276 tt = find_tt(udev); 277 if (IS_ERR(tt)) { 278 kfree(sch_ep); 279 return ERR_PTR(-ENOMEM); 280 } 281 } 282 283 sch_ep->bw_info = bw_info; 284 sch_ep->sch_tt = tt; 285 sch_ep->ep = ep; 286 sch_ep->speed = udev->speed; 287 INIT_LIST_HEAD(&sch_ep->endpoint); 288 INIT_LIST_HEAD(&sch_ep->tt_endpoint); 289 INIT_HLIST_NODE(&sch_ep->hentry); 290 291 return sch_ep; 292 } 293 294 static void setup_sch_info(struct xhci_ep_ctx *ep_ctx, 295 struct mu3h_sch_ep_info *sch_ep) 296 { 297 u32 ep_type; 298 u32 maxpkt; 299 u32 max_burst; 300 u32 mult; 301 u32 esit_pkts; 302 u32 max_esit_payload; 303 u32 bw_per_microframe; 304 u32 *bwb_table; 305 int i; 306 307 bwb_table = sch_ep->bw_budget_table; 308 ep_type = CTX_TO_EP_TYPE(le32_to_cpu(ep_ctx->ep_info2)); 309 maxpkt = MAX_PACKET_DECODED(le32_to_cpu(ep_ctx->ep_info2)); 310 max_burst = CTX_TO_MAX_BURST(le32_to_cpu(ep_ctx->ep_info2)); 311 mult = CTX_TO_EP_MULT(le32_to_cpu(ep_ctx->ep_info)); 312 max_esit_payload = 313 (CTX_TO_MAX_ESIT_PAYLOAD_HI( 314 le32_to_cpu(ep_ctx->ep_info)) << 16) | 315 CTX_TO_MAX_ESIT_PAYLOAD(le32_to_cpu(ep_ctx->tx_info)); 316 317 sch_ep->esit = get_esit(ep_ctx); 318 sch_ep->num_esit = XHCI_MTK_MAX_ESIT / sch_ep->esit; 319 sch_ep->ep_type = ep_type; 320 sch_ep->maxpkt = maxpkt; 321 sch_ep->offset = 0; 322 sch_ep->burst_mode = 0; 323 sch_ep->repeat = 0; 324 325 if (sch_ep->speed == USB_SPEED_HIGH) { 326 sch_ep->cs_count = 0; 327 328 /* 329 * usb_20 spec section5.9 330 * a single microframe is enough for HS synchromous endpoints 331 * in a interval 332 */ 333 sch_ep->num_budget_microframes = 1; 334 335 /* 336 * xHCI spec section6.2.3.4 337 * @max_burst is the number of additional transactions 338 * opportunities per microframe 339 */ 340 sch_ep->pkts = max_burst + 1; 341 bwb_table[0] = maxpkt * sch_ep->pkts; 342 } else if (sch_ep->speed >= USB_SPEED_SUPER) { 343 /* usb3_r1 spec section4.4.7 & 4.4.8 */ 344 sch_ep->cs_count = 0; 345 sch_ep->burst_mode = 1; 346 /* 347 * some device's (d)wBytesPerInterval is set as 0, 348 * then max_esit_payload is 0, so evaluate esit_pkts from 349 * mult and burst 350 */ 351 esit_pkts = DIV_ROUND_UP(max_esit_payload, maxpkt); 352 if (esit_pkts == 0) 353 esit_pkts = (mult + 1) * (max_burst + 1); 354 355 if (ep_type == INT_IN_EP || ep_type == INT_OUT_EP) { 356 sch_ep->pkts = esit_pkts; 357 sch_ep->num_budget_microframes = 1; 358 bwb_table[0] = maxpkt * sch_ep->pkts; 359 } 360 361 if (ep_type == ISOC_IN_EP || ep_type == ISOC_OUT_EP) { 362 363 if (sch_ep->esit == 1) 364 sch_ep->pkts = esit_pkts; 365 else if (esit_pkts <= sch_ep->esit) 366 sch_ep->pkts = 1; 367 else 368 sch_ep->pkts = roundup_pow_of_two(esit_pkts) 369 / sch_ep->esit; 370 371 sch_ep->num_budget_microframes = 372 DIV_ROUND_UP(esit_pkts, sch_ep->pkts); 373 374 sch_ep->repeat = !!(sch_ep->num_budget_microframes > 1); 375 bw_per_microframe = maxpkt * sch_ep->pkts; 376 377 for (i = 0; i < sch_ep->num_budget_microframes - 1; i++) 378 bwb_table[i] = bw_per_microframe; 379 380 /* last one <= bw_per_microframe */ 381 bwb_table[i] = maxpkt * esit_pkts - i * bw_per_microframe; 382 } 383 } else if (is_fs_or_ls(sch_ep->speed)) { 384 sch_ep->pkts = 1; /* at most one packet for each microframe */ 385 386 /* 387 * @cs_count will be updated to add extra-cs when 388 * check TT for INT_OUT_EP, ISOC/INT_IN_EP type 389 * @maxpkt <= 1023; 390 */ 391 sch_ep->cs_count = DIV_ROUND_UP(maxpkt, FS_PAYLOAD_MAX); 392 sch_ep->num_budget_microframes = sch_ep->cs_count; 393 394 /* init budget table */ 395 if (ep_type == ISOC_OUT_EP) { 396 for (i = 0; i < sch_ep->cs_count - 1; i++) 397 bwb_table[i] = FS_PAYLOAD_MAX; 398 399 bwb_table[i] = maxpkt - i * FS_PAYLOAD_MAX; 400 } else if (ep_type == INT_OUT_EP) { 401 /* only first one used (maxpkt <= 64), others zero */ 402 bwb_table[0] = maxpkt; 403 } else { /* INT_IN_EP or ISOC_IN_EP */ 404 bwb_table[0] = 0; /* start split */ 405 bwb_table[1] = 0; /* idle */ 406 /* 407 * @cs_count will be updated according to cs position 408 * (add 1 or 2 extra-cs), but assume only first 409 * @num_budget_microframes elements will be used later, 410 * although in fact it does not (extra-cs budget many receive 411 * some data for IN ep); 412 * @cs_count is 1 for INT_IN_EP (maxpkt <= 64); 413 */ 414 for (i = 0; i < sch_ep->cs_count - 1; i++) 415 bwb_table[i + CS_OFFSET] = FS_PAYLOAD_MAX; 416 417 bwb_table[i + CS_OFFSET] = maxpkt - i * FS_PAYLOAD_MAX; 418 /* ss + idle */ 419 sch_ep->num_budget_microframes += CS_OFFSET; 420 } 421 } 422 } 423 424 /* Get maximum bandwidth when we schedule at offset slot. */ 425 static u32 get_max_bw(struct mu3h_sch_bw_info *sch_bw, 426 struct mu3h_sch_ep_info *sch_ep, u32 offset) 427 { 428 u32 max_bw = 0; 429 u32 bw; 430 int i, j, k; 431 432 for (i = 0; i < sch_ep->num_esit; i++) { 433 u32 base = offset + i * sch_ep->esit; 434 435 for (j = 0; j < sch_ep->num_budget_microframes; j++) { 436 k = XHCI_MTK_BW_INDEX(base + j); 437 bw = sch_bw->bus_bw[k] + sch_ep->bw_budget_table[j]; 438 if (bw > max_bw) 439 max_bw = bw; 440 } 441 } 442 return max_bw; 443 } 444 445 /* 446 * for OUT: get first SS consumed bw; 447 * for IN: get first CS consumed bw; 448 */ 449 static u16 get_fs_bw(struct mu3h_sch_ep_info *sch_ep, int offset) 450 { 451 struct mu3h_sch_tt *tt = sch_ep->sch_tt; 452 u16 fs_bw; 453 454 if (sch_ep->ep_type == ISOC_OUT_EP || sch_ep->ep_type == INT_OUT_EP) 455 fs_bw = tt->fs_bus_bw_out[XHCI_MTK_BW_INDEX(offset)]; 456 else /* skip ss + idle */ 457 fs_bw = tt->fs_bus_bw_in[XHCI_MTK_BW_INDEX(offset + CS_OFFSET)]; 458 459 return fs_bw; 460 } 461 462 static void update_bus_bw(struct mu3h_sch_bw_info *sch_bw, 463 struct mu3h_sch_ep_info *sch_ep, bool used) 464 { 465 u32 base; 466 int i, j, k; 467 468 for (i = 0; i < sch_ep->num_esit; i++) { 469 base = sch_ep->offset + i * sch_ep->esit; 470 for (j = 0; j < sch_ep->num_budget_microframes; j++) { 471 k = XHCI_MTK_BW_INDEX(base + j); 472 if (used) 473 sch_bw->bus_bw[k] += sch_ep->bw_budget_table[j]; 474 else 475 sch_bw->bus_bw[k] -= sch_ep->bw_budget_table[j]; 476 } 477 } 478 } 479 480 static int check_ls_budget_microframes(struct mu3h_sch_ep_info *sch_ep, int offset) 481 { 482 struct mu3h_sch_tt *tt = sch_ep->sch_tt; 483 int i; 484 485 if (sch_ep->speed != USB_SPEED_LOW) 486 return 0; 487 488 if (sch_ep->ep_type == INT_OUT_EP) 489 i = XHCI_MTK_BW_INDEX(offset); 490 else if (sch_ep->ep_type == INT_IN_EP) 491 i = XHCI_MTK_BW_INDEX(offset + CS_OFFSET); /* skip ss + idle */ 492 else 493 return -EINVAL; 494 495 if (tt->ls_bus_bw[i] + sch_ep->maxpkt > LS_PAYLOAD_MAX) 496 return -ESCH_BW_OVERFLOW; 497 498 return 0; 499 } 500 501 static int check_fs_budget_microframes(struct mu3h_sch_ep_info *sch_ep, int offset) 502 { 503 struct mu3h_sch_tt *tt = sch_ep->sch_tt; 504 u32 tmp; 505 int i, k; 506 507 /* 508 * for OUT eps, will transfer exactly assigned length of data, 509 * so can't allocate more than 188 bytes; 510 * but it's not for IN eps, usually it can't receive full 511 * 188 bytes in a uframe, if it not assign full 188 bytes, 512 * can add another one; 513 */ 514 for (i = 0; i < sch_ep->num_budget_microframes; i++) { 515 k = XHCI_MTK_BW_INDEX(offset + i); 516 if (sch_ep->ep_type == ISOC_OUT_EP || sch_ep->ep_type == INT_OUT_EP) 517 tmp = tt->fs_bus_bw_out[k] + sch_ep->bw_budget_table[i]; 518 else /* ep_type : ISOC IN / INTR IN */ 519 tmp = tt->fs_bus_bw_in[k]; 520 521 if (tmp > FS_PAYLOAD_MAX) 522 return -ESCH_BW_OVERFLOW; 523 } 524 525 return 0; 526 } 527 528 static int check_fs_budget_frames(struct mu3h_sch_ep_info *sch_ep, int offset) 529 { 530 struct mu3h_sch_tt *tt = sch_ep->sch_tt; 531 u32 head, tail; 532 int i, j, k; 533 534 /* bugdet scheduled may cross at most two fs frames */ 535 j = XHCI_MTK_BW_INDEX(offset) / UFRAMES_PER_FRAME; 536 k = XHCI_MTK_BW_INDEX(offset + sch_ep->num_budget_microframes - 1) / UFRAMES_PER_FRAME; 537 538 if (j != k) { 539 head = tt->fs_frame_bw[j]; 540 tail = tt->fs_frame_bw[k]; 541 } else { 542 head = tt->fs_frame_bw[j]; 543 tail = 0; 544 } 545 546 j = roundup(offset, UFRAMES_PER_FRAME); 547 for (i = 0; i < sch_ep->num_budget_microframes; i++) { 548 if ((offset + i) < j) 549 head += sch_ep->bw_budget_table[i]; 550 else 551 tail += sch_ep->bw_budget_table[i]; 552 } 553 554 if (head > FS_BW_BOUNDARY || tail > FS_BW_BOUNDARY) 555 return -ESCH_BW_OVERFLOW; 556 557 return 0; 558 } 559 560 static int check_fs_bus_bw(struct mu3h_sch_ep_info *sch_ep, int offset) 561 { 562 int i, base; 563 int ret = 0; 564 565 for (i = 0; i < sch_ep->num_esit; i++) { 566 base = offset + i * sch_ep->esit; 567 568 ret = check_ls_budget_microframes(sch_ep, base); 569 if (ret) 570 goto err; 571 572 ret = check_fs_budget_microframes(sch_ep, base); 573 if (ret) 574 goto err; 575 576 ret = check_fs_budget_frames(sch_ep, base); 577 if (ret) 578 goto err; 579 } 580 581 err: 582 return ret; 583 } 584 585 static int check_ss_and_cs(struct mu3h_sch_ep_info *sch_ep, u32 offset) 586 { 587 u32 start_ss, last_ss; 588 u32 start_cs, last_cs; 589 590 start_ss = offset % UFRAMES_PER_FRAME; 591 592 if (sch_ep->ep_type == ISOC_OUT_EP) { 593 last_ss = start_ss + sch_ep->cs_count - 1; 594 595 /* 596 * usb_20 spec section11.18: 597 * must never schedule Start-Split in Y6 598 */ 599 if (!(start_ss == 7 || last_ss < 6)) 600 return -ESCH_SS_Y6; 601 602 } else { 603 /* maxpkt <= 1023, cs <= 6 */ 604 u32 cs_count = DIV_ROUND_UP(sch_ep->maxpkt, FS_PAYLOAD_MAX); 605 606 /* 607 * usb_20 spec section11.18: 608 * must never schedule Start-Split in Y6 609 */ 610 if (start_ss == 6) 611 return -ESCH_SS_Y6; 612 613 /* one uframe for ss + one uframe for idle */ 614 start_cs = (start_ss + CS_OFFSET) % UFRAMES_PER_FRAME; 615 last_cs = start_cs + cs_count - 1; 616 if (last_cs > 7) 617 return -ESCH_CS_OVERFLOW; 618 619 /* add extra-cs */ 620 cs_count += (last_cs == 7) ? 1 : 2; 621 if (cs_count > 7) 622 cs_count = 7; /* HW limit */ 623 624 sch_ep->cs_count = cs_count; 625 626 } 627 628 return 0; 629 } 630 631 /* 632 * when isoc-out transfers 188 bytes in a uframe, and send isoc/intr's 633 * ss token in the uframe, may cause 'bit stuff error' in downstream 634 * port; 635 * when isoc-out transfer less than 188 bytes in a uframe, shall send 636 * isoc-in's ss after isoc-out's ss (but hw can't ensure the sequence, 637 * so just avoid overlap). 638 */ 639 static int check_isoc_ss_overlap(struct mu3h_sch_ep_info *sch_ep, u32 offset) 640 { 641 struct mu3h_sch_tt *tt = sch_ep->sch_tt; 642 int base; 643 int i, j, k; 644 645 if (!tt) 646 return 0; 647 648 for (i = 0; i < sch_ep->num_esit; i++) { 649 base = offset + i * sch_ep->esit; 650 651 if (sch_ep->ep_type == ISOC_OUT_EP) { 652 for (j = 0; j < sch_ep->num_budget_microframes; j++) { 653 k = XHCI_MTK_BW_INDEX(base + j); 654 if (tt->in_ss_cnt[k]) 655 return -ESCH_SS_OVERLAP; 656 } 657 } else if (sch_ep->ep_type == ISOC_IN_EP || sch_ep->ep_type == INT_IN_EP) { 658 k = XHCI_MTK_BW_INDEX(base); 659 /* only check IN's ss */ 660 if (tt->fs_bus_bw_out[k]) 661 return -ESCH_SS_OVERLAP; 662 } 663 } 664 665 return 0; 666 } 667 668 static int check_sch_tt_budget(struct mu3h_sch_ep_info *sch_ep, u32 offset) 669 { 670 int ret; 671 672 ret = check_ss_and_cs(sch_ep, offset); 673 if (ret) 674 return ret; 675 676 ret = check_isoc_ss_overlap(sch_ep, offset); 677 if (ret) 678 return ret; 679 680 return check_fs_bus_bw(sch_ep, offset); 681 } 682 683 /* allocate microframes in the ls/fs frame */ 684 static int alloc_sch_portion_of_frame(struct mu3h_sch_ep_info *sch_ep) 685 { 686 struct mu3h_sch_bw_info *sch_bw = sch_ep->bw_info; 687 const u32 bw_boundary = get_bw_boundary(sch_ep->speed); 688 u32 bw_max, fs_bw_min; 689 u32 offset, offset_min; 690 u16 fs_bw; 691 int frames; 692 int i, j; 693 int ret; 694 695 frames = sch_ep->esit / UFRAMES_PER_FRAME; 696 697 for (i = 0; i < UFRAMES_PER_FRAME; i++) { 698 fs_bw_min = FS_PAYLOAD_MAX; 699 offset_min = XHCI_MTK_MAX_ESIT; 700 701 for (j = 0; j < frames; j++) { 702 offset = (i + j * UFRAMES_PER_FRAME) % sch_ep->esit; 703 704 ret = check_sch_tt_budget(sch_ep, offset); 705 if (ret) 706 continue; 707 708 /* check hs bw domain */ 709 bw_max = get_max_bw(sch_bw, sch_ep, offset); 710 if (bw_max > bw_boundary) { 711 ret = -ESCH_BW_OVERFLOW; 712 continue; 713 } 714 715 /* use best-fit between frames */ 716 fs_bw = get_fs_bw(sch_ep, offset); 717 if (fs_bw < fs_bw_min) { 718 fs_bw_min = fs_bw; 719 offset_min = offset; 720 } 721 722 if (!fs_bw_min) 723 break; 724 } 725 726 /* use first-fit between microframes in a frame */ 727 if (offset_min < XHCI_MTK_MAX_ESIT) 728 break; 729 } 730 731 if (offset_min == XHCI_MTK_MAX_ESIT) 732 return -ESCH_BW_OVERFLOW; 733 734 sch_ep->offset = offset_min; 735 736 return 0; 737 } 738 739 static void update_sch_tt(struct mu3h_sch_ep_info *sch_ep, bool used) 740 { 741 struct mu3h_sch_tt *tt = sch_ep->sch_tt; 742 u16 *fs_bus_bw; 743 u32 base; 744 int i, j, k, f; 745 746 if (sch_ep->ep_type == ISOC_OUT_EP || sch_ep->ep_type == INT_OUT_EP) 747 fs_bus_bw = tt->fs_bus_bw_out; 748 else 749 fs_bus_bw = tt->fs_bus_bw_in; 750 751 for (i = 0; i < sch_ep->num_esit; i++) { 752 base = sch_ep->offset + i * sch_ep->esit; 753 754 for (j = 0; j < sch_ep->num_budget_microframes; j++) { 755 k = XHCI_MTK_BW_INDEX(base + j); 756 f = k / UFRAMES_PER_FRAME; 757 if (used) { 758 if (sch_ep->speed == USB_SPEED_LOW) 759 tt->ls_bus_bw[k] += (u8)sch_ep->bw_budget_table[j]; 760 761 fs_bus_bw[k] += (u16)sch_ep->bw_budget_table[j]; 762 tt->fs_frame_bw[f] += (u16)sch_ep->bw_budget_table[j]; 763 } else { 764 if (sch_ep->speed == USB_SPEED_LOW) 765 tt->ls_bus_bw[k] -= (u8)sch_ep->bw_budget_table[j]; 766 767 fs_bus_bw[k] -= (u16)sch_ep->bw_budget_table[j]; 768 tt->fs_frame_bw[f] -= (u16)sch_ep->bw_budget_table[j]; 769 } 770 } 771 772 if (sch_ep->ep_type == ISOC_IN_EP || sch_ep->ep_type == INT_IN_EP) { 773 k = XHCI_MTK_BW_INDEX(base); 774 if (used) 775 tt->in_ss_cnt[k]++; 776 else 777 tt->in_ss_cnt[k]--; 778 } 779 } 780 781 if (used) 782 list_add_tail(&sch_ep->tt_endpoint, &tt->ep_list); 783 else 784 list_del(&sch_ep->tt_endpoint); 785 } 786 787 static int load_ep_bw(struct mu3h_sch_bw_info *sch_bw, 788 struct mu3h_sch_ep_info *sch_ep, bool loaded) 789 { 790 if (sch_ep->sch_tt) 791 update_sch_tt(sch_ep, loaded); 792 793 /* update bus bandwidth info */ 794 update_bus_bw(sch_bw, sch_ep, loaded); 795 sch_ep->allocated = loaded; 796 797 return 0; 798 } 799 800 /* allocate microframes for hs/ss/ssp */ 801 static int alloc_sch_microframes(struct mu3h_sch_ep_info *sch_ep) 802 { 803 struct mu3h_sch_bw_info *sch_bw = sch_ep->bw_info; 804 const u32 bw_boundary = get_bw_boundary(sch_ep->speed); 805 u32 offset; 806 u32 worst_bw; 807 u32 min_bw = ~0; 808 int min_index = -1; 809 810 /* 811 * Search through all possible schedule microframes. 812 * and find a microframe where its worst bandwidth is minimum. 813 */ 814 for (offset = 0; offset < sch_ep->esit; offset++) { 815 816 worst_bw = get_max_bw(sch_bw, sch_ep, offset); 817 if (worst_bw > bw_boundary) 818 continue; 819 820 if (min_bw > worst_bw) { 821 min_bw = worst_bw; 822 min_index = offset; 823 } 824 } 825 826 if (min_index < 0) 827 return -ESCH_BW_OVERFLOW; 828 829 sch_ep->offset = min_index; 830 831 return 0; 832 } 833 834 static int check_sch_bw(struct mu3h_sch_ep_info *sch_ep) 835 { 836 int ret; 837 838 if (sch_ep->sch_tt) 839 ret = alloc_sch_portion_of_frame(sch_ep); 840 else 841 ret = alloc_sch_microframes(sch_ep); 842 843 if (ret) 844 return ret; 845 846 return load_ep_bw(sch_ep->bw_info, sch_ep, true); 847 } 848 849 static void destroy_sch_ep(struct xhci_hcd_mtk *mtk, struct usb_device *udev, 850 struct mu3h_sch_ep_info *sch_ep) 851 { 852 /* only release ep bw check passed by check_sch_bw() */ 853 if (sch_ep->allocated) 854 load_ep_bw(sch_ep->bw_info, sch_ep, false); 855 856 if (sch_ep->sch_tt) 857 drop_tt(udev); 858 859 list_del(&sch_ep->endpoint); 860 hlist_del(&sch_ep->hentry); 861 kfree(sch_ep); 862 } 863 864 static bool need_bw_sch(struct usb_device *udev, 865 struct usb_host_endpoint *ep) 866 { 867 bool has_tt = udev->tt && udev->tt->hub->parent; 868 869 /* only for periodic endpoints */ 870 if (usb_endpoint_xfer_control(&ep->desc) 871 || usb_endpoint_xfer_bulk(&ep->desc)) 872 return false; 873 874 /* 875 * for LS & FS periodic endpoints which its device is not behind 876 * a TT are also ignored, root-hub will schedule them directly, 877 * but need set @bpkts field of endpoint context to 1. 878 */ 879 if (is_fs_or_ls(udev->speed) && !has_tt) 880 return false; 881 882 /* skip endpoint with zero maxpkt */ 883 if (usb_endpoint_maxp(&ep->desc) == 0) 884 return false; 885 886 return true; 887 } 888 889 int xhci_mtk_sch_init(struct xhci_hcd_mtk *mtk) 890 { 891 struct xhci_hcd *xhci = hcd_to_xhci(mtk->hcd); 892 struct mu3h_sch_bw_info *sch_array; 893 int num_usb_bus; 894 895 /* ss IN and OUT are separated */ 896 num_usb_bus = xhci->usb3_rhub.num_ports * 2 + xhci->usb2_rhub.num_ports; 897 898 sch_array = kcalloc(num_usb_bus, sizeof(*sch_array), GFP_KERNEL); 899 if (sch_array == NULL) 900 return -ENOMEM; 901 902 mtk->sch_array = sch_array; 903 904 INIT_LIST_HEAD(&mtk->bw_ep_chk_list); 905 hash_init(mtk->sch_ep_hash); 906 907 return 0; 908 } 909 910 void xhci_mtk_sch_exit(struct xhci_hcd_mtk *mtk) 911 { 912 kfree(mtk->sch_array); 913 } 914 915 static int add_ep_quirk(struct usb_hcd *hcd, struct usb_device *udev, 916 struct usb_host_endpoint *ep) 917 { 918 struct xhci_hcd_mtk *mtk = hcd_to_mtk(hcd); 919 struct xhci_hcd *xhci = hcd_to_xhci(hcd); 920 struct xhci_ep_ctx *ep_ctx; 921 struct xhci_virt_device *virt_dev; 922 struct mu3h_sch_ep_info *sch_ep; 923 unsigned int ep_index; 924 925 virt_dev = xhci->devs[udev->slot_id]; 926 ep_index = xhci_get_endpoint_index(&ep->desc); 927 ep_ctx = xhci_get_ep_ctx(xhci, virt_dev->in_ctx, ep_index); 928 929 if (!need_bw_sch(udev, ep)) { 930 /* 931 * set @bpkts to 1 if it is LS or FS periodic endpoint, and its 932 * device does not connected through an external HS hub 933 */ 934 if (usb_endpoint_xfer_int(&ep->desc) 935 || usb_endpoint_xfer_isoc(&ep->desc)) 936 ep_ctx->reserved[0] = cpu_to_le32(EP_BPKTS(1)); 937 938 return 0; 939 } 940 941 xhci_dbg(xhci, "%s %s\n", __func__, decode_ep(ep, udev->speed)); 942 943 sch_ep = create_sch_ep(mtk, udev, ep, ep_ctx); 944 if (IS_ERR_OR_NULL(sch_ep)) 945 return -ENOMEM; 946 947 setup_sch_info(ep_ctx, sch_ep); 948 949 list_add_tail(&sch_ep->endpoint, &mtk->bw_ep_chk_list); 950 hash_add(mtk->sch_ep_hash, &sch_ep->hentry, (unsigned long)ep); 951 952 return 0; 953 } 954 955 static void drop_ep_quirk(struct usb_hcd *hcd, struct usb_device *udev, 956 struct usb_host_endpoint *ep) 957 { 958 struct xhci_hcd_mtk *mtk = hcd_to_mtk(hcd); 959 struct xhci_hcd *xhci = hcd_to_xhci(hcd); 960 struct mu3h_sch_ep_info *sch_ep; 961 struct hlist_node *hn; 962 963 if (!need_bw_sch(udev, ep)) 964 return; 965 966 xhci_dbg(xhci, "%s %s\n", __func__, decode_ep(ep, udev->speed)); 967 968 hash_for_each_possible_safe(mtk->sch_ep_hash, sch_ep, 969 hn, hentry, (unsigned long)ep) { 970 if (sch_ep->ep == ep) { 971 destroy_sch_ep(mtk, udev, sch_ep); 972 break; 973 } 974 } 975 } 976 977 int xhci_mtk_check_bandwidth(struct usb_hcd *hcd, struct usb_device *udev) 978 { 979 struct xhci_hcd_mtk *mtk = hcd_to_mtk(hcd); 980 struct xhci_hcd *xhci = hcd_to_xhci(hcd); 981 struct xhci_virt_device *virt_dev = xhci->devs[udev->slot_id]; 982 struct mu3h_sch_ep_info *sch_ep; 983 int ret; 984 985 xhci_dbg(xhci, "%s() udev %s\n", __func__, dev_name(&udev->dev)); 986 987 list_for_each_entry(sch_ep, &mtk->bw_ep_chk_list, endpoint) { 988 struct xhci_ep_ctx *ep_ctx; 989 struct usb_host_endpoint *ep = sch_ep->ep; 990 unsigned int ep_index = xhci_get_endpoint_index(&ep->desc); 991 992 ret = check_sch_bw(sch_ep); 993 if (ret) { 994 xhci_err(xhci, "Not enough bandwidth! (%s)\n", 995 sch_error_string(-ret)); 996 return -ENOSPC; 997 } 998 999 ep_ctx = xhci_get_ep_ctx(xhci, virt_dev->in_ctx, ep_index); 1000 ep_ctx->reserved[0] = cpu_to_le32(EP_BPKTS(sch_ep->pkts) 1001 | EP_BCSCOUNT(sch_ep->cs_count) 1002 | EP_BBM(sch_ep->burst_mode)); 1003 ep_ctx->reserved[1] = cpu_to_le32(EP_BOFFSET(sch_ep->offset) 1004 | EP_BREPEAT(sch_ep->repeat)); 1005 1006 xhci_dbg(xhci, " PKTS:%x, CSCOUNT:%x, BM:%x, OFFSET:%x, REPEAT:%x\n", 1007 sch_ep->pkts, sch_ep->cs_count, sch_ep->burst_mode, 1008 sch_ep->offset, sch_ep->repeat); 1009 } 1010 1011 ret = xhci_check_bandwidth(hcd, udev); 1012 if (!ret) 1013 list_del_init(&mtk->bw_ep_chk_list); 1014 1015 return ret; 1016 } 1017 1018 void xhci_mtk_reset_bandwidth(struct usb_hcd *hcd, struct usb_device *udev) 1019 { 1020 struct xhci_hcd_mtk *mtk = hcd_to_mtk(hcd); 1021 struct xhci_hcd *xhci = hcd_to_xhci(hcd); 1022 struct mu3h_sch_ep_info *sch_ep, *tmp; 1023 1024 xhci_dbg(xhci, "%s() udev %s\n", __func__, dev_name(&udev->dev)); 1025 1026 list_for_each_entry_safe(sch_ep, tmp, &mtk->bw_ep_chk_list, endpoint) 1027 destroy_sch_ep(mtk, udev, sch_ep); 1028 1029 xhci_reset_bandwidth(hcd, udev); 1030 } 1031 1032 int xhci_mtk_add_ep(struct usb_hcd *hcd, struct usb_device *udev, 1033 struct usb_host_endpoint *ep) 1034 { 1035 int ret; 1036 1037 ret = xhci_add_endpoint(hcd, udev, ep); 1038 if (ret) 1039 return ret; 1040 1041 if (ep->hcpriv) 1042 ret = add_ep_quirk(hcd, udev, ep); 1043 1044 return ret; 1045 } 1046 1047 int xhci_mtk_drop_ep(struct usb_hcd *hcd, struct usb_device *udev, 1048 struct usb_host_endpoint *ep) 1049 { 1050 int ret; 1051 1052 ret = xhci_drop_endpoint(hcd, udev, ep); 1053 if (ret) 1054 return ret; 1055 1056 /* needn't check @ep->hcpriv, xhci_endpoint_disable set it NULL */ 1057 drop_ep_quirk(hcd, udev, ep); 1058 1059 return 0; 1060 } 1061