1 // SPDX-License-Identifier: MIT 2 /* 3 * Copyright © 2018 Intel Corporation 4 * 5 * Author: Gaurav K Singh <gaurav.k.singh@intel.com> 6 * Manasi Navare <manasi.d.navare@intel.com> 7 */ 8 #include <linux/limits.h> 9 10 #include <drm/display/drm_dsc_helper.h> 11 #include <drm/drm_fixed.h> 12 #include <drm/drm_print.h> 13 14 #include "intel_crtc.h" 15 #include "intel_de.h" 16 #include "intel_display_types.h" 17 #include "intel_display_utils.h" 18 #include "intel_dp.h" 19 #include "intel_dsi.h" 20 #include "intel_qp_tables.h" 21 #include "intel_vdsc.h" 22 #include "intel_vdsc_regs.h" 23 24 bool intel_dsc_source_support(const struct intel_crtc_state *crtc_state) 25 { 26 struct intel_display *display = to_intel_display(crtc_state); 27 enum transcoder cpu_transcoder = crtc_state->cpu_transcoder; 28 29 if (!HAS_DSC(display)) 30 return false; 31 32 if (DISPLAY_VER(display) == 11 && cpu_transcoder == TRANSCODER_A) 33 return false; 34 35 return true; 36 } 37 38 static bool is_pipe_dsc(struct intel_crtc *crtc, enum transcoder cpu_transcoder) 39 { 40 struct intel_display *display = to_intel_display(crtc); 41 42 if (DISPLAY_VER(display) >= 12) 43 return true; 44 45 if (cpu_transcoder == TRANSCODER_EDP || 46 cpu_transcoder == TRANSCODER_DSI_0 || 47 cpu_transcoder == TRANSCODER_DSI_1) 48 return false; 49 50 /* There's no pipe A DSC engine on ICL */ 51 drm_WARN_ON(display->drm, crtc->pipe == PIPE_A); 52 53 return true; 54 } 55 56 static void 57 intel_vdsc_set_min_max_qp(struct drm_dsc_config *vdsc_cfg, int buf, 58 int bpp) 59 { 60 int bpc = vdsc_cfg->bits_per_component; 61 62 /* Read range_minqp and range_max_qp from qp tables */ 63 vdsc_cfg->rc_range_params[buf].range_min_qp = 64 intel_lookup_range_min_qp(bpc, buf, bpp, vdsc_cfg->native_420); 65 vdsc_cfg->rc_range_params[buf].range_max_qp = 66 intel_lookup_range_max_qp(bpc, buf, bpp, vdsc_cfg->native_420); 67 } 68 69 static int 70 get_range_bpg_offset(int bpp_low, int offset_low, int bpp_high, int offset_high, int bpp) 71 { 72 return offset_low + DIV_ROUND_UP((offset_high - offset_low) * (bpp - bpp_low), 73 (bpp_low - bpp_high)); 74 } 75 76 /* 77 * We are using the method provided in DSC 1.2a C-Model in codec_main.c 78 * Above method use a common formula to derive values for any combination of DSC 79 * variables. The formula approach may yield slight differences in the derived PPS 80 * parameters from the original parameter sets. These differences are not consequential 81 * to the coding performance because all parameter sets have been shown to produce 82 * visually lossless quality (provides the same PPS values as 83 * DSCParameterValuesVESA V1-2 spreadsheet). 84 */ 85 static void 86 calculate_rc_params(struct drm_dsc_config *vdsc_cfg) 87 { 88 int bpp = fxp_q4_to_int(vdsc_cfg->bits_per_pixel); 89 int bpc = vdsc_cfg->bits_per_component; 90 int qp_bpc_modifier = (bpc - 8) * 2; 91 int uncompressed_bpg_rate; 92 int first_line_bpg_offset; 93 u32 buf_i, bpp_i; 94 95 if (vdsc_cfg->slice_height >= 8) 96 first_line_bpg_offset = 97 12 + (9 * min(34, vdsc_cfg->slice_height - 8)) / 100; 98 else 99 first_line_bpg_offset = 2 * (vdsc_cfg->slice_height - 1); 100 101 uncompressed_bpg_rate = (3 * bpc + (vdsc_cfg->convert_rgb ? 0 : 2)) * 3; 102 vdsc_cfg->first_line_bpg_offset = clamp(first_line_bpg_offset, 0, 103 uncompressed_bpg_rate - 3 * bpp); 104 105 /* 106 * According to DSC 1.2 spec in Section 4.1 if native_420 is set: 107 * -second_line_bpg_offset is 12 in general and equal to 2*(slice_height-1) if slice 108 * height < 8. 109 * -second_line_offset_adj is 512 as shown by empirical values to yield best chroma 110 * preservation in second line. 111 * -nsl_bpg_offset is calculated as second_line_offset/slice_height -1 then rounded 112 * up to 16 fractional bits, we left shift second line offset by 11 to preserve 11 113 * fractional bits. 114 */ 115 if (vdsc_cfg->native_420) { 116 if (vdsc_cfg->slice_height >= 8) 117 vdsc_cfg->second_line_bpg_offset = 12; 118 else 119 vdsc_cfg->second_line_bpg_offset = 120 2 * (vdsc_cfg->slice_height - 1); 121 122 vdsc_cfg->second_line_offset_adj = 512; 123 vdsc_cfg->nsl_bpg_offset = DIV_ROUND_UP(vdsc_cfg->second_line_bpg_offset << 11, 124 vdsc_cfg->slice_height - 1); 125 } 126 127 if (bpp >= 12) 128 vdsc_cfg->initial_offset = 2048; 129 else if (bpp >= 10) 130 vdsc_cfg->initial_offset = 5632 - DIV_ROUND_UP(((bpp - 10) * 3584), 2); 131 else if (bpp >= 8) 132 vdsc_cfg->initial_offset = 6144 - DIV_ROUND_UP(((bpp - 8) * 512), 2); 133 else 134 vdsc_cfg->initial_offset = 6144; 135 136 /* initial_xmit_delay = rc_model_size/2/compression_bpp */ 137 vdsc_cfg->initial_xmit_delay = DIV_ROUND_UP(DSC_RC_MODEL_SIZE_CONST, 2 * bpp); 138 139 vdsc_cfg->flatness_min_qp = 3 + qp_bpc_modifier; 140 vdsc_cfg->flatness_max_qp = 12 + qp_bpc_modifier; 141 142 vdsc_cfg->rc_quant_incr_limit0 = 11 + qp_bpc_modifier; 143 vdsc_cfg->rc_quant_incr_limit1 = 11 + qp_bpc_modifier; 144 145 if (vdsc_cfg->native_420) { 146 static const s8 ofs_und4[] = { 147 2, 0, 0, -2, -4, -6, -8, -8, -8, -10, -10, -12, -12, -12, -12 148 }; 149 static const s8 ofs_und5[] = { 150 2, 0, 0, -2, -4, -6, -8, -8, -8, -10, -10, -10, -12, -12, -12 151 }; 152 static const s8 ofs_und6[] = { 153 2, 0, 0, -2, -4, -6, -8, -8, -8, -10, -10, -10, -12, -12, -12 154 }; 155 static const s8 ofs_und8[] = { 156 10, 8, 6, 4, 2, 0, -2, -4, -6, -8, -10, -10, -12, -12, -12 157 }; 158 /* 159 * For 420 format since bits_per_pixel (bpp) is set to target bpp * 2, 160 * QP table values for target bpp 4.0 to 4.4375 (rounded to 4.0) are 161 * actually for bpp 8 to 8.875 (rounded to 4.0 * 2 i.e 8). 162 * Similarly values for target bpp 4.5 to 4.8375 (rounded to 4.5) 163 * are for bpp 9 to 9.875 (rounded to 4.5 * 2 i.e 9), and so on. 164 */ 165 bpp_i = bpp - 8; 166 for (buf_i = 0; buf_i < DSC_NUM_BUF_RANGES; buf_i++) { 167 u8 range_bpg_offset; 168 169 intel_vdsc_set_min_max_qp(vdsc_cfg, buf_i, bpp_i); 170 171 /* Calculate range_bpg_offset */ 172 if (bpp <= 8) 173 range_bpg_offset = ofs_und4[buf_i]; 174 else if (bpp <= 10) 175 range_bpg_offset = get_range_bpg_offset(8, ofs_und4[buf_i], 176 10, ofs_und5[buf_i], bpp); 177 else if (bpp <= 12) 178 range_bpg_offset = get_range_bpg_offset(10, ofs_und5[buf_i], 179 12, ofs_und6[buf_i], bpp); 180 else if (bpp <= 16) 181 range_bpg_offset = get_range_bpg_offset(12, ofs_und6[buf_i], 182 16, ofs_und8[buf_i], bpp); 183 else 184 range_bpg_offset = ofs_und8[buf_i]; 185 186 vdsc_cfg->rc_range_params[buf_i].range_bpg_offset = 187 range_bpg_offset & DSC_RANGE_BPG_OFFSET_MASK; 188 } 189 } else { 190 /* fractional bpp part * 10000 (for precision up to 4 decimal places) */ 191 int fractional_bits = fxp_q4_to_frac(vdsc_cfg->bits_per_pixel); 192 193 static const s8 ofs_und6[] = { 194 0, -2, -2, -4, -6, -6, -8, -8, -8, -10, -10, -12, -12, -12, -12 195 }; 196 static const s8 ofs_und8[] = { 197 2, 0, 0, -2, -4, -6, -8, -8, -8, -10, -10, -10, -12, -12, -12 198 }; 199 static const s8 ofs_und12[] = { 200 2, 0, 0, -2, -4, -6, -8, -8, -8, -10, -10, -10, -12, -12, -12 201 }; 202 static const s8 ofs_und15[] = { 203 10, 8, 6, 4, 2, 0, -2, -4, -6, -8, -10, -10, -12, -12, -12 204 }; 205 206 /* 207 * QP table rows have values in increment of 0.5. 208 * So 6.0 bpp to 6.4375 will have index 0, 6.5 to 6.9375 will have index 1, 209 * and so on. 210 * 0.5 fractional part with 4 decimal precision becomes 5000 211 */ 212 bpp_i = ((bpp - 6) + (fractional_bits < 5000 ? 0 : 1)); 213 214 for (buf_i = 0; buf_i < DSC_NUM_BUF_RANGES; buf_i++) { 215 u8 range_bpg_offset; 216 217 intel_vdsc_set_min_max_qp(vdsc_cfg, buf_i, bpp_i); 218 219 /* Calculate range_bpg_offset */ 220 if (bpp <= 6) 221 range_bpg_offset = ofs_und6[buf_i]; 222 else if (bpp <= 8) 223 range_bpg_offset = get_range_bpg_offset(6, ofs_und6[buf_i], 224 8, ofs_und8[buf_i], bpp); 225 else if (bpp <= 12) 226 range_bpg_offset = get_range_bpg_offset(8, ofs_und8[buf_i], 227 12, ofs_und12[buf_i], bpp); 228 else if (bpp <= 15) 229 range_bpg_offset = get_range_bpg_offset(12, ofs_und12[buf_i], 230 15, ofs_und15[buf_i], bpp); 231 else 232 range_bpg_offset = ofs_und15[buf_i]; 233 234 vdsc_cfg->rc_range_params[buf_i].range_bpg_offset = 235 range_bpg_offset & DSC_RANGE_BPG_OFFSET_MASK; 236 } 237 } 238 } 239 240 static int intel_dsc_slice_dimensions_valid(struct intel_crtc_state *pipe_config, 241 struct drm_dsc_config *vdsc_cfg) 242 { 243 if (pipe_config->output_format == INTEL_OUTPUT_FORMAT_RGB || 244 pipe_config->output_format == INTEL_OUTPUT_FORMAT_YCBCR444) { 245 if (vdsc_cfg->slice_height > 4095) 246 return -EINVAL; 247 if (vdsc_cfg->slice_height * vdsc_cfg->slice_width < 15000) 248 return -EINVAL; 249 } else if (pipe_config->output_format == INTEL_OUTPUT_FORMAT_YCBCR420) { 250 if (vdsc_cfg->slice_width % 2) 251 return -EINVAL; 252 if (vdsc_cfg->slice_height % 2) 253 return -EINVAL; 254 if (vdsc_cfg->slice_height > 4094) 255 return -EINVAL; 256 if (vdsc_cfg->slice_height * vdsc_cfg->slice_width < 30000) 257 return -EINVAL; 258 } 259 260 return 0; 261 } 262 263 static bool is_dsi_dsc_1_1(struct intel_crtc_state *crtc_state) 264 { 265 struct drm_dsc_config *vdsc_cfg = &crtc_state->dsc.config; 266 267 return vdsc_cfg->dsc_version_major == 1 && 268 vdsc_cfg->dsc_version_minor == 1 && 269 intel_crtc_has_type(crtc_state, INTEL_OUTPUT_DSI); 270 } 271 272 int intel_dsc_compute_params(struct intel_crtc_state *pipe_config) 273 { 274 struct intel_display *display = to_intel_display(pipe_config); 275 struct drm_dsc_config *vdsc_cfg = &pipe_config->dsc.config; 276 u16 compressed_bpp = fxp_q4_to_int(pipe_config->dsc.compressed_bpp_x16); 277 int err; 278 int ret; 279 280 vdsc_cfg->pic_width = pipe_config->hw.adjusted_mode.crtc_hdisplay; 281 vdsc_cfg->slice_width = DIV_ROUND_UP(vdsc_cfg->pic_width, 282 pipe_config->dsc.slice_count); 283 284 err = intel_dsc_slice_dimensions_valid(pipe_config, vdsc_cfg); 285 286 if (err) { 287 drm_dbg_kms(display->drm, "Slice dimension requirements not met\n"); 288 return err; 289 } 290 291 /* 292 * According to DSC 1.2 specs if colorspace is YCbCr then convert_rgb is 0 293 * else 1 294 */ 295 vdsc_cfg->convert_rgb = pipe_config->output_format != INTEL_OUTPUT_FORMAT_YCBCR420 && 296 pipe_config->output_format != INTEL_OUTPUT_FORMAT_YCBCR444; 297 298 if (DISPLAY_VER(display) >= 14 && 299 pipe_config->output_format == INTEL_OUTPUT_FORMAT_YCBCR420) 300 vdsc_cfg->native_420 = true; 301 /* We do not support YcBCr422 as of now */ 302 vdsc_cfg->native_422 = false; 303 vdsc_cfg->simple_422 = false; 304 /* Gen 11 does not support VBR */ 305 vdsc_cfg->vbr_enable = false; 306 307 vdsc_cfg->bits_per_pixel = pipe_config->dsc.compressed_bpp_x16; 308 309 /* 310 * According to DSC 1.2 specs in Section 4.1 if native_420 is set 311 * we need to double the current bpp. 312 */ 313 if (vdsc_cfg->native_420) 314 vdsc_cfg->bits_per_pixel <<= 1; 315 316 vdsc_cfg->bits_per_component = pipe_config->pipe_bpp / 3; 317 318 if (vdsc_cfg->bits_per_component < 8) { 319 drm_dbg_kms(display->drm, "DSC bpc requirements not met bpc: %d\n", 320 vdsc_cfg->bits_per_component); 321 return -EINVAL; 322 } 323 324 drm_dsc_set_rc_buf_thresh(vdsc_cfg); 325 326 /* 327 * From XE_LPD onwards we supports compression bpps in steps of 1 328 * upto uncompressed bpp-1, hence add calculations for all the rc 329 * parameters 330 * 331 * We don't want to calculate all rc parameters when the panel 332 * is MIPI DSI and it's using DSC 1.1. The reason being that some 333 * DSI panels vendors have hardcoded PPS params in the VBT causing 334 * the parameters sent from the source which are derived through 335 * interpolation to differ from the params the panel expects. 336 * This causes a noise in the display. 337 * Furthermore for DSI panels we are currently using bits_per_pixel 338 * (compressed bpp) hardcoded from VBT, (unlike other encoders where we 339 * find the optimum compressed bpp) so dont need to rely on interpolation, 340 * as we can get the required rc parameters from the tables. 341 */ 342 if (DISPLAY_VER(display) >= 13 && !is_dsi_dsc_1_1(pipe_config)) { 343 calculate_rc_params(vdsc_cfg); 344 } else { 345 if ((compressed_bpp == 8 || 346 compressed_bpp == 12) && 347 (vdsc_cfg->bits_per_component == 8 || 348 vdsc_cfg->bits_per_component == 10 || 349 vdsc_cfg->bits_per_component == 12)) 350 ret = drm_dsc_setup_rc_params(vdsc_cfg, DRM_DSC_1_1_PRE_SCR); 351 else 352 ret = drm_dsc_setup_rc_params(vdsc_cfg, DRM_DSC_1_2_444); 353 354 if (ret) 355 return ret; 356 } 357 358 /* 359 * BitsPerComponent value determines mux_word_size: 360 * When BitsPerComponent is less than or 10bpc, muxWordSize will be equal to 361 * 48 bits otherwise 64 362 */ 363 if (vdsc_cfg->bits_per_component <= 10) 364 vdsc_cfg->mux_word_size = DSC_MUX_WORD_SIZE_8_10_BPC; 365 else 366 vdsc_cfg->mux_word_size = DSC_MUX_WORD_SIZE_12_BPC; 367 368 /* InitialScaleValue is a 6 bit value with 3 fractional bits (U3.3) */ 369 vdsc_cfg->initial_scale_value = (vdsc_cfg->rc_model_size << 3) / 370 (vdsc_cfg->rc_model_size - vdsc_cfg->initial_offset); 371 372 return 0; 373 } 374 375 void intel_dsc_enable_on_crtc(struct intel_crtc_state *crtc_state) 376 { 377 crtc_state->dsc.compression_enabled_on_link = true; 378 crtc_state->dsc.compression_enable = true; 379 } 380 381 bool intel_dsc_enabled_on_link(const struct intel_crtc_state *crtc_state) 382 { 383 struct intel_display *display = to_intel_display(crtc_state); 384 385 drm_WARN_ON(display->drm, crtc_state->dsc.compression_enable && 386 !crtc_state->dsc.compression_enabled_on_link); 387 388 return crtc_state->dsc.compression_enabled_on_link; 389 } 390 391 enum intel_display_power_domain 392 intel_dsc_power_domain(struct intel_crtc *crtc, enum transcoder cpu_transcoder) 393 { 394 struct intel_display *display = to_intel_display(crtc); 395 enum pipe pipe = crtc->pipe; 396 397 /* 398 * VDSC/joining uses a separate power well, PW2, and requires 399 * POWER_DOMAIN_TRANSCODER_VDSC_PW2 power domain in two cases: 400 * 401 * - ICL eDP/DSI transcoder 402 * - Display version 12 (except RKL) pipe A 403 * 404 * For any other pipe, VDSC/joining uses the power well associated with 405 * the pipe in use. Hence another reference on the pipe power domain 406 * will suffice. (Except no VDSC/joining on ICL pipe A.) 407 */ 408 if (DISPLAY_VER(display) == 12 && !display->platform.rocketlake && 409 pipe == PIPE_A) 410 return POWER_DOMAIN_TRANSCODER_VDSC_PW2; 411 else if (is_pipe_dsc(crtc, cpu_transcoder)) 412 return POWER_DOMAIN_PIPE(pipe); 413 else 414 return POWER_DOMAIN_TRANSCODER_VDSC_PW2; 415 } 416 417 static int intel_dsc_get_vdsc_per_pipe(const struct intel_crtc_state *crtc_state) 418 { 419 return crtc_state->dsc.num_streams; 420 } 421 422 int intel_dsc_get_num_vdsc_instances(const struct intel_crtc_state *crtc_state) 423 { 424 int num_vdsc_instances = intel_dsc_get_vdsc_per_pipe(crtc_state); 425 int num_joined_pipes = intel_crtc_num_joined_pipes(crtc_state); 426 427 num_vdsc_instances *= num_joined_pipes; 428 429 return num_vdsc_instances; 430 } 431 432 static void intel_dsc_get_pps_reg(const struct intel_crtc_state *crtc_state, int pps, 433 i915_reg_t *dsc_reg, int dsc_reg_num) 434 { 435 struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc); 436 enum transcoder cpu_transcoder = crtc_state->cpu_transcoder; 437 enum pipe pipe = crtc->pipe; 438 bool pipe_dsc; 439 440 pipe_dsc = is_pipe_dsc(crtc, cpu_transcoder); 441 442 if (dsc_reg_num >= 4) 443 MISSING_CASE(dsc_reg_num); 444 if (dsc_reg_num >= 3) 445 dsc_reg[2] = BMG_DSC2_PPS(pipe, pps); 446 if (dsc_reg_num >= 2) 447 dsc_reg[1] = pipe_dsc ? ICL_DSC1_PPS(pipe, pps) : DSCC_PPS(pps); 448 if (dsc_reg_num >= 1) 449 dsc_reg[0] = pipe_dsc ? ICL_DSC0_PPS(pipe, pps) : DSCA_PPS(pps); 450 } 451 452 static void intel_dsc_pps_write(const struct intel_crtc_state *crtc_state, 453 int pps, u32 pps_val) 454 { 455 struct intel_display *display = to_intel_display(crtc_state); 456 i915_reg_t dsc_reg[3]; 457 int i, vdsc_per_pipe, dsc_reg_num; 458 459 vdsc_per_pipe = intel_dsc_get_vdsc_per_pipe(crtc_state); 460 dsc_reg_num = min_t(int, ARRAY_SIZE(dsc_reg), vdsc_per_pipe); 461 462 drm_WARN_ON_ONCE(display->drm, dsc_reg_num < vdsc_per_pipe); 463 464 intel_dsc_get_pps_reg(crtc_state, pps, dsc_reg, dsc_reg_num); 465 466 for (i = 0; i < dsc_reg_num; i++) 467 intel_de_write(display, dsc_reg[i], pps_val); 468 } 469 470 static void intel_dsc_pps_configure(const struct intel_crtc_state *crtc_state) 471 { 472 struct intel_display *display = to_intel_display(crtc_state); 473 struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc); 474 const struct drm_dsc_config *vdsc_cfg = &crtc_state->dsc.config; 475 enum transcoder cpu_transcoder = crtc_state->cpu_transcoder; 476 enum pipe pipe = crtc->pipe; 477 u32 pps_val; 478 u32 rc_buf_thresh_dword[4]; 479 u32 rc_range_params_dword[8]; 480 int i = 0; 481 int num_vdsc_instances = intel_dsc_get_num_vdsc_instances(crtc_state); 482 int vdsc_instances_per_pipe = intel_dsc_get_vdsc_per_pipe(crtc_state); 483 484 /* PPS 0 */ 485 pps_val = DSC_PPS0_VER_MAJOR(1) | 486 DSC_PPS0_VER_MINOR(vdsc_cfg->dsc_version_minor) | 487 DSC_PPS0_BPC(vdsc_cfg->bits_per_component) | 488 DSC_PPS0_LINE_BUF_DEPTH(vdsc_cfg->line_buf_depth); 489 if (vdsc_cfg->dsc_version_minor == 2) { 490 pps_val |= DSC_PPS0_ALT_ICH_SEL; 491 if (vdsc_cfg->native_420) 492 pps_val |= DSC_PPS0_NATIVE_420_ENABLE; 493 if (vdsc_cfg->native_422) 494 pps_val |= DSC_PPS0_NATIVE_422_ENABLE; 495 } 496 if (vdsc_cfg->block_pred_enable) 497 pps_val |= DSC_PPS0_BLOCK_PREDICTION; 498 if (vdsc_cfg->convert_rgb) 499 pps_val |= DSC_PPS0_COLOR_SPACE_CONVERSION; 500 if (vdsc_cfg->simple_422) 501 pps_val |= DSC_PPS0_422_ENABLE; 502 if (vdsc_cfg->vbr_enable) 503 pps_val |= DSC_PPS0_VBR_ENABLE; 504 intel_dsc_pps_write(crtc_state, 0, pps_val); 505 506 /* PPS 1 */ 507 pps_val = DSC_PPS1_BPP(vdsc_cfg->bits_per_pixel); 508 intel_dsc_pps_write(crtc_state, 1, pps_val); 509 510 /* PPS 2 */ 511 pps_val = DSC_PPS2_PIC_HEIGHT(vdsc_cfg->pic_height) | 512 DSC_PPS2_PIC_WIDTH(vdsc_cfg->pic_width / num_vdsc_instances); 513 intel_dsc_pps_write(crtc_state, 2, pps_val); 514 515 /* PPS 3 */ 516 pps_val = DSC_PPS3_SLICE_HEIGHT(vdsc_cfg->slice_height) | 517 DSC_PPS3_SLICE_WIDTH(vdsc_cfg->slice_width); 518 intel_dsc_pps_write(crtc_state, 3, pps_val); 519 520 /* PPS 4 */ 521 pps_val = DSC_PPS4_INITIAL_XMIT_DELAY(vdsc_cfg->initial_xmit_delay) | 522 DSC_PPS4_INITIAL_DEC_DELAY(vdsc_cfg->initial_dec_delay); 523 intel_dsc_pps_write(crtc_state, 4, pps_val); 524 525 /* PPS 5 */ 526 pps_val = DSC_PPS5_SCALE_INC_INT(vdsc_cfg->scale_increment_interval) | 527 DSC_PPS5_SCALE_DEC_INT(vdsc_cfg->scale_decrement_interval); 528 intel_dsc_pps_write(crtc_state, 5, pps_val); 529 530 /* PPS 6 */ 531 pps_val = DSC_PPS6_INITIAL_SCALE_VALUE(vdsc_cfg->initial_scale_value) | 532 DSC_PPS6_FIRST_LINE_BPG_OFFSET(vdsc_cfg->first_line_bpg_offset) | 533 DSC_PPS6_FLATNESS_MIN_QP(vdsc_cfg->flatness_min_qp) | 534 DSC_PPS6_FLATNESS_MAX_QP(vdsc_cfg->flatness_max_qp); 535 intel_dsc_pps_write(crtc_state, 6, pps_val); 536 537 /* PPS 7 */ 538 pps_val = DSC_PPS7_SLICE_BPG_OFFSET(vdsc_cfg->slice_bpg_offset) | 539 DSC_PPS7_NFL_BPG_OFFSET(vdsc_cfg->nfl_bpg_offset); 540 intel_dsc_pps_write(crtc_state, 7, pps_val); 541 542 /* PPS 8 */ 543 pps_val = DSC_PPS8_FINAL_OFFSET(vdsc_cfg->final_offset) | 544 DSC_PPS8_INITIAL_OFFSET(vdsc_cfg->initial_offset); 545 intel_dsc_pps_write(crtc_state, 8, pps_val); 546 547 /* PPS 9 */ 548 pps_val = DSC_PPS9_RC_MODEL_SIZE(vdsc_cfg->rc_model_size) | 549 DSC_PPS9_RC_EDGE_FACTOR(DSC_RC_EDGE_FACTOR_CONST); 550 intel_dsc_pps_write(crtc_state, 9, pps_val); 551 552 /* PPS 10 */ 553 pps_val = DSC_PPS10_RC_QUANT_INC_LIMIT0(vdsc_cfg->rc_quant_incr_limit0) | 554 DSC_PPS10_RC_QUANT_INC_LIMIT1(vdsc_cfg->rc_quant_incr_limit1) | 555 DSC_PPS10_RC_TARGET_OFF_HIGH(DSC_RC_TGT_OFFSET_HI_CONST) | 556 DSC_PPS10_RC_TARGET_OFF_LOW(DSC_RC_TGT_OFFSET_LO_CONST); 557 intel_dsc_pps_write(crtc_state, 10, pps_val); 558 559 /* PPS 16 */ 560 pps_val = DSC_PPS16_SLICE_CHUNK_SIZE(vdsc_cfg->slice_chunk_size) | 561 DSC_PPS16_SLICE_PER_LINE((vdsc_cfg->pic_width / num_vdsc_instances) / 562 vdsc_cfg->slice_width) | 563 DSC_PPS16_SLICE_ROW_PER_FRAME(vdsc_cfg->pic_height / 564 vdsc_cfg->slice_height); 565 intel_dsc_pps_write(crtc_state, 16, pps_val); 566 567 if (DISPLAY_VER(display) >= 14) { 568 /* PPS 17 */ 569 pps_val = DSC_PPS17_SL_BPG_OFFSET(vdsc_cfg->second_line_bpg_offset); 570 intel_dsc_pps_write(crtc_state, 17, pps_val); 571 572 /* PPS 18 */ 573 pps_val = DSC_PPS18_NSL_BPG_OFFSET(vdsc_cfg->nsl_bpg_offset) | 574 DSC_PPS18_SL_OFFSET_ADJ(vdsc_cfg->second_line_offset_adj); 575 intel_dsc_pps_write(crtc_state, 18, pps_val); 576 } 577 578 /* Populate the RC_BUF_THRESH registers */ 579 memset(rc_buf_thresh_dword, 0, sizeof(rc_buf_thresh_dword)); 580 for (i = 0; i < DSC_NUM_BUF_RANGES - 1; i++) 581 rc_buf_thresh_dword[i / 4] |= 582 (u32)(vdsc_cfg->rc_buf_thresh[i] << 583 BITS_PER_BYTE * (i % 4)); 584 if (!is_pipe_dsc(crtc, cpu_transcoder)) { 585 intel_de_write(display, DSCA_RC_BUF_THRESH_0, 586 rc_buf_thresh_dword[0]); 587 intel_de_write(display, DSCA_RC_BUF_THRESH_0_UDW, 588 rc_buf_thresh_dword[1]); 589 intel_de_write(display, DSCA_RC_BUF_THRESH_1, 590 rc_buf_thresh_dword[2]); 591 intel_de_write(display, DSCA_RC_BUF_THRESH_1_UDW, 592 rc_buf_thresh_dword[3]); 593 if (vdsc_instances_per_pipe > 1) { 594 intel_de_write(display, DSCC_RC_BUF_THRESH_0, 595 rc_buf_thresh_dword[0]); 596 intel_de_write(display, DSCC_RC_BUF_THRESH_0_UDW, 597 rc_buf_thresh_dword[1]); 598 intel_de_write(display, DSCC_RC_BUF_THRESH_1, 599 rc_buf_thresh_dword[2]); 600 intel_de_write(display, DSCC_RC_BUF_THRESH_1_UDW, 601 rc_buf_thresh_dword[3]); 602 } 603 } else { 604 intel_de_write(display, ICL_DSC0_RC_BUF_THRESH_0(pipe), 605 rc_buf_thresh_dword[0]); 606 intel_de_write(display, ICL_DSC0_RC_BUF_THRESH_0_UDW(pipe), 607 rc_buf_thresh_dword[1]); 608 intel_de_write(display, ICL_DSC0_RC_BUF_THRESH_1(pipe), 609 rc_buf_thresh_dword[2]); 610 intel_de_write(display, ICL_DSC0_RC_BUF_THRESH_1_UDW(pipe), 611 rc_buf_thresh_dword[3]); 612 if (vdsc_instances_per_pipe > 1) { 613 intel_de_write(display, 614 ICL_DSC1_RC_BUF_THRESH_0(pipe), 615 rc_buf_thresh_dword[0]); 616 intel_de_write(display, 617 ICL_DSC1_RC_BUF_THRESH_0_UDW(pipe), 618 rc_buf_thresh_dword[1]); 619 intel_de_write(display, 620 ICL_DSC1_RC_BUF_THRESH_1(pipe), 621 rc_buf_thresh_dword[2]); 622 intel_de_write(display, 623 ICL_DSC1_RC_BUF_THRESH_1_UDW(pipe), 624 rc_buf_thresh_dword[3]); 625 } 626 } 627 628 /* Populate the RC_RANGE_PARAMETERS registers */ 629 memset(rc_range_params_dword, 0, sizeof(rc_range_params_dword)); 630 for (i = 0; i < DSC_NUM_BUF_RANGES; i++) 631 rc_range_params_dword[i / 2] |= 632 (u32)(((vdsc_cfg->rc_range_params[i].range_bpg_offset << 633 RC_BPG_OFFSET_SHIFT) | 634 (vdsc_cfg->rc_range_params[i].range_max_qp << 635 RC_MAX_QP_SHIFT) | 636 (vdsc_cfg->rc_range_params[i].range_min_qp << 637 RC_MIN_QP_SHIFT)) << 16 * (i % 2)); 638 if (!is_pipe_dsc(crtc, cpu_transcoder)) { 639 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_0, 640 rc_range_params_dword[0]); 641 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_0_UDW, 642 rc_range_params_dword[1]); 643 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_1, 644 rc_range_params_dword[2]); 645 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_1_UDW, 646 rc_range_params_dword[3]); 647 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_2, 648 rc_range_params_dword[4]); 649 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_2_UDW, 650 rc_range_params_dword[5]); 651 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_3, 652 rc_range_params_dword[6]); 653 intel_de_write(display, DSCA_RC_RANGE_PARAMETERS_3_UDW, 654 rc_range_params_dword[7]); 655 if (vdsc_instances_per_pipe > 1) { 656 intel_de_write(display, DSCC_RC_RANGE_PARAMETERS_0, 657 rc_range_params_dword[0]); 658 intel_de_write(display, 659 DSCC_RC_RANGE_PARAMETERS_0_UDW, 660 rc_range_params_dword[1]); 661 intel_de_write(display, DSCC_RC_RANGE_PARAMETERS_1, 662 rc_range_params_dword[2]); 663 intel_de_write(display, 664 DSCC_RC_RANGE_PARAMETERS_1_UDW, 665 rc_range_params_dword[3]); 666 intel_de_write(display, DSCC_RC_RANGE_PARAMETERS_2, 667 rc_range_params_dword[4]); 668 intel_de_write(display, 669 DSCC_RC_RANGE_PARAMETERS_2_UDW, 670 rc_range_params_dword[5]); 671 intel_de_write(display, DSCC_RC_RANGE_PARAMETERS_3, 672 rc_range_params_dword[6]); 673 intel_de_write(display, 674 DSCC_RC_RANGE_PARAMETERS_3_UDW, 675 rc_range_params_dword[7]); 676 } 677 } else { 678 intel_de_write(display, ICL_DSC0_RC_RANGE_PARAMETERS_0(pipe), 679 rc_range_params_dword[0]); 680 intel_de_write(display, 681 ICL_DSC0_RC_RANGE_PARAMETERS_0_UDW(pipe), 682 rc_range_params_dword[1]); 683 intel_de_write(display, ICL_DSC0_RC_RANGE_PARAMETERS_1(pipe), 684 rc_range_params_dword[2]); 685 intel_de_write(display, 686 ICL_DSC0_RC_RANGE_PARAMETERS_1_UDW(pipe), 687 rc_range_params_dword[3]); 688 intel_de_write(display, ICL_DSC0_RC_RANGE_PARAMETERS_2(pipe), 689 rc_range_params_dword[4]); 690 intel_de_write(display, 691 ICL_DSC0_RC_RANGE_PARAMETERS_2_UDW(pipe), 692 rc_range_params_dword[5]); 693 intel_de_write(display, ICL_DSC0_RC_RANGE_PARAMETERS_3(pipe), 694 rc_range_params_dword[6]); 695 intel_de_write(display, 696 ICL_DSC0_RC_RANGE_PARAMETERS_3_UDW(pipe), 697 rc_range_params_dword[7]); 698 if (vdsc_instances_per_pipe > 1) { 699 intel_de_write(display, 700 ICL_DSC1_RC_RANGE_PARAMETERS_0(pipe), 701 rc_range_params_dword[0]); 702 intel_de_write(display, 703 ICL_DSC1_RC_RANGE_PARAMETERS_0_UDW(pipe), 704 rc_range_params_dword[1]); 705 intel_de_write(display, 706 ICL_DSC1_RC_RANGE_PARAMETERS_1(pipe), 707 rc_range_params_dword[2]); 708 intel_de_write(display, 709 ICL_DSC1_RC_RANGE_PARAMETERS_1_UDW(pipe), 710 rc_range_params_dword[3]); 711 intel_de_write(display, 712 ICL_DSC1_RC_RANGE_PARAMETERS_2(pipe), 713 rc_range_params_dword[4]); 714 intel_de_write(display, 715 ICL_DSC1_RC_RANGE_PARAMETERS_2_UDW(pipe), 716 rc_range_params_dword[5]); 717 intel_de_write(display, 718 ICL_DSC1_RC_RANGE_PARAMETERS_3(pipe), 719 rc_range_params_dword[6]); 720 intel_de_write(display, 721 ICL_DSC1_RC_RANGE_PARAMETERS_3_UDW(pipe), 722 rc_range_params_dword[7]); 723 } 724 } 725 } 726 727 void intel_dsc_dsi_pps_write(struct intel_encoder *encoder, 728 const struct intel_crtc_state *crtc_state) 729 { 730 const struct drm_dsc_config *vdsc_cfg = &crtc_state->dsc.config; 731 struct intel_dsi *intel_dsi = enc_to_intel_dsi(encoder); 732 struct mipi_dsi_device *dsi; 733 struct drm_dsc_picture_parameter_set pps; 734 enum port port; 735 736 if (!crtc_state->dsc.compression_enable) 737 return; 738 739 drm_dsc_pps_payload_pack(&pps, vdsc_cfg); 740 741 for_each_dsi_port(port, intel_dsi->ports) { 742 dsi = intel_dsi->dsi_hosts[port]->device; 743 744 mipi_dsi_picture_parameter_set(dsi, &pps); 745 mipi_dsi_compression_mode(dsi, true); 746 } 747 } 748 749 void intel_dsc_dp_pps_write(struct intel_encoder *encoder, 750 const struct intel_crtc_state *crtc_state) 751 { 752 struct intel_digital_port *dig_port = enc_to_dig_port(encoder); 753 const struct drm_dsc_config *vdsc_cfg = &crtc_state->dsc.config; 754 struct drm_dsc_pps_infoframe dp_dsc_pps_sdp; 755 756 if (!crtc_state->dsc.compression_enable) 757 return; 758 759 /* Prepare DP SDP PPS header as per DP 1.4 spec, Table 2-123 */ 760 drm_dsc_dp_pps_header_init(&dp_dsc_pps_sdp.pps_header); 761 762 /* Fill the PPS payload bytes as per DSC spec 1.2 Table 4-1 */ 763 drm_dsc_pps_payload_pack(&dp_dsc_pps_sdp.pps_payload, vdsc_cfg); 764 765 dig_port->write_infoframe(encoder, crtc_state, 766 DP_SDP_PPS, &dp_dsc_pps_sdp, 767 sizeof(dp_dsc_pps_sdp)); 768 } 769 770 static i915_reg_t dss_ctl1_reg(struct intel_crtc *crtc, enum transcoder cpu_transcoder) 771 { 772 return is_pipe_dsc(crtc, cpu_transcoder) ? 773 ICL_PIPE_DSS_CTL1(crtc->pipe) : DSS_CTL1; 774 } 775 776 static i915_reg_t dss_ctl2_reg(struct intel_crtc *crtc, enum transcoder cpu_transcoder) 777 { 778 return is_pipe_dsc(crtc, cpu_transcoder) ? 779 ICL_PIPE_DSS_CTL2(crtc->pipe) : DSS_CTL2; 780 } 781 782 void intel_uncompressed_joiner_enable(const struct intel_crtc_state *crtc_state) 783 { 784 struct intel_display *display = to_intel_display(crtc_state); 785 struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc); 786 u32 dss_ctl1_val = 0; 787 788 if (crtc_state->joiner_pipes && !crtc_state->dsc.compression_enable) { 789 if (intel_crtc_is_bigjoiner_secondary(crtc_state)) 790 dss_ctl1_val |= UNCOMPRESSED_JOINER_SECONDARY; 791 else 792 dss_ctl1_val |= UNCOMPRESSED_JOINER_PRIMARY; 793 794 intel_de_write(display, dss_ctl1_reg(crtc, crtc_state->cpu_transcoder), 795 dss_ctl1_val); 796 } 797 } 798 799 void intel_dsc_enable(const struct intel_crtc_state *crtc_state) 800 { 801 struct intel_display *display = to_intel_display(crtc_state); 802 struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc); 803 u32 dss_ctl1_val = 0; 804 u32 dss_ctl2_val = 0; 805 int vdsc_instances_per_pipe = intel_dsc_get_vdsc_per_pipe(crtc_state); 806 807 if (!crtc_state->dsc.compression_enable) 808 return; 809 810 intel_dsc_pps_configure(crtc_state); 811 812 dss_ctl2_val |= VDSC0_ENABLE; 813 if (vdsc_instances_per_pipe > 1) { 814 dss_ctl2_val |= VDSC1_ENABLE; 815 dss_ctl1_val |= JOINER_ENABLE; 816 } 817 818 if (vdsc_instances_per_pipe > 2) { 819 dss_ctl2_val |= VDSC2_ENABLE; 820 dss_ctl2_val |= SMALL_JOINER_CONFIG_3_ENGINES; 821 } 822 823 if (crtc_state->joiner_pipes) { 824 if (intel_crtc_ultrajoiner_enable_needed(crtc_state)) 825 dss_ctl1_val |= ULTRA_JOINER_ENABLE; 826 827 if (intel_crtc_is_ultrajoiner_primary(crtc_state)) 828 dss_ctl1_val |= PRIMARY_ULTRA_JOINER_ENABLE; 829 830 dss_ctl1_val |= BIG_JOINER_ENABLE; 831 832 if (intel_crtc_is_bigjoiner_primary(crtc_state)) 833 dss_ctl1_val |= PRIMARY_BIG_JOINER_ENABLE; 834 } 835 intel_de_write(display, dss_ctl1_reg(crtc, crtc_state->cpu_transcoder), dss_ctl1_val); 836 intel_de_write(display, dss_ctl2_reg(crtc, crtc_state->cpu_transcoder), dss_ctl2_val); 837 } 838 839 void intel_dsc_disable(const struct intel_crtc_state *old_crtc_state) 840 { 841 struct intel_display *display = to_intel_display(old_crtc_state); 842 struct intel_crtc *crtc = to_intel_crtc(old_crtc_state->uapi.crtc); 843 844 /* Disable only if either of them is enabled */ 845 if (old_crtc_state->dsc.compression_enable || 846 old_crtc_state->joiner_pipes) { 847 intel_de_write(display, dss_ctl1_reg(crtc, old_crtc_state->cpu_transcoder), 0); 848 intel_de_write(display, dss_ctl2_reg(crtc, old_crtc_state->cpu_transcoder), 0); 849 } 850 } 851 852 static u32 intel_dsc_pps_read(struct intel_crtc_state *crtc_state, int pps, 853 bool *all_equal) 854 { 855 struct intel_display *display = to_intel_display(crtc_state); 856 i915_reg_t dsc_reg[3]; 857 int i, vdsc_per_pipe, dsc_reg_num; 858 u32 val; 859 860 vdsc_per_pipe = intel_dsc_get_vdsc_per_pipe(crtc_state); 861 dsc_reg_num = min_t(int, ARRAY_SIZE(dsc_reg), vdsc_per_pipe); 862 863 drm_WARN_ON_ONCE(display->drm, dsc_reg_num < vdsc_per_pipe); 864 865 intel_dsc_get_pps_reg(crtc_state, pps, dsc_reg, dsc_reg_num); 866 867 *all_equal = true; 868 869 val = intel_de_read(display, dsc_reg[0]); 870 871 for (i = 1; i < dsc_reg_num; i++) { 872 if (intel_de_read(display, dsc_reg[i]) != val) { 873 *all_equal = false; 874 break; 875 } 876 } 877 878 return val; 879 } 880 881 static u32 intel_dsc_pps_read_and_verify(struct intel_crtc_state *crtc_state, int pps) 882 { 883 struct intel_display *display = to_intel_display(crtc_state); 884 u32 val; 885 bool all_equal; 886 887 val = intel_dsc_pps_read(crtc_state, pps, &all_equal); 888 drm_WARN_ON(display->drm, !all_equal); 889 890 return val; 891 } 892 893 static void intel_dsc_get_pps_config(struct intel_crtc_state *crtc_state) 894 { 895 struct intel_display *display = to_intel_display(crtc_state); 896 struct drm_dsc_config *vdsc_cfg = &crtc_state->dsc.config; 897 int num_vdsc_instances = intel_dsc_get_num_vdsc_instances(crtc_state); 898 u32 pps_temp; 899 900 /* PPS 0 */ 901 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 0); 902 903 vdsc_cfg->bits_per_component = REG_FIELD_GET(DSC_PPS0_BPC_MASK, pps_temp); 904 vdsc_cfg->line_buf_depth = REG_FIELD_GET(DSC_PPS0_LINE_BUF_DEPTH_MASK, pps_temp); 905 vdsc_cfg->block_pred_enable = pps_temp & DSC_PPS0_BLOCK_PREDICTION; 906 vdsc_cfg->convert_rgb = pps_temp & DSC_PPS0_COLOR_SPACE_CONVERSION; 907 vdsc_cfg->simple_422 = pps_temp & DSC_PPS0_422_ENABLE; 908 vdsc_cfg->native_422 = pps_temp & DSC_PPS0_NATIVE_422_ENABLE; 909 vdsc_cfg->native_420 = pps_temp & DSC_PPS0_NATIVE_420_ENABLE; 910 vdsc_cfg->vbr_enable = pps_temp & DSC_PPS0_VBR_ENABLE; 911 912 /* PPS 1 */ 913 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 1); 914 915 vdsc_cfg->bits_per_pixel = REG_FIELD_GET(DSC_PPS1_BPP_MASK, pps_temp); 916 917 if (vdsc_cfg->native_420) 918 vdsc_cfg->bits_per_pixel >>= 1; 919 920 crtc_state->dsc.compressed_bpp_x16 = vdsc_cfg->bits_per_pixel; 921 922 /* PPS 2 */ 923 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 2); 924 925 vdsc_cfg->pic_width = REG_FIELD_GET(DSC_PPS2_PIC_WIDTH_MASK, pps_temp) * num_vdsc_instances; 926 vdsc_cfg->pic_height = REG_FIELD_GET(DSC_PPS2_PIC_HEIGHT_MASK, pps_temp); 927 928 /* PPS 3 */ 929 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 3); 930 931 vdsc_cfg->slice_width = REG_FIELD_GET(DSC_PPS3_SLICE_WIDTH_MASK, pps_temp); 932 vdsc_cfg->slice_height = REG_FIELD_GET(DSC_PPS3_SLICE_HEIGHT_MASK, pps_temp); 933 934 /* PPS 4 */ 935 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 4); 936 937 vdsc_cfg->initial_dec_delay = REG_FIELD_GET(DSC_PPS4_INITIAL_DEC_DELAY_MASK, pps_temp); 938 vdsc_cfg->initial_xmit_delay = REG_FIELD_GET(DSC_PPS4_INITIAL_XMIT_DELAY_MASK, pps_temp); 939 940 /* PPS 5 */ 941 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 5); 942 943 vdsc_cfg->scale_decrement_interval = REG_FIELD_GET(DSC_PPS5_SCALE_DEC_INT_MASK, pps_temp); 944 vdsc_cfg->scale_increment_interval = REG_FIELD_GET(DSC_PPS5_SCALE_INC_INT_MASK, pps_temp); 945 946 /* PPS 6 */ 947 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 6); 948 949 vdsc_cfg->initial_scale_value = REG_FIELD_GET(DSC_PPS6_INITIAL_SCALE_VALUE_MASK, pps_temp); 950 vdsc_cfg->first_line_bpg_offset = REG_FIELD_GET(DSC_PPS6_FIRST_LINE_BPG_OFFSET_MASK, pps_temp); 951 vdsc_cfg->flatness_min_qp = REG_FIELD_GET(DSC_PPS6_FLATNESS_MIN_QP_MASK, pps_temp); 952 vdsc_cfg->flatness_max_qp = REG_FIELD_GET(DSC_PPS6_FLATNESS_MAX_QP_MASK, pps_temp); 953 954 /* PPS 7 */ 955 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 7); 956 957 vdsc_cfg->nfl_bpg_offset = REG_FIELD_GET(DSC_PPS7_NFL_BPG_OFFSET_MASK, pps_temp); 958 vdsc_cfg->slice_bpg_offset = REG_FIELD_GET(DSC_PPS7_SLICE_BPG_OFFSET_MASK, pps_temp); 959 960 /* PPS 8 */ 961 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 8); 962 963 vdsc_cfg->initial_offset = REG_FIELD_GET(DSC_PPS8_INITIAL_OFFSET_MASK, pps_temp); 964 vdsc_cfg->final_offset = REG_FIELD_GET(DSC_PPS8_FINAL_OFFSET_MASK, pps_temp); 965 966 /* PPS 9 */ 967 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 9); 968 969 vdsc_cfg->rc_model_size = REG_FIELD_GET(DSC_PPS9_RC_MODEL_SIZE_MASK, pps_temp); 970 971 /* PPS 10 */ 972 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 10); 973 974 vdsc_cfg->rc_quant_incr_limit0 = REG_FIELD_GET(DSC_PPS10_RC_QUANT_INC_LIMIT0_MASK, pps_temp); 975 vdsc_cfg->rc_quant_incr_limit1 = REG_FIELD_GET(DSC_PPS10_RC_QUANT_INC_LIMIT1_MASK, pps_temp); 976 977 /* PPS 16 */ 978 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 16); 979 980 vdsc_cfg->slice_chunk_size = REG_FIELD_GET(DSC_PPS16_SLICE_CHUNK_SIZE_MASK, pps_temp); 981 982 if (DISPLAY_VER(display) >= 14) { 983 /* PPS 17 */ 984 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 17); 985 986 vdsc_cfg->second_line_bpg_offset = REG_FIELD_GET(DSC_PPS17_SL_BPG_OFFSET_MASK, pps_temp); 987 988 /* PPS 18 */ 989 pps_temp = intel_dsc_pps_read_and_verify(crtc_state, 18); 990 991 vdsc_cfg->nsl_bpg_offset = REG_FIELD_GET(DSC_PPS18_NSL_BPG_OFFSET_MASK, pps_temp); 992 vdsc_cfg->second_line_offset_adj = REG_FIELD_GET(DSC_PPS18_SL_OFFSET_ADJ_MASK, pps_temp); 993 } 994 } 995 996 void intel_dsc_get_config(struct intel_crtc_state *crtc_state) 997 { 998 struct intel_display *display = to_intel_display(crtc_state); 999 struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc); 1000 enum transcoder cpu_transcoder = crtc_state->cpu_transcoder; 1001 enum intel_display_power_domain power_domain; 1002 intel_wakeref_t wakeref; 1003 u32 dss_ctl1, dss_ctl2; 1004 1005 if (!intel_dsc_source_support(crtc_state)) 1006 return; 1007 1008 power_domain = intel_dsc_power_domain(crtc, cpu_transcoder); 1009 1010 wakeref = intel_display_power_get_if_enabled(display, power_domain); 1011 if (!wakeref) 1012 return; 1013 1014 dss_ctl1 = intel_de_read(display, dss_ctl1_reg(crtc, cpu_transcoder)); 1015 dss_ctl2 = intel_de_read(display, dss_ctl2_reg(crtc, cpu_transcoder)); 1016 1017 crtc_state->dsc.compression_enable = dss_ctl2 & VDSC0_ENABLE; 1018 if (!crtc_state->dsc.compression_enable) 1019 goto out; 1020 1021 if (dss_ctl1 & JOINER_ENABLE && dss_ctl2 & (VDSC2_ENABLE | SMALL_JOINER_CONFIG_3_ENGINES)) 1022 crtc_state->dsc.num_streams = 3; 1023 else if (dss_ctl1 & JOINER_ENABLE && dss_ctl2 & VDSC1_ENABLE) 1024 crtc_state->dsc.num_streams = 2; 1025 else 1026 crtc_state->dsc.num_streams = 1; 1027 1028 intel_dsc_get_pps_config(crtc_state); 1029 out: 1030 intel_display_power_put(display, power_domain, wakeref); 1031 } 1032 1033 static void intel_vdsc_dump_state(struct drm_printer *p, int indent, 1034 const struct intel_crtc_state *crtc_state) 1035 { 1036 drm_printf_indent(p, indent, 1037 "dsc-dss: compressed-bpp:" FXP_Q4_FMT ", slice-count: %d, num_streams: %d\n", 1038 FXP_Q4_ARGS(crtc_state->dsc.compressed_bpp_x16), 1039 crtc_state->dsc.slice_count, 1040 crtc_state->dsc.num_streams); 1041 } 1042 1043 void intel_vdsc_state_dump(struct drm_printer *p, int indent, 1044 const struct intel_crtc_state *crtc_state) 1045 { 1046 if (!crtc_state->dsc.compression_enable) 1047 return; 1048 1049 intel_vdsc_dump_state(p, indent, crtc_state); 1050 drm_dsc_dump_config(p, indent, &crtc_state->dsc.config); 1051 } 1052 1053 int intel_vdsc_min_cdclk(const struct intel_crtc_state *crtc_state) 1054 { 1055 struct intel_display *display = to_intel_display(crtc_state); 1056 int num_vdsc_instances = intel_dsc_get_num_vdsc_instances(crtc_state); 1057 int min_cdclk; 1058 1059 if (!crtc_state->dsc.compression_enable) 1060 return 0; 1061 1062 /* 1063 * When we decide to use only one VDSC engine, since 1064 * each VDSC operates with 1 ppc throughput, pixel clock 1065 * cannot be higher than the VDSC clock (cdclk) 1066 * If there 2 VDSC engines, then pixel clock can't be higher than 1067 * VDSC clock(cdclk) * 2 and so on. 1068 */ 1069 min_cdclk = DIV_ROUND_UP(crtc_state->pixel_rate, num_vdsc_instances); 1070 1071 if (crtc_state->joiner_pipes) { 1072 int pixel_clock = intel_dp_mode_to_fec_clock(crtc_state->hw.adjusted_mode.clock); 1073 1074 /* 1075 * According to Bigjoiner bw check: 1076 * compressed_bpp <= PPC * CDCLK * Big joiner Interface bits / Pixel clock 1077 * 1078 * We have already computed compressed_bpp, so now compute the min CDCLK that 1079 * is required to support this compressed_bpp. 1080 * 1081 * => CDCLK >= compressed_bpp * Pixel clock / (PPC * Bigjoiner Interface bits) 1082 * 1083 * Since PPC = 2 with bigjoiner 1084 * => CDCLK >= compressed_bpp * Pixel clock / 2 * Bigjoiner Interface bits 1085 */ 1086 int bigjoiner_interface_bits = DISPLAY_VER(display) >= 14 ? 36 : 24; 1087 int min_cdclk_bj = 1088 (fxp_q4_to_int_roundup(crtc_state->dsc.compressed_bpp_x16) * 1089 pixel_clock) / (2 * bigjoiner_interface_bits); 1090 1091 min_cdclk = max(min_cdclk, min_cdclk_bj); 1092 } 1093 1094 return min_cdclk; 1095 } 1096 1097 unsigned int intel_vdsc_prefill_lines(const struct intel_crtc_state *crtc_state) 1098 { 1099 if (!crtc_state->dsc.compression_enable) 1100 return 0; 1101 1102 return 0x18000; /* 1.5 */ 1103 } 1104