1/* $NetBSD: amdgpu_dcn20_dsc.c,v 1.2 2021/12/18 23:45:03 riastradh Exp $ */ 2 3/* 4 * Copyright 2017 Advanced Micro Devices, Inc. 5 * 6 * Permission is hereby granted, free of charge, to any person obtaining a 7 * copy of this software and associated documentation files (the "Software"), 8 * to deal in the Software without restriction, including without limitation 9 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 10 * and/or sell copies of the Software, and to permit persons to whom the 11 * Software is furnished to do so, subject to the following conditions: 12 * 13 * The above copyright notice and this permission notice shall be included in 14 * all copies or substantial portions of the Software. 15 * 16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 22 * OTHER DEALINGS IN THE SOFTWARE. 23 * 24 * Authors: AMD 25 * 26 */ 27 28#include <sys/cdefs.h> 29__KERNEL_RCSID(0, "$NetBSD: amdgpu_dcn20_dsc.c,v 1.2 2021/12/18 23:45:03 riastradh Exp $"); 30 31#include "reg_helper.h" 32#include "dcn20_dsc.h" 33#include "dsc/dscc_types.h" 34 35static void dsc_log_pps(struct display_stream_compressor *dsc, struct drm_dsc_config *pps); 36static bool dsc_prepare_config(const struct dsc_config *dsc_cfg, struct dsc_reg_values *dsc_reg_vals, 37 struct dsc_optc_config *dsc_optc_cfg); 38static void dsc_init_reg_values(struct dsc_reg_values *reg_vals); 39static void dsc_update_from_dsc_parameters(struct dsc_reg_values *reg_vals, const struct dsc_parameters *dsc_params); 40static void dsc_write_to_registers(struct display_stream_compressor *dsc, const struct dsc_reg_values *reg_vals); 41static enum dsc_pixel_format dsc_dc_pixel_encoding_to_dsc_pixel_format(enum dc_pixel_encoding dc_pix_enc, bool is_ycbcr422_simple); 42static enum dsc_bits_per_comp dsc_dc_color_depth_to_dsc_bits_per_comp(enum dc_color_depth); 43 44/* Object I/F functions */ 45static void dsc2_get_enc_caps(struct dsc_enc_caps *dsc_enc_caps, int pixel_clock_100Hz); 46static void dsc2_read_state(struct display_stream_compressor *dsc, struct dcn_dsc_state *s); 47static bool dsc2_validate_stream(struct display_stream_compressor *dsc, const struct dsc_config *dsc_cfg); 48static void dsc2_set_config(struct display_stream_compressor *dsc, const struct dsc_config *dsc_cfg, 49 struct dsc_optc_config *dsc_optc_cfg); 50static bool dsc2_get_packed_pps(struct display_stream_compressor *dsc, const struct dsc_config *dsc_cfg, uint8_t *dsc_packed_pps); 51static void dsc2_enable(struct display_stream_compressor *dsc, int opp_pipe); 52static void dsc2_disable(struct display_stream_compressor *dsc); 53 54const struct dsc_funcs dcn20_dsc_funcs = { 55 .dsc_get_enc_caps = dsc2_get_enc_caps, 56 .dsc_read_state = dsc2_read_state, 57 .dsc_validate_stream = dsc2_validate_stream, 58 .dsc_set_config = dsc2_set_config, 59 .dsc_get_packed_pps = dsc2_get_packed_pps, 60 .dsc_enable = dsc2_enable, 61 .dsc_disable = dsc2_disable, 62}; 63 64/* Macro definitios for REG_SET macros*/ 65#define CTX \ 66 dsc20->base.ctx 67 68#define REG(reg)\ 69 dsc20->dsc_regs->reg 70 71#undef FN 72#define FN(reg_name, field_name) \ 73 dsc20->dsc_shift->field_name, dsc20->dsc_mask->field_name 74#define DC_LOGGER \ 75 dsc->ctx->logger 76 77enum dsc_bits_per_comp { 78 DSC_BPC_8 = 8, 79 DSC_BPC_10 = 10, 80 DSC_BPC_12 = 12, 81 DSC_BPC_UNKNOWN 82}; 83 84/* API functions (external or via structure->function_pointer) */ 85 86void dsc2_construct(struct dcn20_dsc *dsc, 87 struct dc_context *ctx, 88 int inst, 89 const struct dcn20_dsc_registers *dsc_regs, 90 const struct dcn20_dsc_shift *dsc_shift, 91 const struct dcn20_dsc_mask *dsc_mask) 92{ 93 dsc->base.ctx = ctx; 94 dsc->base.inst = inst; 95 dsc->base.funcs = &dcn20_dsc_funcs; 96 97 dsc->dsc_regs = dsc_regs; 98 dsc->dsc_shift = dsc_shift; 99 dsc->dsc_mask = dsc_mask; 100 101 dsc->max_image_width = 5184; 102} 103 104 105#define DCN20_MAX_PIXEL_CLOCK_Mhz 1188 106#define DCN20_MAX_DISPLAY_CLOCK_Mhz 1200 107 108/* This returns the capabilities for a single DSC encoder engine. Number of slices and total throughput 109 * can be doubled, tripled etc. by using additional DSC engines. 110 */ 111static void dsc2_get_enc_caps(struct dsc_enc_caps *dsc_enc_caps, int pixel_clock_100Hz) 112{ 113 dsc_enc_caps->dsc_version = 0x21; /* v1.2 - DP spec defined it in reverse order and we kept it */ 114 115 dsc_enc_caps->slice_caps.bits.NUM_SLICES_1 = 1; 116 dsc_enc_caps->slice_caps.bits.NUM_SLICES_2 = 1; 117 dsc_enc_caps->slice_caps.bits.NUM_SLICES_3 = 1; 118 dsc_enc_caps->slice_caps.bits.NUM_SLICES_4 = 1; 119 120 dsc_enc_caps->lb_bit_depth = 13; 121 dsc_enc_caps->is_block_pred_supported = true; 122 123 dsc_enc_caps->color_formats.bits.RGB = 1; 124 dsc_enc_caps->color_formats.bits.YCBCR_444 = 1; 125 dsc_enc_caps->color_formats.bits.YCBCR_SIMPLE_422 = 1; 126 dsc_enc_caps->color_formats.bits.YCBCR_NATIVE_422 = 0; 127 dsc_enc_caps->color_formats.bits.YCBCR_NATIVE_420 = 1; 128 129 dsc_enc_caps->color_depth.bits.COLOR_DEPTH_8_BPC = 1; 130 dsc_enc_caps->color_depth.bits.COLOR_DEPTH_10_BPC = 1; 131 dsc_enc_caps->color_depth.bits.COLOR_DEPTH_12_BPC = 1; 132 133 /* Maximum total throughput with all the slices combined. This is different from how DP spec specifies it. 134 * Our decoder's total throughput in Pix/s is equal to DISPCLK. This is then shared between slices. 135 * The value below is the absolute maximum value. The actual throughput may be lower, but it'll always 136 * be sufficient to process the input pixel rate fed into a single DSC engine. 137 */ 138 dsc_enc_caps->max_total_throughput_mps = DCN20_MAX_DISPLAY_CLOCK_Mhz; 139 140 /* For pixel clock bigger than a single-pipe limit we'll need two engines, which then doubles our 141 * throughput and number of slices, but also introduces a lower limit of 2 slices 142 */ 143 if (pixel_clock_100Hz >= DCN20_MAX_PIXEL_CLOCK_Mhz*10000) { 144 dsc_enc_caps->slice_caps.bits.NUM_SLICES_1 = 0; 145 dsc_enc_caps->slice_caps.bits.NUM_SLICES_8 = 1; 146 dsc_enc_caps->max_total_throughput_mps = DCN20_MAX_DISPLAY_CLOCK_Mhz * 2; 147 } 148 149 // TODO DSC: This is actually image width limitation, not a slice width. This should be added to the criteria to use ODM. 150 dsc_enc_caps->max_slice_width = 5184; /* (including 64 overlap pixels for eDP MSO mode) */ 151 dsc_enc_caps->bpp_increment_div = 16; /* 1/16th of a bit */ 152} 153 154 155/* this function read dsc related register fields to be logged later in dcn10_log_hw_state 156 * into a dcn_dsc_state struct. 157 */ 158static void dsc2_read_state(struct display_stream_compressor *dsc, struct dcn_dsc_state *s) 159{ 160 struct dcn20_dsc *dsc20 = TO_DCN20_DSC(dsc); 161 162 REG_GET(DSC_TOP_CONTROL, DSC_CLOCK_EN, &s->dsc_clock_en); 163 REG_GET(DSCC_PPS_CONFIG3, SLICE_WIDTH, &s->dsc_slice_width); 164 REG_GET(DSCC_PPS_CONFIG1, BITS_PER_PIXEL, &s->dsc_bytes_per_pixel); 165} 166 167 168static bool dsc2_validate_stream(struct display_stream_compressor *dsc, const struct dsc_config *dsc_cfg) 169{ 170 struct dsc_optc_config dsc_optc_cfg; 171 struct dcn20_dsc *dsc20 = TO_DCN20_DSC(dsc); 172 173 if (dsc_cfg->pic_width > dsc20->max_image_width) 174 return false; 175 176 return dsc_prepare_config(dsc_cfg, &dsc20->reg_vals, &dsc_optc_cfg); 177} 178 179 180static void dsc_config_log(struct display_stream_compressor *dsc, const struct dsc_config *config) 181{ 182 DC_LOG_DSC("\tnum_slices_h %d", config->dc_dsc_cfg.num_slices_h); 183 DC_LOG_DSC("\tnum_slices_v %d", config->dc_dsc_cfg.num_slices_v); 184 DC_LOG_DSC("\tbits_per_pixel %d (%d.%04d)", 185 config->dc_dsc_cfg.bits_per_pixel, 186 config->dc_dsc_cfg.bits_per_pixel / 16, 187 ((config->dc_dsc_cfg.bits_per_pixel % 16) * 10000) / 16); 188 DC_LOG_DSC("\tcolor_depth %d", config->color_depth); 189} 190 191static void dsc2_set_config(struct display_stream_compressor *dsc, const struct dsc_config *dsc_cfg, 192 struct dsc_optc_config *dsc_optc_cfg) 193{ 194 bool is_config_ok; 195 struct dcn20_dsc *dsc20 = TO_DCN20_DSC(dsc); 196 197 DC_LOG_DSC(" "); 198 DC_LOG_DSC("Setting DSC Config at DSC inst %d", dsc->inst); 199 dsc_config_log(dsc, dsc_cfg); 200 is_config_ok = dsc_prepare_config(dsc_cfg, &dsc20->reg_vals, dsc_optc_cfg); 201 ASSERT(is_config_ok); 202 DC_LOG_DSC("programming DSC Picture Parameter Set (PPS):"); 203 dsc_log_pps(dsc, &dsc20->reg_vals.pps); 204 dsc_write_to_registers(dsc, &dsc20->reg_vals); 205} 206 207 208static bool dsc2_get_packed_pps(struct display_stream_compressor *dsc, const struct dsc_config *dsc_cfg, uint8_t *dsc_packed_pps) 209{ 210 bool is_config_ok; 211 struct dsc_reg_values dsc_reg_vals; 212 struct dsc_optc_config dsc_optc_cfg; 213 214 memset(&dsc_reg_vals, 0, sizeof(dsc_reg_vals)); 215 memset(&dsc_optc_cfg, 0, sizeof(dsc_optc_cfg)); 216 217 DC_LOG_DSC("Getting packed DSC PPS for DSC Config:"); 218 dsc_config_log(dsc, dsc_cfg); 219 DC_LOG_DSC("DSC Picture Parameter Set (PPS):"); 220 is_config_ok = dsc_prepare_config(dsc_cfg, &dsc_reg_vals, &dsc_optc_cfg); 221 ASSERT(is_config_ok); 222 drm_dsc_pps_payload_pack((struct drm_dsc_picture_parameter_set *)dsc_packed_pps, &dsc_reg_vals.pps); 223 dsc_log_pps(dsc, &dsc_reg_vals.pps); 224 225 return is_config_ok; 226} 227 228 229static void dsc2_enable(struct display_stream_compressor *dsc, int opp_pipe) 230{ 231 struct dcn20_dsc *dsc20 = TO_DCN20_DSC(dsc); 232 int dsc_clock_en; 233 int dsc_fw_config; 234 int enabled_opp_pipe; 235 236 DC_LOG_DSC("enable DSC %d at opp pipe %d", dsc->inst, opp_pipe); 237 238 REG_GET(DSC_TOP_CONTROL, DSC_CLOCK_EN, &dsc_clock_en); 239 REG_GET_2(DSCRM_DSC_FORWARD_CONFIG, DSCRM_DSC_FORWARD_EN, &dsc_fw_config, DSCRM_DSC_OPP_PIPE_SOURCE, &enabled_opp_pipe); 240 if ((dsc_clock_en || dsc_fw_config) && enabled_opp_pipe != opp_pipe) { 241 DC_LOG_DSC("ERROR: DSC %d at opp pipe %d already enabled!", dsc->inst, enabled_opp_pipe); 242 ASSERT(0); 243 } 244 245 REG_UPDATE(DSC_TOP_CONTROL, 246 DSC_CLOCK_EN, 1); 247 248 REG_UPDATE_2(DSCRM_DSC_FORWARD_CONFIG, 249 DSCRM_DSC_FORWARD_EN, 1, 250 DSCRM_DSC_OPP_PIPE_SOURCE, opp_pipe); 251} 252 253 254static void dsc2_disable(struct display_stream_compressor *dsc) 255{ 256 struct dcn20_dsc *dsc20 = TO_DCN20_DSC(dsc); 257 int dsc_clock_en; 258 int dsc_fw_config; 259 int enabled_opp_pipe; 260 261 DC_LOG_DSC("disable DSC %d", dsc->inst); 262 263 REG_GET(DSC_TOP_CONTROL, DSC_CLOCK_EN, &dsc_clock_en); 264 REG_GET_2(DSCRM_DSC_FORWARD_CONFIG, DSCRM_DSC_FORWARD_EN, &dsc_fw_config, DSCRM_DSC_OPP_PIPE_SOURCE, &enabled_opp_pipe); 265 if (!dsc_clock_en || !dsc_fw_config) { 266 DC_LOG_DSC("ERROR: DSC %d at opp pipe %d already disabled!", dsc->inst, enabled_opp_pipe); 267 ASSERT(0); 268 } 269 270 REG_UPDATE(DSCRM_DSC_FORWARD_CONFIG, 271 DSCRM_DSC_FORWARD_EN, 0); 272 273 REG_UPDATE(DSC_TOP_CONTROL, 274 DSC_CLOCK_EN, 0); 275} 276 277 278/* This module's internal functions */ 279static void dsc_log_pps(struct display_stream_compressor *dsc, struct drm_dsc_config *pps) 280{ 281 int i; 282 int bits_per_pixel = pps->bits_per_pixel; 283 284 DC_LOG_DSC("\tdsc_version_major %d", pps->dsc_version_major); 285 DC_LOG_DSC("\tdsc_version_minor %d", pps->dsc_version_minor); 286 DC_LOG_DSC("\tbits_per_component %d", pps->bits_per_component); 287 DC_LOG_DSC("\tline_buf_depth %d", pps->line_buf_depth); 288 DC_LOG_DSC("\tblock_pred_enable %d", pps->block_pred_enable); 289 DC_LOG_DSC("\tconvert_rgb %d", pps->convert_rgb); 290 DC_LOG_DSC("\tsimple_422 %d", pps->simple_422); 291 DC_LOG_DSC("\tvbr_enable %d", pps->vbr_enable); 292 DC_LOG_DSC("\tbits_per_pixel %d (%d.%04d)", bits_per_pixel, bits_per_pixel / 16, ((bits_per_pixel % 16) * 10000) / 16); 293 DC_LOG_DSC("\tpic_height %d", pps->pic_height); 294 DC_LOG_DSC("\tpic_width %d", pps->pic_width); 295 DC_LOG_DSC("\tslice_height %d", pps->slice_height); 296 DC_LOG_DSC("\tslice_width %d", pps->slice_width); 297 DC_LOG_DSC("\tslice_chunk_size %d", pps->slice_chunk_size); 298 DC_LOG_DSC("\tinitial_xmit_delay %d", pps->initial_xmit_delay); 299 DC_LOG_DSC("\tinitial_dec_delay %d", pps->initial_dec_delay); 300 DC_LOG_DSC("\tinitial_scale_value %d", pps->initial_scale_value); 301 DC_LOG_DSC("\tscale_increment_interval %d", pps->scale_increment_interval); 302 DC_LOG_DSC("\tscale_decrement_interval %d", pps->scale_decrement_interval); 303 DC_LOG_DSC("\tfirst_line_bpg_offset %d", pps->first_line_bpg_offset); 304 DC_LOG_DSC("\tnfl_bpg_offset %d", pps->nfl_bpg_offset); 305 DC_LOG_DSC("\tslice_bpg_offset %d", pps->slice_bpg_offset); 306 DC_LOG_DSC("\tinitial_offset %d", pps->initial_offset); 307 DC_LOG_DSC("\tfinal_offset %d", pps->final_offset); 308 DC_LOG_DSC("\tflatness_min_qp %d", pps->flatness_min_qp); 309 DC_LOG_DSC("\tflatness_max_qp %d", pps->flatness_max_qp); 310 /* DC_LOG_DSC("\trc_parameter_set %d", pps->rc_parameter_set); */ 311 DC_LOG_DSC("\tnative_420 %d", pps->native_420); 312 DC_LOG_DSC("\tnative_422 %d", pps->native_422); 313 DC_LOG_DSC("\tsecond_line_bpg_offset %d", pps->second_line_bpg_offset); 314 DC_LOG_DSC("\tnsl_bpg_offset %d", pps->nsl_bpg_offset); 315 DC_LOG_DSC("\tsecond_line_offset_adj %d", pps->second_line_offset_adj); 316 DC_LOG_DSC("\trc_model_size %d", pps->rc_model_size); 317 DC_LOG_DSC("\trc_edge_factor %d", pps->rc_edge_factor); 318 DC_LOG_DSC("\trc_quant_incr_limit0 %d", pps->rc_quant_incr_limit0); 319 DC_LOG_DSC("\trc_quant_incr_limit1 %d", pps->rc_quant_incr_limit1); 320 DC_LOG_DSC("\trc_tgt_offset_high %d", pps->rc_tgt_offset_high); 321 DC_LOG_DSC("\trc_tgt_offset_low %d", pps->rc_tgt_offset_low); 322 323 for (i = 0; i < NUM_BUF_RANGES - 1; i++) 324 DC_LOG_DSC("\trc_buf_thresh[%d] %d", i, pps->rc_buf_thresh[i]); 325 326 for (i = 0; i < NUM_BUF_RANGES; i++) { 327 DC_LOG_DSC("\trc_range_parameters[%d].range_min_qp %d", i, pps->rc_range_params[i].range_min_qp); 328 DC_LOG_DSC("\trc_range_parameters[%d].range_max_qp %d", i, pps->rc_range_params[i].range_max_qp); 329 DC_LOG_DSC("\trc_range_parameters[%d].range_bpg_offset %d", i, pps->rc_range_params[i].range_bpg_offset); 330 } 331} 332 333static bool dsc_prepare_config(const struct dsc_config *dsc_cfg, struct dsc_reg_values *dsc_reg_vals, 334 struct dsc_optc_config *dsc_optc_cfg) 335{ 336 struct dsc_parameters dsc_params; 337 338 /* Validate input parameters */ 339 ASSERT(dsc_cfg->dc_dsc_cfg.num_slices_h); 340 ASSERT(dsc_cfg->dc_dsc_cfg.num_slices_v); 341 ASSERT(dsc_cfg->dc_dsc_cfg.version_minor == 1 || dsc_cfg->dc_dsc_cfg.version_minor == 2); 342 ASSERT(dsc_cfg->pic_width); 343 ASSERT(dsc_cfg->pic_height); 344 ASSERT((dsc_cfg->dc_dsc_cfg.version_minor == 1 && 345 (8 <= dsc_cfg->dc_dsc_cfg.linebuf_depth && dsc_cfg->dc_dsc_cfg.linebuf_depth <= 13)) || 346 (dsc_cfg->dc_dsc_cfg.version_minor == 2 && 347 ((8 <= dsc_cfg->dc_dsc_cfg.linebuf_depth && dsc_cfg->dc_dsc_cfg.linebuf_depth <= 15) || 348 dsc_cfg->dc_dsc_cfg.linebuf_depth == 0))); 349 ASSERT(96 <= dsc_cfg->dc_dsc_cfg.bits_per_pixel && dsc_cfg->dc_dsc_cfg.bits_per_pixel <= 0x3ff); // 6.0 <= bits_per_pixel <= 63.9375 350 351 if (!dsc_cfg->dc_dsc_cfg.num_slices_v || !dsc_cfg->dc_dsc_cfg.num_slices_h || 352 !(dsc_cfg->dc_dsc_cfg.version_minor == 1 || dsc_cfg->dc_dsc_cfg.version_minor == 2) || 353 !dsc_cfg->pic_width || !dsc_cfg->pic_height || 354 !((dsc_cfg->dc_dsc_cfg.version_minor == 1 && // v1.1 line buffer depth range: 355 8 <= dsc_cfg->dc_dsc_cfg.linebuf_depth && dsc_cfg->dc_dsc_cfg.linebuf_depth <= 13) || 356 (dsc_cfg->dc_dsc_cfg.version_minor == 2 && // v1.2 line buffer depth range: 357 ((8 <= dsc_cfg->dc_dsc_cfg.linebuf_depth && dsc_cfg->dc_dsc_cfg.linebuf_depth <= 15) || 358 dsc_cfg->dc_dsc_cfg.linebuf_depth == 0))) || 359 !(96 <= dsc_cfg->dc_dsc_cfg.bits_per_pixel && dsc_cfg->dc_dsc_cfg.bits_per_pixel <= 0x3ff)) { 360 dm_output_to_console("%s: Invalid parameters\n", __func__); 361 return false; 362 } 363 364 dsc_init_reg_values(dsc_reg_vals); 365 366 /* Copy input config */ 367 dsc_reg_vals->pixel_format = dsc_dc_pixel_encoding_to_dsc_pixel_format(dsc_cfg->pixel_encoding, dsc_cfg->dc_dsc_cfg.ycbcr422_simple); 368 dsc_reg_vals->num_slices_h = dsc_cfg->dc_dsc_cfg.num_slices_h; 369 dsc_reg_vals->num_slices_v = dsc_cfg->dc_dsc_cfg.num_slices_v; 370 dsc_reg_vals->pps.dsc_version_minor = dsc_cfg->dc_dsc_cfg.version_minor; 371 dsc_reg_vals->pps.pic_width = dsc_cfg->pic_width; 372 dsc_reg_vals->pps.pic_height = dsc_cfg->pic_height; 373 dsc_reg_vals->pps.bits_per_component = dsc_dc_color_depth_to_dsc_bits_per_comp(dsc_cfg->color_depth); 374 dsc_reg_vals->pps.block_pred_enable = dsc_cfg->dc_dsc_cfg.block_pred_enable; 375 dsc_reg_vals->pps.line_buf_depth = dsc_cfg->dc_dsc_cfg.linebuf_depth; 376 dsc_reg_vals->alternate_ich_encoding_en = dsc_reg_vals->pps.dsc_version_minor == 1 ? 0 : 1; 377 378 // TODO: in addition to validating slice height (pic height must be divisible by slice height), 379 // see what happens when the same condition doesn't apply for slice_width/pic_width. 380 dsc_reg_vals->pps.slice_width = dsc_cfg->pic_width / dsc_cfg->dc_dsc_cfg.num_slices_h; 381 dsc_reg_vals->pps.slice_height = dsc_cfg->pic_height / dsc_cfg->dc_dsc_cfg.num_slices_v; 382 383 ASSERT(dsc_reg_vals->pps.slice_height * dsc_cfg->dc_dsc_cfg.num_slices_v == dsc_cfg->pic_height); 384 if (!(dsc_reg_vals->pps.slice_height * dsc_cfg->dc_dsc_cfg.num_slices_v == dsc_cfg->pic_height)) { 385 dm_output_to_console("%s: pix height %d not divisible by num_slices_v %d\n\n", __func__, dsc_cfg->pic_height, dsc_cfg->dc_dsc_cfg.num_slices_v); 386 return false; 387 } 388 389 dsc_reg_vals->bpp_x32 = dsc_cfg->dc_dsc_cfg.bits_per_pixel << 1; 390 if (dsc_reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR420 || dsc_reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR422) 391 dsc_reg_vals->pps.bits_per_pixel = dsc_reg_vals->bpp_x32; 392 else 393 dsc_reg_vals->pps.bits_per_pixel = dsc_reg_vals->bpp_x32 >> 1; 394 395 dsc_reg_vals->pps.convert_rgb = dsc_reg_vals->pixel_format == DSC_PIXFMT_RGB ? 1 : 0; 396 dsc_reg_vals->pps.native_422 = (dsc_reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR422); 397 dsc_reg_vals->pps.native_420 = (dsc_reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR420); 398 dsc_reg_vals->pps.simple_422 = (dsc_reg_vals->pixel_format == DSC_PIXFMT_SIMPLE_YCBCR422); 399 400 if (dscc_compute_dsc_parameters(&dsc_reg_vals->pps, &dsc_params)) { 401 dm_output_to_console("%s: DSC config failed\n", __func__); 402 return false; 403 } 404 405 dsc_update_from_dsc_parameters(dsc_reg_vals, &dsc_params); 406 407 dsc_optc_cfg->bytes_per_pixel = dsc_params.bytes_per_pixel; 408 dsc_optc_cfg->slice_width = dsc_reg_vals->pps.slice_width; 409 dsc_optc_cfg->is_pixel_format_444 = dsc_reg_vals->pixel_format == DSC_PIXFMT_RGB || 410 dsc_reg_vals->pixel_format == DSC_PIXFMT_YCBCR444 || 411 dsc_reg_vals->pixel_format == DSC_PIXFMT_SIMPLE_YCBCR422; 412 413 return true; 414} 415 416 417static enum dsc_pixel_format dsc_dc_pixel_encoding_to_dsc_pixel_format(enum dc_pixel_encoding dc_pix_enc, bool is_ycbcr422_simple) 418{ 419 enum dsc_pixel_format dsc_pix_fmt = DSC_PIXFMT_UNKNOWN; 420 421 /* NOTE: We don't support DSC_PIXFMT_SIMPLE_YCBCR422 */ 422 423 switch (dc_pix_enc) { 424 case PIXEL_ENCODING_RGB: 425 dsc_pix_fmt = DSC_PIXFMT_RGB; 426 break; 427 case PIXEL_ENCODING_YCBCR422: 428 if (is_ycbcr422_simple) 429 dsc_pix_fmt = DSC_PIXFMT_SIMPLE_YCBCR422; 430 else 431 dsc_pix_fmt = DSC_PIXFMT_NATIVE_YCBCR422; 432 break; 433 case PIXEL_ENCODING_YCBCR444: 434 dsc_pix_fmt = DSC_PIXFMT_YCBCR444; 435 break; 436 case PIXEL_ENCODING_YCBCR420: 437 dsc_pix_fmt = DSC_PIXFMT_NATIVE_YCBCR420; 438 break; 439 default: 440 dsc_pix_fmt = DSC_PIXFMT_UNKNOWN; 441 break; 442 } 443 444 ASSERT(dsc_pix_fmt != DSC_PIXFMT_UNKNOWN); 445 return dsc_pix_fmt; 446} 447 448 449static enum dsc_bits_per_comp dsc_dc_color_depth_to_dsc_bits_per_comp(enum dc_color_depth dc_color_depth) 450{ 451 enum dsc_bits_per_comp bpc = DSC_BPC_UNKNOWN; 452 453 switch (dc_color_depth) { 454 case COLOR_DEPTH_888: 455 bpc = DSC_BPC_8; 456 break; 457 case COLOR_DEPTH_101010: 458 bpc = DSC_BPC_10; 459 break; 460 case COLOR_DEPTH_121212: 461 bpc = DSC_BPC_12; 462 break; 463 default: 464 bpc = DSC_BPC_UNKNOWN; 465 break; 466 } 467 468 return bpc; 469} 470 471 472static void dsc_init_reg_values(struct dsc_reg_values *reg_vals) 473{ 474 int i; 475 476 memset(reg_vals, 0, sizeof(struct dsc_reg_values)); 477 478 /* Non-PPS values */ 479 reg_vals->dsc_clock_enable = 1; 480 reg_vals->dsc_clock_gating_disable = 0; 481 reg_vals->underflow_recovery_en = 0; 482 reg_vals->underflow_occurred_int_en = 0; 483 reg_vals->underflow_occurred_status = 0; 484 reg_vals->ich_reset_at_eol = 0; 485 reg_vals->alternate_ich_encoding_en = 0; 486 reg_vals->rc_buffer_model_size = 0; 487 /*reg_vals->disable_ich = 0;*/ 488 reg_vals->dsc_dbg_en = 0; 489 490 for (i = 0; i < 4; i++) 491 reg_vals->rc_buffer_model_overflow_int_en[i] = 0; 492 493 /* PPS values */ 494 reg_vals->pps.dsc_version_minor = 2; 495 reg_vals->pps.dsc_version_major = 1; 496 reg_vals->pps.line_buf_depth = 9; 497 reg_vals->pps.bits_per_component = 8; 498 reg_vals->pps.block_pred_enable = 1; 499 reg_vals->pps.slice_chunk_size = 0; 500 reg_vals->pps.pic_width = 0; 501 reg_vals->pps.pic_height = 0; 502 reg_vals->pps.slice_width = 0; 503 reg_vals->pps.slice_height = 0; 504 reg_vals->pps.initial_xmit_delay = 170; 505 reg_vals->pps.initial_dec_delay = 0; 506 reg_vals->pps.initial_scale_value = 0; 507 reg_vals->pps.scale_increment_interval = 0; 508 reg_vals->pps.scale_decrement_interval = 0; 509 reg_vals->pps.nfl_bpg_offset = 0; 510 reg_vals->pps.slice_bpg_offset = 0; 511 reg_vals->pps.nsl_bpg_offset = 0; 512 reg_vals->pps.initial_offset = 6144; 513 reg_vals->pps.final_offset = 0; 514 reg_vals->pps.flatness_min_qp = 3; 515 reg_vals->pps.flatness_max_qp = 12; 516 reg_vals->pps.rc_model_size = 8192; 517 reg_vals->pps.rc_edge_factor = 6; 518 reg_vals->pps.rc_quant_incr_limit0 = 11; 519 reg_vals->pps.rc_quant_incr_limit1 = 11; 520 reg_vals->pps.rc_tgt_offset_low = 3; 521 reg_vals->pps.rc_tgt_offset_high = 3; 522} 523 524/* Updates dsc_reg_values::reg_vals::xxx fields based on the values from computed params. 525 * This is required because dscc_compute_dsc_parameters returns a modified PPS, which in turn 526 * affects non-PPS register values. 527 */ 528static void dsc_update_from_dsc_parameters(struct dsc_reg_values *reg_vals, const struct dsc_parameters *dsc_params) 529{ 530 int i; 531 532 reg_vals->pps = dsc_params->pps; 533 534 // pps_computed will have the "expanded" values; need to shift them to make them fit for regs. 535 for (i = 0; i < NUM_BUF_RANGES - 1; i++) 536 reg_vals->pps.rc_buf_thresh[i] = reg_vals->pps.rc_buf_thresh[i] >> 6; 537 538 reg_vals->rc_buffer_model_size = dsc_params->rc_buffer_model_size; 539 reg_vals->ich_reset_at_eol = reg_vals->num_slices_h == 1 ? 0 : 0xf; 540} 541 542static void dsc_write_to_registers(struct display_stream_compressor *dsc, const struct dsc_reg_values *reg_vals) 543{ 544 uint32_t temp_int; 545 struct dcn20_dsc *dsc20 = TO_DCN20_DSC(dsc); 546 547 REG_SET(DSC_DEBUG_CONTROL, 0, 548 DSC_DBG_EN, reg_vals->dsc_dbg_en); 549 550 // dsccif registers 551 REG_SET_5(DSCCIF_CONFIG0, 0, 552 INPUT_INTERFACE_UNDERFLOW_RECOVERY_EN, reg_vals->underflow_recovery_en, 553 INPUT_INTERFACE_UNDERFLOW_OCCURRED_INT_EN, reg_vals->underflow_occurred_int_en, 554 INPUT_INTERFACE_UNDERFLOW_OCCURRED_STATUS, reg_vals->underflow_occurred_status, 555 INPUT_PIXEL_FORMAT, reg_vals->pixel_format, 556 DSCCIF_CONFIG0__BITS_PER_COMPONENT, reg_vals->pps.bits_per_component); 557 558 REG_SET_2(DSCCIF_CONFIG1, 0, 559 PIC_WIDTH, reg_vals->pps.pic_width, 560 PIC_HEIGHT, reg_vals->pps.pic_height); 561 562 // dscc registers 563 REG_SET_4(DSCC_CONFIG0, 0, 564 ICH_RESET_AT_END_OF_LINE, reg_vals->ich_reset_at_eol, 565 NUMBER_OF_SLICES_PER_LINE, reg_vals->num_slices_h - 1, 566 ALTERNATE_ICH_ENCODING_EN, reg_vals->alternate_ich_encoding_en, 567 NUMBER_OF_SLICES_IN_VERTICAL_DIRECTION, reg_vals->num_slices_v - 1); 568 569 REG_SET(DSCC_CONFIG1, 0, 570 DSCC_RATE_CONTROL_BUFFER_MODEL_SIZE, reg_vals->rc_buffer_model_size); 571 /*REG_SET_2(DSCC_CONFIG1, 0, 572 DSCC_RATE_CONTROL_BUFFER_MODEL_SIZE, reg_vals->rc_buffer_model_size, 573 DSCC_DISABLE_ICH, reg_vals->disable_ich);*/ 574 575 REG_SET_4(DSCC_INTERRUPT_CONTROL_STATUS, 0, 576 DSCC_RATE_CONTROL_BUFFER_MODEL0_OVERFLOW_OCCURRED_INT_EN, reg_vals->rc_buffer_model_overflow_int_en[0], 577 DSCC_RATE_CONTROL_BUFFER_MODEL1_OVERFLOW_OCCURRED_INT_EN, reg_vals->rc_buffer_model_overflow_int_en[1], 578 DSCC_RATE_CONTROL_BUFFER_MODEL2_OVERFLOW_OCCURRED_INT_EN, reg_vals->rc_buffer_model_overflow_int_en[2], 579 DSCC_RATE_CONTROL_BUFFER_MODEL3_OVERFLOW_OCCURRED_INT_EN, reg_vals->rc_buffer_model_overflow_int_en[3]); 580 581 REG_SET_3(DSCC_PPS_CONFIG0, 0, 582 DSC_VERSION_MINOR, reg_vals->pps.dsc_version_minor, 583 LINEBUF_DEPTH, reg_vals->pps.line_buf_depth, 584 DSCC_PPS_CONFIG0__BITS_PER_COMPONENT, reg_vals->pps.bits_per_component); 585 586 if (reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR420 || reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR422) 587 temp_int = reg_vals->bpp_x32; 588 else 589 temp_int = reg_vals->bpp_x32 >> 1; 590 591 REG_SET_7(DSCC_PPS_CONFIG1, 0, 592 BITS_PER_PIXEL, temp_int, 593 SIMPLE_422, reg_vals->pixel_format == DSC_PIXFMT_SIMPLE_YCBCR422, 594 CONVERT_RGB, reg_vals->pixel_format == DSC_PIXFMT_RGB, 595 BLOCK_PRED_ENABLE, reg_vals->pps.block_pred_enable, 596 NATIVE_422, reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR422, 597 NATIVE_420, reg_vals->pixel_format == DSC_PIXFMT_NATIVE_YCBCR420, 598 CHUNK_SIZE, reg_vals->pps.slice_chunk_size); 599 600 REG_SET_2(DSCC_PPS_CONFIG2, 0, 601 PIC_WIDTH, reg_vals->pps.pic_width, 602 PIC_HEIGHT, reg_vals->pps.pic_height); 603 604 REG_SET_2(DSCC_PPS_CONFIG3, 0, 605 SLICE_WIDTH, reg_vals->pps.slice_width, 606 SLICE_HEIGHT, reg_vals->pps.slice_height); 607 608 REG_SET(DSCC_PPS_CONFIG4, 0, 609 INITIAL_XMIT_DELAY, reg_vals->pps.initial_xmit_delay); 610 611 REG_SET_2(DSCC_PPS_CONFIG5, 0, 612 INITIAL_SCALE_VALUE, reg_vals->pps.initial_scale_value, 613 SCALE_INCREMENT_INTERVAL, reg_vals->pps.scale_increment_interval); 614 615 REG_SET_3(DSCC_PPS_CONFIG6, 0, 616 SCALE_DECREMENT_INTERVAL, reg_vals->pps.scale_decrement_interval, 617 FIRST_LINE_BPG_OFFSET, reg_vals->pps.first_line_bpg_offset, 618 SECOND_LINE_BPG_OFFSET, reg_vals->pps.second_line_bpg_offset); 619 620 REG_SET_2(DSCC_PPS_CONFIG7, 0, 621 NFL_BPG_OFFSET, reg_vals->pps.nfl_bpg_offset, 622 SLICE_BPG_OFFSET, reg_vals->pps.slice_bpg_offset); 623 624 REG_SET_2(DSCC_PPS_CONFIG8, 0, 625 NSL_BPG_OFFSET, reg_vals->pps.nsl_bpg_offset, 626 SECOND_LINE_OFFSET_ADJ, reg_vals->pps.second_line_offset_adj); 627 628 REG_SET_2(DSCC_PPS_CONFIG9, 0, 629 INITIAL_OFFSET, reg_vals->pps.initial_offset, 630 FINAL_OFFSET, reg_vals->pps.final_offset); 631 632 REG_SET_3(DSCC_PPS_CONFIG10, 0, 633 FLATNESS_MIN_QP, reg_vals->pps.flatness_min_qp, 634 FLATNESS_MAX_QP, reg_vals->pps.flatness_max_qp, 635 RC_MODEL_SIZE, reg_vals->pps.rc_model_size); 636 637 REG_SET_5(DSCC_PPS_CONFIG11, 0, 638 RC_EDGE_FACTOR, reg_vals->pps.rc_edge_factor, 639 RC_QUANT_INCR_LIMIT0, reg_vals->pps.rc_quant_incr_limit0, 640 RC_QUANT_INCR_LIMIT1, reg_vals->pps.rc_quant_incr_limit1, 641 RC_TGT_OFFSET_LO, reg_vals->pps.rc_tgt_offset_low, 642 RC_TGT_OFFSET_HI, reg_vals->pps.rc_tgt_offset_high); 643 644 REG_SET_4(DSCC_PPS_CONFIG12, 0, 645 RC_BUF_THRESH0, reg_vals->pps.rc_buf_thresh[0], 646 RC_BUF_THRESH1, reg_vals->pps.rc_buf_thresh[1], 647 RC_BUF_THRESH2, reg_vals->pps.rc_buf_thresh[2], 648 RC_BUF_THRESH3, reg_vals->pps.rc_buf_thresh[3]); 649 650 REG_SET_4(DSCC_PPS_CONFIG13, 0, 651 RC_BUF_THRESH4, reg_vals->pps.rc_buf_thresh[4], 652 RC_BUF_THRESH5, reg_vals->pps.rc_buf_thresh[5], 653 RC_BUF_THRESH6, reg_vals->pps.rc_buf_thresh[6], 654 RC_BUF_THRESH7, reg_vals->pps.rc_buf_thresh[7]); 655 656 REG_SET_4(DSCC_PPS_CONFIG14, 0, 657 RC_BUF_THRESH8, reg_vals->pps.rc_buf_thresh[8], 658 RC_BUF_THRESH9, reg_vals->pps.rc_buf_thresh[9], 659 RC_BUF_THRESH10, reg_vals->pps.rc_buf_thresh[10], 660 RC_BUF_THRESH11, reg_vals->pps.rc_buf_thresh[11]); 661 662 REG_SET_5(DSCC_PPS_CONFIG15, 0, 663 RC_BUF_THRESH12, reg_vals->pps.rc_buf_thresh[12], 664 RC_BUF_THRESH13, reg_vals->pps.rc_buf_thresh[13], 665 RANGE_MIN_QP0, reg_vals->pps.rc_range_params[0].range_min_qp, 666 RANGE_MAX_QP0, reg_vals->pps.rc_range_params[0].range_max_qp, 667 RANGE_BPG_OFFSET0, reg_vals->pps.rc_range_params[0].range_bpg_offset); 668 669 REG_SET_6(DSCC_PPS_CONFIG16, 0, 670 RANGE_MIN_QP1, reg_vals->pps.rc_range_params[1].range_min_qp, 671 RANGE_MAX_QP1, reg_vals->pps.rc_range_params[1].range_max_qp, 672 RANGE_BPG_OFFSET1, reg_vals->pps.rc_range_params[1].range_bpg_offset, 673 RANGE_MIN_QP2, reg_vals->pps.rc_range_params[2].range_min_qp, 674 RANGE_MAX_QP2, reg_vals->pps.rc_range_params[2].range_max_qp, 675 RANGE_BPG_OFFSET2, reg_vals->pps.rc_range_params[2].range_bpg_offset); 676 677 REG_SET_6(DSCC_PPS_CONFIG17, 0, 678 RANGE_MIN_QP3, reg_vals->pps.rc_range_params[3].range_min_qp, 679 RANGE_MAX_QP3, reg_vals->pps.rc_range_params[3].range_max_qp, 680 RANGE_BPG_OFFSET3, reg_vals->pps.rc_range_params[3].range_bpg_offset, 681 RANGE_MIN_QP4, reg_vals->pps.rc_range_params[4].range_min_qp, 682 RANGE_MAX_QP4, reg_vals->pps.rc_range_params[4].range_max_qp, 683 RANGE_BPG_OFFSET4, reg_vals->pps.rc_range_params[4].range_bpg_offset); 684 685 REG_SET_6(DSCC_PPS_CONFIG18, 0, 686 RANGE_MIN_QP5, reg_vals->pps.rc_range_params[5].range_min_qp, 687 RANGE_MAX_QP5, reg_vals->pps.rc_range_params[5].range_max_qp, 688 RANGE_BPG_OFFSET5, reg_vals->pps.rc_range_params[5].range_bpg_offset, 689 RANGE_MIN_QP6, reg_vals->pps.rc_range_params[6].range_min_qp, 690 RANGE_MAX_QP6, reg_vals->pps.rc_range_params[6].range_max_qp, 691 RANGE_BPG_OFFSET6, reg_vals->pps.rc_range_params[6].range_bpg_offset); 692 693 REG_SET_6(DSCC_PPS_CONFIG19, 0, 694 RANGE_MIN_QP7, reg_vals->pps.rc_range_params[7].range_min_qp, 695 RANGE_MAX_QP7, reg_vals->pps.rc_range_params[7].range_max_qp, 696 RANGE_BPG_OFFSET7, reg_vals->pps.rc_range_params[7].range_bpg_offset, 697 RANGE_MIN_QP8, reg_vals->pps.rc_range_params[8].range_min_qp, 698 RANGE_MAX_QP8, reg_vals->pps.rc_range_params[8].range_max_qp, 699 RANGE_BPG_OFFSET8, reg_vals->pps.rc_range_params[8].range_bpg_offset); 700 701 REG_SET_6(DSCC_PPS_CONFIG20, 0, 702 RANGE_MIN_QP9, reg_vals->pps.rc_range_params[9].range_min_qp, 703 RANGE_MAX_QP9, reg_vals->pps.rc_range_params[9].range_max_qp, 704 RANGE_BPG_OFFSET9, reg_vals->pps.rc_range_params[9].range_bpg_offset, 705 RANGE_MIN_QP10, reg_vals->pps.rc_range_params[10].range_min_qp, 706 RANGE_MAX_QP10, reg_vals->pps.rc_range_params[10].range_max_qp, 707 RANGE_BPG_OFFSET10, reg_vals->pps.rc_range_params[10].range_bpg_offset); 708 709 REG_SET_6(DSCC_PPS_CONFIG21, 0, 710 RANGE_MIN_QP11, reg_vals->pps.rc_range_params[11].range_min_qp, 711 RANGE_MAX_QP11, reg_vals->pps.rc_range_params[11].range_max_qp, 712 RANGE_BPG_OFFSET11, reg_vals->pps.rc_range_params[11].range_bpg_offset, 713 RANGE_MIN_QP12, reg_vals->pps.rc_range_params[12].range_min_qp, 714 RANGE_MAX_QP12, reg_vals->pps.rc_range_params[12].range_max_qp, 715 RANGE_BPG_OFFSET12, reg_vals->pps.rc_range_params[12].range_bpg_offset); 716 717 REG_SET_6(DSCC_PPS_CONFIG22, 0, 718 RANGE_MIN_QP13, reg_vals->pps.rc_range_params[13].range_min_qp, 719 RANGE_MAX_QP13, reg_vals->pps.rc_range_params[13].range_max_qp, 720 RANGE_BPG_OFFSET13, reg_vals->pps.rc_range_params[13].range_bpg_offset, 721 RANGE_MIN_QP14, reg_vals->pps.rc_range_params[14].range_min_qp, 722 RANGE_MAX_QP14, reg_vals->pps.rc_range_params[14].range_max_qp, 723 RANGE_BPG_OFFSET14, reg_vals->pps.rc_range_params[14].range_bpg_offset); 724 725 if (IS_FPGA_MAXIMUS_DC(dsc20->base.ctx->dce_environment)) { 726 /* It's safe to do this as long as debug bus is not being used in DAL Diag environment. 727 * 728 * This is because DSCC_PPS_CONFIG4.INITIAL_DEC_DELAY is a read-only register field (because it's a decoder 729 * value not required by DSC encoder). However, since decoding fails when this value is missing from PPS, it's 730 * required to communicate this value to the PPS header. When testing on FPGA, the values for PPS header are 731 * being read from Diag register dump. The register below is used in place of a scratch register to make 732 * 'initial_dec_delay' available. 733 */ 734 735 temp_int = reg_vals->pps.initial_dec_delay; 736 REG_SET_4(DSCC_TEST_DEBUG_BUS_ROTATE, 0, 737 DSCC_TEST_DEBUG_BUS0_ROTATE, temp_int & 0x1f, 738 DSCC_TEST_DEBUG_BUS1_ROTATE, temp_int >> 5 & 0x1f, 739 DSCC_TEST_DEBUG_BUS2_ROTATE, temp_int >> 10 & 0x1f, 740 DSCC_TEST_DEBUG_BUS3_ROTATE, temp_int >> 15 & 0x1); 741 } 742} 743 744