Merge tag 'selinux-pr-20220321' of git://git.kernel.org/pub/scm/linux/kernel/git...
[linux-block.git] / drivers / gpu / drm / drm_dsc.c
CommitLineData
a408c857
MN
1// SPDX-License-Identifier: MIT
2/*
3 * Copyright © 2018 Intel Corp
4 *
5 * Author:
6 * Manasi Navare <manasi.d.navare@intel.com>
7 */
8
9#include <linux/kernel.h>
10#include <linux/module.h>
11#include <linux/init.h>
12#include <linux/errno.h>
13#include <linux/byteorder/generic.h>
dc43332b 14#include <drm/drm_print.h>
a408c857
MN
15#include <drm/drm_dp_helper.h>
16#include <drm/drm_dsc.h>
17
18/**
19 * DOC: dsc helpers
20 *
05bad235
MN
21 * VESA specification for DP 1.4 adds a new feature called Display Stream
22 * Compression (DSC) used to compress the pixel bits before sending it on
23 * DP/eDP/MIPI DSI interface. DSC is required to be enabled so that the existing
24 * display interfaces can support high resolutions at higher frames rates uisng
25 * the maximum available link capacity of these interfaces.
26 *
a408c857
MN
27 * These functions contain some common logic and helpers to deal with VESA
28 * Display Stream Compression standard required for DSC on Display Port/eDP or
29 * MIPI display interfaces.
30 */
31
32/**
33 * drm_dsc_dp_pps_header_init() - Initializes the PPS Header
34 * for DisplayPort as per the DP 1.4 spec.
dbfbe717
DF
35 * @pps_header: Secondary data packet header for DSC Picture
36 * Parameter Set as defined in &struct dp_sdp_header
05bad235
MN
37 *
38 * DP 1.4 spec defines the secondary data packet for sending the
39 * picture parameter infoframes from the source to the sink.
dbfbe717
DF
40 * This function populates the SDP header defined in
41 * &struct dp_sdp_header.
a408c857 42 */
dbfbe717 43void drm_dsc_dp_pps_header_init(struct dp_sdp_header *pps_header)
a408c857 44{
dbfbe717 45 memset(pps_header, 0, sizeof(*pps_header));
a408c857 46
dbfbe717
DF
47 pps_header->HB1 = DP_SDP_PPS;
48 pps_header->HB2 = DP_SDP_PPS_HEADER_PAYLOAD_BYTES_MINUS_1;
a408c857
MN
49}
50EXPORT_SYMBOL(drm_dsc_dp_pps_header_init);
51
a8f65ba3
JN
52/**
53 * drm_dsc_dp_rc_buffer_size - get rc buffer size in bytes
54 * @rc_buffer_block_size: block size code, according to DPCD offset 62h
55 * @rc_buffer_size: number of blocks - 1, according to DPCD offset 63h
56 *
57 * return:
58 * buffer size in bytes, or 0 on invalid input
59 */
60int drm_dsc_dp_rc_buffer_size(u8 rc_buffer_block_size, u8 rc_buffer_size)
61{
62 int size = 1024 * (rc_buffer_size + 1);
63
64 switch (rc_buffer_block_size) {
65 case DP_DSC_RC_BUF_BLK_SIZE_1:
66 return 1 * size;
67 case DP_DSC_RC_BUF_BLK_SIZE_4:
68 return 4 * size;
69 case DP_DSC_RC_BUF_BLK_SIZE_16:
70 return 16 * size;
71 case DP_DSC_RC_BUF_BLK_SIZE_64:
72 return 64 * size;
73 default:
74 return 0;
75 }
76}
77EXPORT_SYMBOL(drm_dsc_dp_rc_buffer_size);
78
a408c857 79/**
dbfbe717 80 * drm_dsc_pps_payload_pack() - Populates the DSC PPS
a408c857 81 *
dbfbe717
DF
82 * @pps_payload:
83 * Bitwise struct for DSC Picture Parameter Set. This is defined
84 * by &struct drm_dsc_picture_parameter_set
a408c857 85 * @dsc_cfg:
05bad235
MN
86 * DSC Configuration data filled by driver as defined by
87 * &struct drm_dsc_config
88 *
dbfbe717
DF
89 * DSC source device sends a picture parameter set (PPS) containing the
90 * information required by the sink to decode the compressed frame. Driver
91 * populates the DSC PPS struct using the DSC configuration parameters in
92 * the order expected by the DSC Display Sink device. For the DSC, the sink
93 * device expects the PPS payload in big endian format for fields
94 * that span more than 1 byte.
a408c857 95 */
dbfbe717 96void drm_dsc_pps_payload_pack(struct drm_dsc_picture_parameter_set *pps_payload,
a408c857
MN
97 const struct drm_dsc_config *dsc_cfg)
98{
99 int i;
100
0ae865ef 101 /* Protect against someone accidentally changing struct size */
dbfbe717 102 BUILD_BUG_ON(sizeof(*pps_payload) !=
a408c857
MN
103 DP_SDP_PPS_HEADER_PAYLOAD_BYTES_MINUS_1 + 1);
104
dbfbe717 105 memset(pps_payload, 0, sizeof(*pps_payload));
a408c857
MN
106
107 /* PPS 0 */
dbfbe717 108 pps_payload->dsc_version =
a408c857
MN
109 dsc_cfg->dsc_version_minor |
110 dsc_cfg->dsc_version_major << DSC_PPS_VERSION_MAJOR_SHIFT;
111
112 /* PPS 1, 2 is 0 */
113
114 /* PPS 3 */
dbfbe717 115 pps_payload->pps_3 =
a408c857
MN
116 dsc_cfg->line_buf_depth |
117 dsc_cfg->bits_per_component << DSC_PPS_BPC_SHIFT;
118
119 /* PPS 4 */
dbfbe717 120 pps_payload->pps_4 =
a408c857
MN
121 ((dsc_cfg->bits_per_pixel & DSC_PPS_BPP_HIGH_MASK) >>
122 DSC_PPS_MSB_SHIFT) |
123 dsc_cfg->vbr_enable << DSC_PPS_VBR_EN_SHIFT |
06d7cecd 124 dsc_cfg->simple_422 << DSC_PPS_SIMPLE422_SHIFT |
a408c857
MN
125 dsc_cfg->convert_rgb << DSC_PPS_CONVERT_RGB_SHIFT |
126 dsc_cfg->block_pred_enable << DSC_PPS_BLOCK_PRED_EN_SHIFT;
127
128 /* PPS 5 */
dbfbe717 129 pps_payload->bits_per_pixel_low =
a408c857
MN
130 (dsc_cfg->bits_per_pixel & DSC_PPS_LSB_MASK);
131
132 /*
133 * The DSC panel expects the PPS packet to have big endian format
134 * for data spanning 2 bytes. Use a macro cpu_to_be16() to convert
135 * to big endian format. If format is little endian, it will swap
136 * bytes to convert to Big endian else keep it unchanged.
137 */
138
139 /* PPS 6, 7 */
dbfbe717 140 pps_payload->pic_height = cpu_to_be16(dsc_cfg->pic_height);
a408c857
MN
141
142 /* PPS 8, 9 */
dbfbe717 143 pps_payload->pic_width = cpu_to_be16(dsc_cfg->pic_width);
a408c857
MN
144
145 /* PPS 10, 11 */
dbfbe717 146 pps_payload->slice_height = cpu_to_be16(dsc_cfg->slice_height);
a408c857
MN
147
148 /* PPS 12, 13 */
dbfbe717 149 pps_payload->slice_width = cpu_to_be16(dsc_cfg->slice_width);
a408c857
MN
150
151 /* PPS 14, 15 */
dbfbe717 152 pps_payload->chunk_size = cpu_to_be16(dsc_cfg->slice_chunk_size);
a408c857
MN
153
154 /* PPS 16 */
dbfbe717 155 pps_payload->initial_xmit_delay_high =
a408c857
MN
156 ((dsc_cfg->initial_xmit_delay &
157 DSC_PPS_INIT_XMIT_DELAY_HIGH_MASK) >>
158 DSC_PPS_MSB_SHIFT);
159
160 /* PPS 17 */
dbfbe717 161 pps_payload->initial_xmit_delay_low =
a408c857
MN
162 (dsc_cfg->initial_xmit_delay & DSC_PPS_LSB_MASK);
163
164 /* PPS 18, 19 */
dbfbe717 165 pps_payload->initial_dec_delay =
a408c857
MN
166 cpu_to_be16(dsc_cfg->initial_dec_delay);
167
168 /* PPS 20 is 0 */
169
170 /* PPS 21 */
dbfbe717 171 pps_payload->initial_scale_value =
a408c857
MN
172 dsc_cfg->initial_scale_value;
173
174 /* PPS 22, 23 */
dbfbe717 175 pps_payload->scale_increment_interval =
a408c857
MN
176 cpu_to_be16(dsc_cfg->scale_increment_interval);
177
178 /* PPS 24 */
dbfbe717 179 pps_payload->scale_decrement_interval_high =
a408c857
MN
180 ((dsc_cfg->scale_decrement_interval &
181 DSC_PPS_SCALE_DEC_INT_HIGH_MASK) >>
182 DSC_PPS_MSB_SHIFT);
183
184 /* PPS 25 */
dbfbe717 185 pps_payload->scale_decrement_interval_low =
a408c857
MN
186 (dsc_cfg->scale_decrement_interval & DSC_PPS_LSB_MASK);
187
188 /* PPS 26[7:0], PPS 27[7:5] RESERVED */
189
190 /* PPS 27 */
dbfbe717 191 pps_payload->first_line_bpg_offset =
a408c857
MN
192 dsc_cfg->first_line_bpg_offset;
193
194 /* PPS 28, 29 */
dbfbe717 195 pps_payload->nfl_bpg_offset =
a408c857
MN
196 cpu_to_be16(dsc_cfg->nfl_bpg_offset);
197
198 /* PPS 30, 31 */
dbfbe717 199 pps_payload->slice_bpg_offset =
a408c857
MN
200 cpu_to_be16(dsc_cfg->slice_bpg_offset);
201
202 /* PPS 32, 33 */
dbfbe717 203 pps_payload->initial_offset =
a408c857
MN
204 cpu_to_be16(dsc_cfg->initial_offset);
205
206 /* PPS 34, 35 */
dbfbe717 207 pps_payload->final_offset = cpu_to_be16(dsc_cfg->final_offset);
a408c857
MN
208
209 /* PPS 36 */
dbfbe717 210 pps_payload->flatness_min_qp = dsc_cfg->flatness_min_qp;
a408c857
MN
211
212 /* PPS 37 */
dbfbe717 213 pps_payload->flatness_max_qp = dsc_cfg->flatness_max_qp;
a408c857
MN
214
215 /* PPS 38, 39 */
1f22ed36 216 pps_payload->rc_model_size = cpu_to_be16(dsc_cfg->rc_model_size);
a408c857
MN
217
218 /* PPS 40 */
dbfbe717 219 pps_payload->rc_edge_factor = DSC_RC_EDGE_FACTOR_CONST;
a408c857
MN
220
221 /* PPS 41 */
dbfbe717 222 pps_payload->rc_quant_incr_limit0 =
a408c857
MN
223 dsc_cfg->rc_quant_incr_limit0;
224
225 /* PPS 42 */
dbfbe717 226 pps_payload->rc_quant_incr_limit1 =
a408c857
MN
227 dsc_cfg->rc_quant_incr_limit1;
228
229 /* PPS 43 */
dbfbe717 230 pps_payload->rc_tgt_offset = DSC_RC_TGT_OFFSET_LO_CONST |
a408c857
MN
231 DSC_RC_TGT_OFFSET_HI_CONST << DSC_PPS_RC_TGT_OFFSET_HI_SHIFT;
232
233 /* PPS 44 - 57 */
234 for (i = 0; i < DSC_NUM_BUF_RANGES - 1; i++)
dbfbe717 235 pps_payload->rc_buf_thresh[i] =
a408c857
MN
236 dsc_cfg->rc_buf_thresh[i];
237
238 /* PPS 58 - 87 */
239 /*
240 * For DSC sink programming the RC Range parameter fields
241 * are as follows: Min_qp[15:11], max_qp[10:6], offset[5:0]
242 */
243 for (i = 0; i < DSC_NUM_BUF_RANGES; i++) {
dbfbe717 244 pps_payload->rc_range_parameters[i] =
40d51c05
VS
245 cpu_to_be16((dsc_cfg->rc_range_params[i].range_min_qp <<
246 DSC_PPS_RC_RANGE_MINQP_SHIFT) |
247 (dsc_cfg->rc_range_params[i].range_max_qp <<
248 DSC_PPS_RC_RANGE_MAXQP_SHIFT) |
249 (dsc_cfg->rc_range_params[i].range_bpg_offset));
a408c857
MN
250 }
251
252 /* PPS 88 */
dbfbe717 253 pps_payload->native_422_420 = dsc_cfg->native_422 |
a408c857
MN
254 dsc_cfg->native_420 << DSC_PPS_NATIVE_420_SHIFT;
255
256 /* PPS 89 */
dbfbe717 257 pps_payload->second_line_bpg_offset =
a408c857
MN
258 dsc_cfg->second_line_bpg_offset;
259
260 /* PPS 90, 91 */
dbfbe717 261 pps_payload->nsl_bpg_offset =
a408c857
MN
262 cpu_to_be16(dsc_cfg->nsl_bpg_offset);
263
264 /* PPS 92, 93 */
dbfbe717 265 pps_payload->second_line_offset_adj =
a408c857
MN
266 cpu_to_be16(dsc_cfg->second_line_offset_adj);
267
268 /* PPS 94 - 127 are O */
269}
dbfbe717 270EXPORT_SYMBOL(drm_dsc_pps_payload_pack);
dc43332b
DF
271
272/**
273 * drm_dsc_compute_rc_parameters() - Write rate control
274 * parameters to the dsc configuration defined in
06d7cecd 275 * &struct drm_dsc_config in accordance with the DSC 1.2
dc43332b
DF
276 * specification. Some configuration fields must be present
277 * beforehand.
278 *
279 * @vdsc_cfg:
280 * DSC Configuration data partially filled by driver
281 */
282int drm_dsc_compute_rc_parameters(struct drm_dsc_config *vdsc_cfg)
283{
284 unsigned long groups_per_line = 0;
285 unsigned long groups_total = 0;
286 unsigned long num_extra_mux_bits = 0;
287 unsigned long slice_bits = 0;
288 unsigned long hrd_delay = 0;
289 unsigned long final_scale = 0;
290 unsigned long rbs_min = 0;
291
06d7cecd
DF
292 if (vdsc_cfg->native_420 || vdsc_cfg->native_422) {
293 /* Number of groups used to code each line of a slice */
294 groups_per_line = DIV_ROUND_UP(vdsc_cfg->slice_width / 2,
295 DSC_RC_PIXELS_PER_GROUP);
296
297 /* chunksize in Bytes */
298 vdsc_cfg->slice_chunk_size = DIV_ROUND_UP(vdsc_cfg->slice_width / 2 *
299 vdsc_cfg->bits_per_pixel,
300 (8 * 16));
301 } else {
302 /* Number of groups used to code each line of a slice */
303 groups_per_line = DIV_ROUND_UP(vdsc_cfg->slice_width,
304 DSC_RC_PIXELS_PER_GROUP);
305
306 /* chunksize in Bytes */
307 vdsc_cfg->slice_chunk_size = DIV_ROUND_UP(vdsc_cfg->slice_width *
308 vdsc_cfg->bits_per_pixel,
309 (8 * 16));
310 }
dc43332b
DF
311
312 if (vdsc_cfg->convert_rgb)
313 num_extra_mux_bits = 3 * (vdsc_cfg->mux_word_size +
314 (4 * vdsc_cfg->bits_per_component + 4)
315 - 2);
06d7cecd
DF
316 else if (vdsc_cfg->native_422)
317 num_extra_mux_bits = 4 * vdsc_cfg->mux_word_size +
318 (4 * vdsc_cfg->bits_per_component + 4) +
319 3 * (4 * vdsc_cfg->bits_per_component) - 2;
dc43332b
DF
320 else
321 num_extra_mux_bits = 3 * vdsc_cfg->mux_word_size +
322 (4 * vdsc_cfg->bits_per_component + 4) +
323 2 * (4 * vdsc_cfg->bits_per_component) - 2;
324 /* Number of bits in one Slice */
325 slice_bits = 8 * vdsc_cfg->slice_chunk_size * vdsc_cfg->slice_height;
326
327 while ((num_extra_mux_bits > 0) &&
328 ((slice_bits - num_extra_mux_bits) % vdsc_cfg->mux_word_size))
329 num_extra_mux_bits--;
330
331 if (groups_per_line < vdsc_cfg->initial_scale_value - 8)
332 vdsc_cfg->initial_scale_value = groups_per_line + 8;
333
334 /* scale_decrement_interval calculation according to DSC spec 1.11 */
335 if (vdsc_cfg->initial_scale_value > 8)
336 vdsc_cfg->scale_decrement_interval = groups_per_line /
337 (vdsc_cfg->initial_scale_value - 8);
338 else
339 vdsc_cfg->scale_decrement_interval = DSC_SCALE_DECREMENT_INTERVAL_MAX;
340
341 vdsc_cfg->final_offset = vdsc_cfg->rc_model_size -
342 (vdsc_cfg->initial_xmit_delay *
343 vdsc_cfg->bits_per_pixel + 8) / 16 + num_extra_mux_bits;
344
345 if (vdsc_cfg->final_offset >= vdsc_cfg->rc_model_size) {
346 DRM_DEBUG_KMS("FinalOfs < RcModelSze for this InitialXmitDelay\n");
347 return -ERANGE;
348 }
349
350 final_scale = (vdsc_cfg->rc_model_size * 8) /
351 (vdsc_cfg->rc_model_size - vdsc_cfg->final_offset);
352 if (vdsc_cfg->slice_height > 1)
353 /*
354 * NflBpgOffset is 16 bit value with 11 fractional bits
355 * hence we multiply by 2^11 for preserving the
356 * fractional part
357 */
358 vdsc_cfg->nfl_bpg_offset = DIV_ROUND_UP((vdsc_cfg->first_line_bpg_offset << 11),
359 (vdsc_cfg->slice_height - 1));
360 else
361 vdsc_cfg->nfl_bpg_offset = 0;
362
dc43332b
DF
363 /* Number of groups used to code the entire slice */
364 groups_total = groups_per_line * vdsc_cfg->slice_height;
365
366 /* slice_bpg_offset is 16 bit value with 11 fractional bits */
367 vdsc_cfg->slice_bpg_offset = DIV_ROUND_UP(((vdsc_cfg->rc_model_size -
368 vdsc_cfg->initial_offset +
369 num_extra_mux_bits) << 11),
370 groups_total);
371
372 if (final_scale > 9) {
373 /*
374 * ScaleIncrementInterval =
375 * finaloffset/((NflBpgOffset + SliceBpgOffset)*8(finalscale - 1.125))
376 * as (NflBpgOffset + SliceBpgOffset) has 11 bit fractional value,
377 * we need divide by 2^11 from pstDscCfg values
378 */
379 vdsc_cfg->scale_increment_interval =
380 (vdsc_cfg->final_offset * (1 << 11)) /
381 ((vdsc_cfg->nfl_bpg_offset +
382 vdsc_cfg->slice_bpg_offset) *
383 (final_scale - 9));
384 } else {
385 /*
386 * If finalScaleValue is less than or equal to 9, a value of 0 should
387 * be used to disable the scale increment at the end of the slice
388 */
389 vdsc_cfg->scale_increment_interval = 0;
390 }
391
dc43332b
DF
392 /*
393 * DSC spec mentions that bits_per_pixel specifies the target
394 * bits/pixel (bpp) rate that is used by the encoder,
395 * in steps of 1/16 of a bit per pixel
396 */
397 rbs_min = vdsc_cfg->rc_model_size - vdsc_cfg->initial_offset +
398 DIV_ROUND_UP(vdsc_cfg->initial_xmit_delay *
399 vdsc_cfg->bits_per_pixel, 16) +
400 groups_per_line * vdsc_cfg->first_line_bpg_offset;
401
402 hrd_delay = DIV_ROUND_UP((rbs_min * 16), vdsc_cfg->bits_per_pixel);
403 vdsc_cfg->rc_bits = (hrd_delay * vdsc_cfg->bits_per_pixel) / 16;
404 vdsc_cfg->initial_dec_delay = hrd_delay - vdsc_cfg->initial_xmit_delay;
405
406 return 0;
407}
408EXPORT_SYMBOL(drm_dsc_compute_rc_parameters);