4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Daniel Vetter <daniel@ffwll.ch>
26 * Derived from Xorg ddx, xf86-video-intel, src/i830_video.c
29 #include <drm/i915_drm.h>
32 #include "intel_drv.h"
34 /* Limits for overlay size. According to intel doc, the real limits are:
35 * Y width: 4095, UV width (planar): 2047, Y height: 2047,
36 * UV width (planar): * 1023. But the xorg thinks 2048 for height and width. Use
37 * the mininum of both. */
38 #define IMAGE_MAX_WIDTH 2048
39 #define IMAGE_MAX_HEIGHT 2046 /* 2 * 1023 */
40 /* on 830 and 845 these large limits result in the card hanging */
41 #define IMAGE_MAX_WIDTH_LEGACY 1024
42 #define IMAGE_MAX_HEIGHT_LEGACY 1088
44 /* overlay register definitions */
46 #define OCMD_TILED_SURFACE (0x1<<19)
47 #define OCMD_MIRROR_MASK (0x3<<17)
48 #define OCMD_MIRROR_MODE (0x3<<17)
49 #define OCMD_MIRROR_HORIZONTAL (0x1<<17)
50 #define OCMD_MIRROR_VERTICAL (0x2<<17)
51 #define OCMD_MIRROR_BOTH (0x3<<17)
52 #define OCMD_BYTEORDER_MASK (0x3<<14) /* zero for YUYV or FOURCC YUY2 */
53 #define OCMD_UV_SWAP (0x1<<14) /* YVYU */
54 #define OCMD_Y_SWAP (0x2<<14) /* UYVY or FOURCC UYVY */
55 #define OCMD_Y_AND_UV_SWAP (0x3<<14) /* VYUY */
56 #define OCMD_SOURCE_FORMAT_MASK (0xf<<10)
57 #define OCMD_RGB_888 (0x1<<10) /* not in i965 Intel docs */
58 #define OCMD_RGB_555 (0x2<<10) /* not in i965 Intel docs */
59 #define OCMD_RGB_565 (0x3<<10) /* not in i965 Intel docs */
60 #define OCMD_YUV_422_PACKED (0x8<<10)
61 #define OCMD_YUV_411_PACKED (0x9<<10) /* not in i965 Intel docs */
62 #define OCMD_YUV_420_PLANAR (0xc<<10)
63 #define OCMD_YUV_422_PLANAR (0xd<<10)
64 #define OCMD_YUV_410_PLANAR (0xe<<10) /* also 411 */
65 #define OCMD_TVSYNCFLIP_PARITY (0x1<<9)
66 #define OCMD_TVSYNCFLIP_ENABLE (0x1<<7)
67 #define OCMD_BUF_TYPE_MASK (0x1<<5)
68 #define OCMD_BUF_TYPE_FRAME (0x0<<5)
69 #define OCMD_BUF_TYPE_FIELD (0x1<<5)
70 #define OCMD_TEST_MODE (0x1<<4)
71 #define OCMD_BUFFER_SELECT (0x3<<2)
72 #define OCMD_BUFFER0 (0x0<<2)
73 #define OCMD_BUFFER1 (0x1<<2)
74 #define OCMD_FIELD_SELECT (0x1<<2)
75 #define OCMD_FIELD0 (0x0<<1)
76 #define OCMD_FIELD1 (0x1<<1)
77 #define OCMD_ENABLE (0x1<<0)
79 /* OCONFIG register */
80 #define OCONF_PIPE_MASK (0x1<<18)
81 #define OCONF_PIPE_A (0x0<<18)
82 #define OCONF_PIPE_B (0x1<<18)
83 #define OCONF_GAMMA2_ENABLE (0x1<<16)
84 #define OCONF_CSC_MODE_BT601 (0x0<<5)
85 #define OCONF_CSC_MODE_BT709 (0x1<<5)
86 #define OCONF_CSC_BYPASS (0x1<<4)
87 #define OCONF_CC_OUT_8BIT (0x1<<3)
88 #define OCONF_TEST_MODE (0x1<<2)
89 #define OCONF_THREE_LINE_BUFFER (0x1<<0)
90 #define OCONF_TWO_LINE_BUFFER (0x0<<0)
92 /* DCLRKM (dst-key) register */
93 #define DST_KEY_ENABLE (0x1<<31)
94 #define CLK_RGB24_MASK 0x0
95 #define CLK_RGB16_MASK 0x070307
96 #define CLK_RGB15_MASK 0x070707
97 #define CLK_RGB8I_MASK 0xffffff
99 #define RGB16_TO_COLORKEY(c) \
100 (((c & 0xF800) << 8) | ((c & 0x07E0) << 5) | ((c & 0x001F) << 3))
101 #define RGB15_TO_COLORKEY(c) \
102 (((c & 0x7c00) << 9) | ((c & 0x03E0) << 6) | ((c & 0x001F) << 3))
104 /* overlay flip addr flag */
105 #define OFC_UPDATE 0x1
107 /* polyphase filter coefficients */
108 #define N_HORIZ_Y_TAPS 5
109 #define N_VERT_Y_TAPS 3
110 #define N_HORIZ_UV_TAPS 3
111 #define N_VERT_UV_TAPS 3
115 /* memory bufferd overlay registers */
116 struct overlay_registers {
144 u32 RESERVED1; /* 0x6C */
157 u32 FASTHSCALE; /* 0xA0 */
158 u32 UVSCALEV; /* 0xA4 */
159 u32 RESERVEDC[(0x200 - 0xA8) / 4]; /* 0xA8 - 0x1FC */
160 u16 Y_VCOEFS[N_VERT_Y_TAPS * N_PHASES]; /* 0x200 */
161 u16 RESERVEDD[0x100 / 2 - N_VERT_Y_TAPS * N_PHASES];
162 u16 Y_HCOEFS[N_HORIZ_Y_TAPS * N_PHASES]; /* 0x300 */
163 u16 RESERVEDE[0x200 / 2 - N_HORIZ_Y_TAPS * N_PHASES];
164 u16 UV_VCOEFS[N_VERT_UV_TAPS * N_PHASES]; /* 0x500 */
165 u16 RESERVEDF[0x100 / 2 - N_VERT_UV_TAPS * N_PHASES];
166 u16 UV_HCOEFS[N_HORIZ_UV_TAPS * N_PHASES]; /* 0x600 */
167 u16 RESERVEDG[0x100 / 2 - N_HORIZ_UV_TAPS * N_PHASES];
170 struct intel_overlay {
171 struct drm_device *dev;
172 struct intel_crtc *crtc;
173 struct drm_i915_gem_object *vid_bo;
174 struct drm_i915_gem_object *old_vid_bo;
177 u32 pfit_vscale_ratio; /* shifted-point number, (1<<12) == 1.0 */
179 u32 color_key_enabled:1;
180 u32 brightness, contrast, saturation;
181 u32 old_xscale, old_yscale;
182 /* register access */
184 struct drm_i915_gem_object *reg_bo;
186 struct drm_i915_gem_request *last_flip_req;
187 void (*flip_tail)(struct intel_overlay *);
190 static struct overlay_registers __iomem *
191 intel_overlay_map_regs(struct intel_overlay *overlay)
193 struct drm_i915_private *dev_priv = overlay->dev->dev_private;
194 struct overlay_registers __iomem *regs;
196 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
197 regs = (struct overlay_registers __iomem *)overlay->reg_bo->phys_handle->vaddr;
199 regs = io_mapping_map_wc(dev_priv->gtt.mappable,
200 i915_gem_obj_ggtt_offset(overlay->reg_bo));
205 static void intel_overlay_unmap_regs(struct intel_overlay *overlay,
206 struct overlay_registers __iomem *regs)
208 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
209 io_mapping_unmap(regs);
212 static int intel_overlay_do_wait_request(struct intel_overlay *overlay,
213 struct drm_i915_gem_request *req,
214 void (*tail)(struct intel_overlay *))
218 WARN_ON(overlay->last_flip_req);
219 i915_gem_request_assign(&overlay->last_flip_req, req);
220 i915_add_request(req);
222 overlay->flip_tail = tail;
223 ret = i915_wait_request(overlay->last_flip_req);
227 i915_gem_request_assign(&overlay->last_flip_req, NULL);
231 /* overlay needs to be disable in OCMD reg */
232 static int intel_overlay_on(struct intel_overlay *overlay)
234 struct drm_device *dev = overlay->dev;
235 struct drm_i915_private *dev_priv = dev->dev_private;
236 struct intel_engine_cs *engine = &dev_priv->engine[RCS];
237 struct drm_i915_gem_request *req;
240 WARN_ON(overlay->active);
241 WARN_ON(IS_I830(dev) && !(dev_priv->quirks & QUIRK_PIPEA_FORCE));
243 req = i915_gem_request_alloc(engine, NULL);
247 ret = intel_ring_begin(req, 4);
249 i915_gem_request_cancel(req);
253 overlay->active = true;
255 intel_ring_emit(engine, MI_OVERLAY_FLIP | MI_OVERLAY_ON);
256 intel_ring_emit(engine, overlay->flip_addr | OFC_UPDATE);
257 intel_ring_emit(engine, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
258 intel_ring_emit(engine, MI_NOOP);
259 intel_ring_advance(engine);
261 return intel_overlay_do_wait_request(overlay, req, NULL);
264 /* overlay needs to be enabled in OCMD reg */
265 static int intel_overlay_continue(struct intel_overlay *overlay,
266 bool load_polyphase_filter)
268 struct drm_device *dev = overlay->dev;
269 struct drm_i915_private *dev_priv = dev->dev_private;
270 struct intel_engine_cs *engine = &dev_priv->engine[RCS];
271 struct drm_i915_gem_request *req;
272 u32 flip_addr = overlay->flip_addr;
276 WARN_ON(!overlay->active);
278 if (load_polyphase_filter)
279 flip_addr |= OFC_UPDATE;
281 /* check for underruns */
282 tmp = I915_READ(DOVSTA);
284 DRM_DEBUG("overlay underrun, DOVSTA: %x\n", tmp);
286 req = i915_gem_request_alloc(engine, NULL);
290 ret = intel_ring_begin(req, 2);
292 i915_gem_request_cancel(req);
296 intel_ring_emit(engine, MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
297 intel_ring_emit(engine, flip_addr);
298 intel_ring_advance(engine);
300 WARN_ON(overlay->last_flip_req);
301 i915_gem_request_assign(&overlay->last_flip_req, req);
302 i915_add_request(req);
307 static void intel_overlay_release_old_vid_tail(struct intel_overlay *overlay)
309 struct drm_i915_gem_object *obj = overlay->old_vid_bo;
311 i915_gem_object_ggtt_unpin(obj);
312 drm_gem_object_unreference(&obj->base);
314 overlay->old_vid_bo = NULL;
317 static void intel_overlay_off_tail(struct intel_overlay *overlay)
319 struct drm_i915_gem_object *obj = overlay->vid_bo;
321 /* never have the overlay hw on without showing a frame */
325 i915_gem_object_ggtt_unpin(obj);
326 drm_gem_object_unreference(&obj->base);
327 overlay->vid_bo = NULL;
329 overlay->crtc->overlay = NULL;
330 overlay->crtc = NULL;
331 overlay->active = false;
334 /* overlay needs to be disabled in OCMD reg */
335 static int intel_overlay_off(struct intel_overlay *overlay)
337 struct drm_device *dev = overlay->dev;
338 struct drm_i915_private *dev_priv = dev->dev_private;
339 struct intel_engine_cs *engine = &dev_priv->engine[RCS];
340 struct drm_i915_gem_request *req;
341 u32 flip_addr = overlay->flip_addr;
344 WARN_ON(!overlay->active);
346 /* According to intel docs the overlay hw may hang (when switching
347 * off) without loading the filter coeffs. It is however unclear whether
348 * this applies to the disabling of the overlay or to the switching off
349 * of the hw. Do it in both cases */
350 flip_addr |= OFC_UPDATE;
352 req = i915_gem_request_alloc(engine, NULL);
356 ret = intel_ring_begin(req, 6);
358 i915_gem_request_cancel(req);
362 /* wait for overlay to go idle */
363 intel_ring_emit(engine, MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
364 intel_ring_emit(engine, flip_addr);
365 intel_ring_emit(engine, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
366 /* turn overlay off */
368 /* Workaround: Don't disable the overlay fully, since otherwise
369 * it dies on the next OVERLAY_ON cmd. */
370 intel_ring_emit(engine, MI_NOOP);
371 intel_ring_emit(engine, MI_NOOP);
372 intel_ring_emit(engine, MI_NOOP);
374 intel_ring_emit(engine, MI_OVERLAY_FLIP | MI_OVERLAY_OFF);
375 intel_ring_emit(engine, flip_addr);
376 intel_ring_emit(engine,
377 MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
379 intel_ring_advance(engine);
381 return intel_overlay_do_wait_request(overlay, req, intel_overlay_off_tail);
384 /* recover from an interruption due to a signal
385 * We have to be careful not to repeat work forever an make forward progess. */
386 static int intel_overlay_recover_from_interrupt(struct intel_overlay *overlay)
390 if (overlay->last_flip_req == NULL)
393 ret = i915_wait_request(overlay->last_flip_req);
397 if (overlay->flip_tail)
398 overlay->flip_tail(overlay);
400 i915_gem_request_assign(&overlay->last_flip_req, NULL);
404 /* Wait for pending overlay flip and release old frame.
405 * Needs to be called before the overlay register are changed
406 * via intel_overlay_(un)map_regs
408 static int intel_overlay_release_old_vid(struct intel_overlay *overlay)
410 struct drm_device *dev = overlay->dev;
411 struct drm_i915_private *dev_priv = dev->dev_private;
412 struct intel_engine_cs *engine = &dev_priv->engine[RCS];
415 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
417 /* Only wait if there is actually an old frame to release to
418 * guarantee forward progress.
420 if (!overlay->old_vid_bo)
423 if (I915_READ(ISR) & I915_OVERLAY_PLANE_FLIP_PENDING_INTERRUPT) {
424 /* synchronous slowpath */
425 struct drm_i915_gem_request *req;
427 req = i915_gem_request_alloc(engine, NULL);
431 ret = intel_ring_begin(req, 2);
433 i915_gem_request_cancel(req);
437 intel_ring_emit(engine,
438 MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
439 intel_ring_emit(engine, MI_NOOP);
440 intel_ring_advance(engine);
442 ret = intel_overlay_do_wait_request(overlay, req,
443 intel_overlay_release_old_vid_tail);
448 intel_overlay_release_old_vid_tail(overlay);
451 i915_gem_track_fb(overlay->old_vid_bo, NULL,
452 INTEL_FRONTBUFFER_OVERLAY(overlay->crtc->pipe));
456 void intel_overlay_reset(struct drm_i915_private *dev_priv)
458 struct intel_overlay *overlay = dev_priv->overlay;
463 intel_overlay_release_old_vid(overlay);
465 overlay->last_flip_req = NULL;
466 overlay->old_xscale = 0;
467 overlay->old_yscale = 0;
468 overlay->crtc = NULL;
469 overlay->active = false;
472 struct put_image_params {
489 static int packed_depth_bytes(u32 format)
491 switch (format & I915_OVERLAY_DEPTH_MASK) {
492 case I915_OVERLAY_YUV422:
494 case I915_OVERLAY_YUV411:
495 /* return 6; not implemented */
501 static int packed_width_bytes(u32 format, short width)
503 switch (format & I915_OVERLAY_DEPTH_MASK) {
504 case I915_OVERLAY_YUV422:
511 static int uv_hsubsampling(u32 format)
513 switch (format & I915_OVERLAY_DEPTH_MASK) {
514 case I915_OVERLAY_YUV422:
515 case I915_OVERLAY_YUV420:
517 case I915_OVERLAY_YUV411:
518 case I915_OVERLAY_YUV410:
525 static int uv_vsubsampling(u32 format)
527 switch (format & I915_OVERLAY_DEPTH_MASK) {
528 case I915_OVERLAY_YUV420:
529 case I915_OVERLAY_YUV410:
531 case I915_OVERLAY_YUV422:
532 case I915_OVERLAY_YUV411:
539 static u32 calc_swidthsw(struct drm_device *dev, u32 offset, u32 width)
541 u32 mask, shift, ret;
549 ret = ((offset + width + mask) >> shift) - (offset >> shift);
556 static const u16 y_static_hcoeffs[N_HORIZ_Y_TAPS * N_PHASES] = {
557 0x3000, 0xb4a0, 0x1930, 0x1920, 0xb4a0,
558 0x3000, 0xb500, 0x19d0, 0x1880, 0xb440,
559 0x3000, 0xb540, 0x1a88, 0x2f80, 0xb3e0,
560 0x3000, 0xb580, 0x1b30, 0x2e20, 0xb380,
561 0x3000, 0xb5c0, 0x1bd8, 0x2cc0, 0xb320,
562 0x3020, 0xb5e0, 0x1c60, 0x2b80, 0xb2c0,
563 0x3020, 0xb5e0, 0x1cf8, 0x2a20, 0xb260,
564 0x3020, 0xb5e0, 0x1d80, 0x28e0, 0xb200,
565 0x3020, 0xb5c0, 0x1e08, 0x3f40, 0xb1c0,
566 0x3020, 0xb580, 0x1e78, 0x3ce0, 0xb160,
567 0x3040, 0xb520, 0x1ed8, 0x3aa0, 0xb120,
568 0x3040, 0xb4a0, 0x1f30, 0x3880, 0xb0e0,
569 0x3040, 0xb400, 0x1f78, 0x3680, 0xb0a0,
570 0x3020, 0xb340, 0x1fb8, 0x34a0, 0xb060,
571 0x3020, 0xb240, 0x1fe0, 0x32e0, 0xb040,
572 0x3020, 0xb140, 0x1ff8, 0x3160, 0xb020,
573 0xb000, 0x3000, 0x0800, 0x3000, 0xb000
576 static const u16 uv_static_hcoeffs[N_HORIZ_UV_TAPS * N_PHASES] = {
577 0x3000, 0x1800, 0x1800, 0xb000, 0x18d0, 0x2e60,
578 0xb000, 0x1990, 0x2ce0, 0xb020, 0x1a68, 0x2b40,
579 0xb040, 0x1b20, 0x29e0, 0xb060, 0x1bd8, 0x2880,
580 0xb080, 0x1c88, 0x3e60, 0xb0a0, 0x1d28, 0x3c00,
581 0xb0c0, 0x1db8, 0x39e0, 0xb0e0, 0x1e40, 0x37e0,
582 0xb100, 0x1eb8, 0x3620, 0xb100, 0x1f18, 0x34a0,
583 0xb100, 0x1f68, 0x3360, 0xb0e0, 0x1fa8, 0x3240,
584 0xb0c0, 0x1fe0, 0x3140, 0xb060, 0x1ff0, 0x30a0,
585 0x3000, 0x0800, 0x3000
588 static void update_polyphase_filter(struct overlay_registers __iomem *regs)
590 memcpy_toio(regs->Y_HCOEFS, y_static_hcoeffs, sizeof(y_static_hcoeffs));
591 memcpy_toio(regs->UV_HCOEFS, uv_static_hcoeffs,
592 sizeof(uv_static_hcoeffs));
595 static bool update_scaling_factors(struct intel_overlay *overlay,
596 struct overlay_registers __iomem *regs,
597 struct put_image_params *params)
599 /* fixed point with a 12 bit shift */
600 u32 xscale, yscale, xscale_UV, yscale_UV;
602 #define FRACT_MASK 0xfff
603 bool scale_changed = false;
604 int uv_hscale = uv_hsubsampling(params->format);
605 int uv_vscale = uv_vsubsampling(params->format);
607 if (params->dst_w > 1)
608 xscale = ((params->src_scan_w - 1) << FP_SHIFT)
611 xscale = 1 << FP_SHIFT;
613 if (params->dst_h > 1)
614 yscale = ((params->src_scan_h - 1) << FP_SHIFT)
617 yscale = 1 << FP_SHIFT;
619 /*if (params->format & I915_OVERLAY_YUV_PLANAR) {*/
620 xscale_UV = xscale/uv_hscale;
621 yscale_UV = yscale/uv_vscale;
622 /* make the Y scale to UV scale ratio an exact multiply */
623 xscale = xscale_UV * uv_hscale;
624 yscale = yscale_UV * uv_vscale;
630 if (xscale != overlay->old_xscale || yscale != overlay->old_yscale)
631 scale_changed = true;
632 overlay->old_xscale = xscale;
633 overlay->old_yscale = yscale;
635 iowrite32(((yscale & FRACT_MASK) << 20) |
636 ((xscale >> FP_SHIFT) << 16) |
637 ((xscale & FRACT_MASK) << 3),
640 iowrite32(((yscale_UV & FRACT_MASK) << 20) |
641 ((xscale_UV >> FP_SHIFT) << 16) |
642 ((xscale_UV & FRACT_MASK) << 3),
645 iowrite32((((yscale >> FP_SHIFT) << 16) |
646 ((yscale_UV >> FP_SHIFT) << 0)),
650 update_polyphase_filter(regs);
652 return scale_changed;
655 static void update_colorkey(struct intel_overlay *overlay,
656 struct overlay_registers __iomem *regs)
658 u32 key = overlay->color_key;
662 if (overlay->color_key_enabled)
663 flags |= DST_KEY_ENABLE;
665 switch (overlay->crtc->base.primary->fb->bits_per_pixel) {
668 flags |= CLK_RGB8I_MASK;
672 if (overlay->crtc->base.primary->fb->depth == 15) {
673 key = RGB15_TO_COLORKEY(key);
674 flags |= CLK_RGB15_MASK;
676 key = RGB16_TO_COLORKEY(key);
677 flags |= CLK_RGB16_MASK;
683 flags |= CLK_RGB24_MASK;
687 iowrite32(key, ®s->DCLRKV);
688 iowrite32(flags, ®s->DCLRKM);
691 static u32 overlay_cmd_reg(struct put_image_params *params)
693 u32 cmd = OCMD_ENABLE | OCMD_BUF_TYPE_FRAME | OCMD_BUFFER0;
695 if (params->format & I915_OVERLAY_YUV_PLANAR) {
696 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
697 case I915_OVERLAY_YUV422:
698 cmd |= OCMD_YUV_422_PLANAR;
700 case I915_OVERLAY_YUV420:
701 cmd |= OCMD_YUV_420_PLANAR;
703 case I915_OVERLAY_YUV411:
704 case I915_OVERLAY_YUV410:
705 cmd |= OCMD_YUV_410_PLANAR;
708 } else { /* YUV packed */
709 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
710 case I915_OVERLAY_YUV422:
711 cmd |= OCMD_YUV_422_PACKED;
713 case I915_OVERLAY_YUV411:
714 cmd |= OCMD_YUV_411_PACKED;
718 switch (params->format & I915_OVERLAY_SWAP_MASK) {
719 case I915_OVERLAY_NO_SWAP:
721 case I915_OVERLAY_UV_SWAP:
724 case I915_OVERLAY_Y_SWAP:
727 case I915_OVERLAY_Y_AND_UV_SWAP:
728 cmd |= OCMD_Y_AND_UV_SWAP;
736 static int intel_overlay_do_put_image(struct intel_overlay *overlay,
737 struct drm_i915_gem_object *new_bo,
738 struct put_image_params *params)
741 struct overlay_registers __iomem *regs;
742 bool scale_changed = false;
743 struct drm_device *dev = overlay->dev;
744 u32 swidth, swidthsw, sheight, ostride;
745 enum pipe pipe = overlay->crtc->pipe;
747 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
748 WARN_ON(!drm_modeset_is_locked(&dev->mode_config.connection_mutex));
750 ret = intel_overlay_release_old_vid(overlay);
754 ret = i915_gem_object_pin_to_display_plane(new_bo, 0,
755 &i915_ggtt_view_normal);
759 ret = i915_gem_object_put_fence(new_bo);
763 if (!overlay->active) {
765 regs = intel_overlay_map_regs(overlay);
770 oconfig = OCONF_CC_OUT_8BIT;
771 if (IS_GEN4(overlay->dev))
772 oconfig |= OCONF_CSC_MODE_BT709;
773 oconfig |= pipe == 0 ?
774 OCONF_PIPE_A : OCONF_PIPE_B;
775 iowrite32(oconfig, ®s->OCONFIG);
776 intel_overlay_unmap_regs(overlay, regs);
778 ret = intel_overlay_on(overlay);
783 regs = intel_overlay_map_regs(overlay);
789 iowrite32((params->dst_y << 16) | params->dst_x, ®s->DWINPOS);
790 iowrite32((params->dst_h << 16) | params->dst_w, ®s->DWINSZ);
792 if (params->format & I915_OVERLAY_YUV_PACKED)
793 tmp_width = packed_width_bytes(params->format, params->src_w);
795 tmp_width = params->src_w;
797 swidth = params->src_w;
798 swidthsw = calc_swidthsw(overlay->dev, params->offset_Y, tmp_width);
799 sheight = params->src_h;
800 iowrite32(i915_gem_obj_ggtt_offset(new_bo) + params->offset_Y, ®s->OBUF_0Y);
801 ostride = params->stride_Y;
803 if (params->format & I915_OVERLAY_YUV_PLANAR) {
804 int uv_hscale = uv_hsubsampling(params->format);
805 int uv_vscale = uv_vsubsampling(params->format);
807 swidth |= (params->src_w/uv_hscale) << 16;
808 tmp_U = calc_swidthsw(overlay->dev, params->offset_U,
809 params->src_w/uv_hscale);
810 tmp_V = calc_swidthsw(overlay->dev, params->offset_V,
811 params->src_w/uv_hscale);
812 swidthsw |= max_t(u32, tmp_U, tmp_V) << 16;
813 sheight |= (params->src_h/uv_vscale) << 16;
814 iowrite32(i915_gem_obj_ggtt_offset(new_bo) + params->offset_U, ®s->OBUF_0U);
815 iowrite32(i915_gem_obj_ggtt_offset(new_bo) + params->offset_V, ®s->OBUF_0V);
816 ostride |= params->stride_UV << 16;
819 iowrite32(swidth, ®s->SWIDTH);
820 iowrite32(swidthsw, ®s->SWIDTHSW);
821 iowrite32(sheight, ®s->SHEIGHT);
822 iowrite32(ostride, ®s->OSTRIDE);
824 scale_changed = update_scaling_factors(overlay, regs, params);
826 update_colorkey(overlay, regs);
828 iowrite32(overlay_cmd_reg(params), ®s->OCMD);
830 intel_overlay_unmap_regs(overlay, regs);
832 ret = intel_overlay_continue(overlay, scale_changed);
836 i915_gem_track_fb(overlay->vid_bo, new_bo,
837 INTEL_FRONTBUFFER_OVERLAY(pipe));
839 overlay->old_vid_bo = overlay->vid_bo;
840 overlay->vid_bo = new_bo;
842 intel_frontbuffer_flip(dev,
843 INTEL_FRONTBUFFER_OVERLAY(pipe));
848 i915_gem_object_ggtt_unpin(new_bo);
852 int intel_overlay_switch_off(struct intel_overlay *overlay)
854 struct overlay_registers __iomem *regs;
855 struct drm_device *dev = overlay->dev;
858 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
859 WARN_ON(!drm_modeset_is_locked(&dev->mode_config.connection_mutex));
861 ret = intel_overlay_recover_from_interrupt(overlay);
865 if (!overlay->active)
868 ret = intel_overlay_release_old_vid(overlay);
872 regs = intel_overlay_map_regs(overlay);
873 iowrite32(0, ®s->OCMD);
874 intel_overlay_unmap_regs(overlay, regs);
876 ret = intel_overlay_off(overlay);
880 intel_overlay_off_tail(overlay);
884 static int check_overlay_possible_on_crtc(struct intel_overlay *overlay,
885 struct intel_crtc *crtc)
890 /* can't use the overlay with double wide pipe */
891 if (crtc->config->double_wide)
897 static void update_pfit_vscale_ratio(struct intel_overlay *overlay)
899 struct drm_device *dev = overlay->dev;
900 struct drm_i915_private *dev_priv = dev->dev_private;
901 u32 pfit_control = I915_READ(PFIT_CONTROL);
904 /* XXX: This is not the same logic as in the xorg driver, but more in
905 * line with the intel documentation for the i965
907 if (INTEL_INFO(dev)->gen >= 4) {
908 /* on i965 use the PGM reg to read out the autoscaler values */
909 ratio = I915_READ(PFIT_PGM_RATIOS) >> PFIT_VERT_SCALE_SHIFT_965;
911 if (pfit_control & VERT_AUTO_SCALE)
912 ratio = I915_READ(PFIT_AUTO_RATIOS);
914 ratio = I915_READ(PFIT_PGM_RATIOS);
915 ratio >>= PFIT_VERT_SCALE_SHIFT;
918 overlay->pfit_vscale_ratio = ratio;
921 static int check_overlay_dst(struct intel_overlay *overlay,
922 struct drm_intel_overlay_put_image *rec)
924 struct drm_display_mode *mode = &overlay->crtc->base.mode;
926 if (rec->dst_x < mode->hdisplay &&
927 rec->dst_x + rec->dst_width <= mode->hdisplay &&
928 rec->dst_y < mode->vdisplay &&
929 rec->dst_y + rec->dst_height <= mode->vdisplay)
935 static int check_overlay_scaling(struct put_image_params *rec)
939 /* downscaling limit is 8.0 */
940 tmp = ((rec->src_scan_h << 16) / rec->dst_h) >> 16;
943 tmp = ((rec->src_scan_w << 16) / rec->dst_w) >> 16;
950 static int check_overlay_src(struct drm_device *dev,
951 struct drm_intel_overlay_put_image *rec,
952 struct drm_i915_gem_object *new_bo)
954 int uv_hscale = uv_hsubsampling(rec->flags);
955 int uv_vscale = uv_vsubsampling(rec->flags);
960 /* check src dimensions */
961 if (IS_845G(dev) || IS_I830(dev)) {
962 if (rec->src_height > IMAGE_MAX_HEIGHT_LEGACY ||
963 rec->src_width > IMAGE_MAX_WIDTH_LEGACY)
966 if (rec->src_height > IMAGE_MAX_HEIGHT ||
967 rec->src_width > IMAGE_MAX_WIDTH)
971 /* better safe than sorry, use 4 as the maximal subsampling ratio */
972 if (rec->src_height < N_VERT_Y_TAPS*4 ||
973 rec->src_width < N_HORIZ_Y_TAPS*4)
976 /* check alignment constraints */
977 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
978 case I915_OVERLAY_RGB:
979 /* not implemented */
982 case I915_OVERLAY_YUV_PACKED:
986 depth = packed_depth_bytes(rec->flags);
990 /* ignore UV planes */
994 /* check pixel alignment */
995 if (rec->offset_Y % depth)
999 case I915_OVERLAY_YUV_PLANAR:
1000 if (uv_vscale < 0 || uv_hscale < 0)
1002 /* no offset restrictions for planar formats */
1009 if (rec->src_width % uv_hscale)
1012 /* stride checking */
1013 if (IS_I830(dev) || IS_845G(dev))
1018 if (rec->stride_Y & stride_mask || rec->stride_UV & stride_mask)
1020 if (IS_GEN4(dev) && rec->stride_Y < 512)
1023 tmp = (rec->flags & I915_OVERLAY_TYPE_MASK) == I915_OVERLAY_YUV_PLANAR ?
1025 if (rec->stride_Y > tmp || rec->stride_UV > 2*1024)
1028 /* check buffer dimensions */
1029 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
1030 case I915_OVERLAY_RGB:
1031 case I915_OVERLAY_YUV_PACKED:
1032 /* always 4 Y values per depth pixels */
1033 if (packed_width_bytes(rec->flags, rec->src_width) > rec->stride_Y)
1036 tmp = rec->stride_Y*rec->src_height;
1037 if (rec->offset_Y + tmp > new_bo->base.size)
1041 case I915_OVERLAY_YUV_PLANAR:
1042 if (rec->src_width > rec->stride_Y)
1044 if (rec->src_width/uv_hscale > rec->stride_UV)
1047 tmp = rec->stride_Y * rec->src_height;
1048 if (rec->offset_Y + tmp > new_bo->base.size)
1051 tmp = rec->stride_UV * (rec->src_height / uv_vscale);
1052 if (rec->offset_U + tmp > new_bo->base.size ||
1053 rec->offset_V + tmp > new_bo->base.size)
1062 * Return the pipe currently connected to the panel fitter,
1063 * or -1 if the panel fitter is not present or not in use
1065 static int intel_panel_fitter_pipe(struct drm_device *dev)
1067 struct drm_i915_private *dev_priv = dev->dev_private;
1070 /* i830 doesn't have a panel fitter */
1071 if (INTEL_INFO(dev)->gen <= 3 && (IS_I830(dev) || !IS_MOBILE(dev)))
1074 pfit_control = I915_READ(PFIT_CONTROL);
1076 /* See if the panel fitter is in use */
1077 if ((pfit_control & PFIT_ENABLE) == 0)
1080 /* 965 can place panel fitter on either pipe */
1082 return (pfit_control >> 29) & 0x3;
1084 /* older chips can only use pipe 1 */
1088 int intel_overlay_put_image(struct drm_device *dev, void *data,
1089 struct drm_file *file_priv)
1091 struct drm_intel_overlay_put_image *put_image_rec = data;
1092 struct drm_i915_private *dev_priv = dev->dev_private;
1093 struct intel_overlay *overlay;
1094 struct drm_crtc *drmmode_crtc;
1095 struct intel_crtc *crtc;
1096 struct drm_i915_gem_object *new_bo;
1097 struct put_image_params *params;
1100 overlay = dev_priv->overlay;
1102 DRM_DEBUG("userspace bug: no overlay\n");
1106 if (!(put_image_rec->flags & I915_OVERLAY_ENABLE)) {
1107 drm_modeset_lock_all(dev);
1108 mutex_lock(&dev->struct_mutex);
1110 ret = intel_overlay_switch_off(overlay);
1112 mutex_unlock(&dev->struct_mutex);
1113 drm_modeset_unlock_all(dev);
1118 params = kmalloc(sizeof(*params), GFP_KERNEL);
1122 drmmode_crtc = drm_crtc_find(dev, put_image_rec->crtc_id);
1123 if (!drmmode_crtc) {
1127 crtc = to_intel_crtc(drmmode_crtc);
1129 new_bo = to_intel_bo(drm_gem_object_lookup(dev, file_priv,
1130 put_image_rec->bo_handle));
1131 if (&new_bo->base == NULL) {
1136 drm_modeset_lock_all(dev);
1137 mutex_lock(&dev->struct_mutex);
1139 if (new_bo->tiling_mode) {
1140 DRM_DEBUG_KMS("buffer used for overlay image can not be tiled\n");
1145 ret = intel_overlay_recover_from_interrupt(overlay);
1149 if (overlay->crtc != crtc) {
1150 struct drm_display_mode *mode = &crtc->base.mode;
1151 ret = intel_overlay_switch_off(overlay);
1155 ret = check_overlay_possible_on_crtc(overlay, crtc);
1159 overlay->crtc = crtc;
1160 crtc->overlay = overlay;
1162 /* line too wide, i.e. one-line-mode */
1163 if (mode->hdisplay > 1024 &&
1164 intel_panel_fitter_pipe(dev) == crtc->pipe) {
1165 overlay->pfit_active = true;
1166 update_pfit_vscale_ratio(overlay);
1168 overlay->pfit_active = false;
1171 ret = check_overlay_dst(overlay, put_image_rec);
1175 if (overlay->pfit_active) {
1176 params->dst_y = ((((u32)put_image_rec->dst_y) << 12) /
1177 overlay->pfit_vscale_ratio);
1178 /* shifting right rounds downwards, so add 1 */
1179 params->dst_h = ((((u32)put_image_rec->dst_height) << 12) /
1180 overlay->pfit_vscale_ratio) + 1;
1182 params->dst_y = put_image_rec->dst_y;
1183 params->dst_h = put_image_rec->dst_height;
1185 params->dst_x = put_image_rec->dst_x;
1186 params->dst_w = put_image_rec->dst_width;
1188 params->src_w = put_image_rec->src_width;
1189 params->src_h = put_image_rec->src_height;
1190 params->src_scan_w = put_image_rec->src_scan_width;
1191 params->src_scan_h = put_image_rec->src_scan_height;
1192 if (params->src_scan_h > params->src_h ||
1193 params->src_scan_w > params->src_w) {
1198 ret = check_overlay_src(dev, put_image_rec, new_bo);
1201 params->format = put_image_rec->flags & ~I915_OVERLAY_FLAGS_MASK;
1202 params->stride_Y = put_image_rec->stride_Y;
1203 params->stride_UV = put_image_rec->stride_UV;
1204 params->offset_Y = put_image_rec->offset_Y;
1205 params->offset_U = put_image_rec->offset_U;
1206 params->offset_V = put_image_rec->offset_V;
1208 /* Check scaling after src size to prevent a divide-by-zero. */
1209 ret = check_overlay_scaling(params);
1213 ret = intel_overlay_do_put_image(overlay, new_bo, params);
1217 mutex_unlock(&dev->struct_mutex);
1218 drm_modeset_unlock_all(dev);
1225 mutex_unlock(&dev->struct_mutex);
1226 drm_modeset_unlock_all(dev);
1227 drm_gem_object_unreference_unlocked(&new_bo->base);
1234 static void update_reg_attrs(struct intel_overlay *overlay,
1235 struct overlay_registers __iomem *regs)
1237 iowrite32((overlay->contrast << 18) | (overlay->brightness & 0xff),
1239 iowrite32(overlay->saturation, ®s->OCLRC1);
1242 static bool check_gamma_bounds(u32 gamma1, u32 gamma2)
1246 if (gamma1 & 0xff000000 || gamma2 & 0xff000000)
1249 for (i = 0; i < 3; i++) {
1250 if (((gamma1 >> i*8) & 0xff) >= ((gamma2 >> i*8) & 0xff))
1257 static bool check_gamma5_errata(u32 gamma5)
1261 for (i = 0; i < 3; i++) {
1262 if (((gamma5 >> i*8) & 0xff) == 0x80)
1269 static int check_gamma(struct drm_intel_overlay_attrs *attrs)
1271 if (!check_gamma_bounds(0, attrs->gamma0) ||
1272 !check_gamma_bounds(attrs->gamma0, attrs->gamma1) ||
1273 !check_gamma_bounds(attrs->gamma1, attrs->gamma2) ||
1274 !check_gamma_bounds(attrs->gamma2, attrs->gamma3) ||
1275 !check_gamma_bounds(attrs->gamma3, attrs->gamma4) ||
1276 !check_gamma_bounds(attrs->gamma4, attrs->gamma5) ||
1277 !check_gamma_bounds(attrs->gamma5, 0x00ffffff))
1280 if (!check_gamma5_errata(attrs->gamma5))
1286 int intel_overlay_attrs(struct drm_device *dev, void *data,
1287 struct drm_file *file_priv)
1289 struct drm_intel_overlay_attrs *attrs = data;
1290 struct drm_i915_private *dev_priv = dev->dev_private;
1291 struct intel_overlay *overlay;
1292 struct overlay_registers __iomem *regs;
1295 overlay = dev_priv->overlay;
1297 DRM_DEBUG("userspace bug: no overlay\n");
1301 drm_modeset_lock_all(dev);
1302 mutex_lock(&dev->struct_mutex);
1305 if (!(attrs->flags & I915_OVERLAY_UPDATE_ATTRS)) {
1306 attrs->color_key = overlay->color_key;
1307 attrs->brightness = overlay->brightness;
1308 attrs->contrast = overlay->contrast;
1309 attrs->saturation = overlay->saturation;
1311 if (!IS_GEN2(dev)) {
1312 attrs->gamma0 = I915_READ(OGAMC0);
1313 attrs->gamma1 = I915_READ(OGAMC1);
1314 attrs->gamma2 = I915_READ(OGAMC2);
1315 attrs->gamma3 = I915_READ(OGAMC3);
1316 attrs->gamma4 = I915_READ(OGAMC4);
1317 attrs->gamma5 = I915_READ(OGAMC5);
1320 if (attrs->brightness < -128 || attrs->brightness > 127)
1322 if (attrs->contrast > 255)
1324 if (attrs->saturation > 1023)
1327 overlay->color_key = attrs->color_key;
1328 overlay->brightness = attrs->brightness;
1329 overlay->contrast = attrs->contrast;
1330 overlay->saturation = attrs->saturation;
1332 regs = intel_overlay_map_regs(overlay);
1338 update_reg_attrs(overlay, regs);
1340 intel_overlay_unmap_regs(overlay, regs);
1342 if (attrs->flags & I915_OVERLAY_UPDATE_GAMMA) {
1346 if (overlay->active) {
1351 ret = check_gamma(attrs);
1355 I915_WRITE(OGAMC0, attrs->gamma0);
1356 I915_WRITE(OGAMC1, attrs->gamma1);
1357 I915_WRITE(OGAMC2, attrs->gamma2);
1358 I915_WRITE(OGAMC3, attrs->gamma3);
1359 I915_WRITE(OGAMC4, attrs->gamma4);
1360 I915_WRITE(OGAMC5, attrs->gamma5);
1363 overlay->color_key_enabled = (attrs->flags & I915_OVERLAY_DISABLE_DEST_COLORKEY) == 0;
1367 mutex_unlock(&dev->struct_mutex);
1368 drm_modeset_unlock_all(dev);
1373 void intel_setup_overlay(struct drm_device *dev)
1375 struct drm_i915_private *dev_priv = dev->dev_private;
1376 struct intel_overlay *overlay;
1377 struct drm_i915_gem_object *reg_bo;
1378 struct overlay_registers __iomem *regs;
1381 if (!HAS_OVERLAY(dev))
1384 overlay = kzalloc(sizeof(*overlay), GFP_KERNEL);
1388 mutex_lock(&dev->struct_mutex);
1389 if (WARN_ON(dev_priv->overlay))
1395 if (!OVERLAY_NEEDS_PHYSICAL(dev))
1396 reg_bo = i915_gem_object_create_stolen(dev, PAGE_SIZE);
1398 reg_bo = i915_gem_alloc_object(dev, PAGE_SIZE);
1401 overlay->reg_bo = reg_bo;
1403 if (OVERLAY_NEEDS_PHYSICAL(dev)) {
1404 ret = i915_gem_object_attach_phys(reg_bo, PAGE_SIZE);
1406 DRM_ERROR("failed to attach phys overlay regs\n");
1409 overlay->flip_addr = reg_bo->phys_handle->busaddr;
1411 ret = i915_gem_obj_ggtt_pin(reg_bo, PAGE_SIZE, PIN_MAPPABLE);
1413 DRM_ERROR("failed to pin overlay register bo\n");
1416 overlay->flip_addr = i915_gem_obj_ggtt_offset(reg_bo);
1418 ret = i915_gem_object_set_to_gtt_domain(reg_bo, true);
1420 DRM_ERROR("failed to move overlay register bo into the GTT\n");
1425 /* init all values */
1426 overlay->color_key = 0x0101fe;
1427 overlay->color_key_enabled = true;
1428 overlay->brightness = -19;
1429 overlay->contrast = 75;
1430 overlay->saturation = 146;
1432 regs = intel_overlay_map_regs(overlay);
1436 memset_io(regs, 0, sizeof(struct overlay_registers));
1437 update_polyphase_filter(regs);
1438 update_reg_attrs(overlay, regs);
1440 intel_overlay_unmap_regs(overlay, regs);
1442 dev_priv->overlay = overlay;
1443 mutex_unlock(&dev->struct_mutex);
1444 DRM_INFO("initialized overlay support\n");
1448 if (!OVERLAY_NEEDS_PHYSICAL(dev))
1449 i915_gem_object_ggtt_unpin(reg_bo);
1451 drm_gem_object_unreference(®_bo->base);
1453 mutex_unlock(&dev->struct_mutex);
1458 void intel_cleanup_overlay(struct drm_device *dev)
1460 struct drm_i915_private *dev_priv = dev->dev_private;
1462 if (!dev_priv->overlay)
1465 /* The bo's should be free'd by the generic code already.
1466 * Furthermore modesetting teardown happens beforehand so the
1467 * hardware should be off already */
1468 WARN_ON(dev_priv->overlay->active);
1470 drm_gem_object_unreference_unlocked(&dev_priv->overlay->reg_bo->base);
1471 kfree(dev_priv->overlay);
1474 struct intel_overlay_error_state {
1475 struct overlay_registers regs;
1481 static struct overlay_registers __iomem *
1482 intel_overlay_map_regs_atomic(struct intel_overlay *overlay)
1484 struct drm_i915_private *dev_priv = overlay->dev->dev_private;
1485 struct overlay_registers __iomem *regs;
1487 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1488 /* Cast to make sparse happy, but it's wc memory anyway, so
1489 * equivalent to the wc io mapping on X86. */
1490 regs = (struct overlay_registers __iomem *)
1491 overlay->reg_bo->phys_handle->vaddr;
1493 regs = io_mapping_map_atomic_wc(dev_priv->gtt.mappable,
1494 i915_gem_obj_ggtt_offset(overlay->reg_bo));
1499 static void intel_overlay_unmap_regs_atomic(struct intel_overlay *overlay,
1500 struct overlay_registers __iomem *regs)
1502 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1503 io_mapping_unmap_atomic(regs);
1507 struct intel_overlay_error_state *
1508 intel_overlay_capture_error_state(struct drm_device *dev)
1510 struct drm_i915_private *dev_priv = dev->dev_private;
1511 struct intel_overlay *overlay = dev_priv->overlay;
1512 struct intel_overlay_error_state *error;
1513 struct overlay_registers __iomem *regs;
1515 if (!overlay || !overlay->active)
1518 error = kmalloc(sizeof(*error), GFP_ATOMIC);
1522 error->dovsta = I915_READ(DOVSTA);
1523 error->isr = I915_READ(ISR);
1524 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1525 error->base = (__force long)overlay->reg_bo->phys_handle->vaddr;
1527 error->base = i915_gem_obj_ggtt_offset(overlay->reg_bo);
1529 regs = intel_overlay_map_regs_atomic(overlay);
1533 memcpy_fromio(&error->regs, regs, sizeof(struct overlay_registers));
1534 intel_overlay_unmap_regs_atomic(overlay, regs);
1544 intel_overlay_print_error_state(struct drm_i915_error_state_buf *m,
1545 struct intel_overlay_error_state *error)
1547 i915_error_printf(m, "Overlay, status: 0x%08x, interrupt: 0x%08x\n",
1548 error->dovsta, error->isr);
1549 i915_error_printf(m, " Register file at 0x%08lx:\n",
1552 #define P(x) i915_error_printf(m, " " #x ": 0x%08x\n", error->regs.x)