4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Daniel Vetter <daniel@ffwll.ch>
26 * Derived from Xorg ddx, xf86-video-intel, src/i830_video.c
29 #include <linux/seq_file.h>
35 #include "intel_drv.h"
37 /* Limits for overlay size. According to intel doc, the real limits are:
38 * Y width: 4095, UV width (planar): 2047, Y height: 2047,
39 * UV width (planar): * 1023. But the xorg thinks 2048 for height and width. Use
40 * the mininum of both. */
41 #define IMAGE_MAX_WIDTH 2048
42 #define IMAGE_MAX_HEIGHT 2046 /* 2 * 1023 */
43 /* on 830 and 845 these large limits result in the card hanging */
44 #define IMAGE_MAX_WIDTH_LEGACY 1024
45 #define IMAGE_MAX_HEIGHT_LEGACY 1088
47 /* overlay register definitions */
49 #define OCMD_TILED_SURFACE (0x1<<19)
50 #define OCMD_MIRROR_MASK (0x3<<17)
51 #define OCMD_MIRROR_MODE (0x3<<17)
52 #define OCMD_MIRROR_HORIZONTAL (0x1<<17)
53 #define OCMD_MIRROR_VERTICAL (0x2<<17)
54 #define OCMD_MIRROR_BOTH (0x3<<17)
55 #define OCMD_BYTEORDER_MASK (0x3<<14) /* zero for YUYV or FOURCC YUY2 */
56 #define OCMD_UV_SWAP (0x1<<14) /* YVYU */
57 #define OCMD_Y_SWAP (0x2<<14) /* UYVY or FOURCC UYVY */
58 #define OCMD_Y_AND_UV_SWAP (0x3<<14) /* VYUY */
59 #define OCMD_SOURCE_FORMAT_MASK (0xf<<10)
60 #define OCMD_RGB_888 (0x1<<10) /* not in i965 Intel docs */
61 #define OCMD_RGB_555 (0x2<<10) /* not in i965 Intel docs */
62 #define OCMD_RGB_565 (0x3<<10) /* not in i965 Intel docs */
63 #define OCMD_YUV_422_PACKED (0x8<<10)
64 #define OCMD_YUV_411_PACKED (0x9<<10) /* not in i965 Intel docs */
65 #define OCMD_YUV_420_PLANAR (0xc<<10)
66 #define OCMD_YUV_422_PLANAR (0xd<<10)
67 #define OCMD_YUV_410_PLANAR (0xe<<10) /* also 411 */
68 #define OCMD_TVSYNCFLIP_PARITY (0x1<<9)
69 #define OCMD_TVSYNCFLIP_ENABLE (0x1<<7)
70 #define OCMD_BUF_TYPE_MASK (0x1<<5)
71 #define OCMD_BUF_TYPE_FRAME (0x0<<5)
72 #define OCMD_BUF_TYPE_FIELD (0x1<<5)
73 #define OCMD_TEST_MODE (0x1<<4)
74 #define OCMD_BUFFER_SELECT (0x3<<2)
75 #define OCMD_BUFFER0 (0x0<<2)
76 #define OCMD_BUFFER1 (0x1<<2)
77 #define OCMD_FIELD_SELECT (0x1<<2)
78 #define OCMD_FIELD0 (0x0<<1)
79 #define OCMD_FIELD1 (0x1<<1)
80 #define OCMD_ENABLE (0x1<<0)
82 /* OCONFIG register */
83 #define OCONF_PIPE_MASK (0x1<<18)
84 #define OCONF_PIPE_A (0x0<<18)
85 #define OCONF_PIPE_B (0x1<<18)
86 #define OCONF_GAMMA2_ENABLE (0x1<<16)
87 #define OCONF_CSC_MODE_BT601 (0x0<<5)
88 #define OCONF_CSC_MODE_BT709 (0x1<<5)
89 #define OCONF_CSC_BYPASS (0x1<<4)
90 #define OCONF_CC_OUT_8BIT (0x1<<3)
91 #define OCONF_TEST_MODE (0x1<<2)
92 #define OCONF_THREE_LINE_BUFFER (0x1<<0)
93 #define OCONF_TWO_LINE_BUFFER (0x0<<0)
95 /* DCLRKM (dst-key) register */
96 #define DST_KEY_ENABLE (0x1<<31)
97 #define CLK_RGB24_MASK 0x0
98 #define CLK_RGB16_MASK 0x070307
99 #define CLK_RGB15_MASK 0x070707
100 #define CLK_RGB8I_MASK 0xffffff
102 #define RGB16_TO_COLORKEY(c) \
103 (((c & 0xF800) << 8) | ((c & 0x07E0) << 5) | ((c & 0x001F) << 3))
104 #define RGB15_TO_COLORKEY(c) \
105 (((c & 0x7c00) << 9) | ((c & 0x03E0) << 6) | ((c & 0x001F) << 3))
107 /* overlay flip addr flag */
108 #define OFC_UPDATE 0x1
110 /* polyphase filter coefficients */
111 #define N_HORIZ_Y_TAPS 5
112 #define N_VERT_Y_TAPS 3
113 #define N_HORIZ_UV_TAPS 3
114 #define N_VERT_UV_TAPS 3
118 /* memory bufferd overlay registers */
119 struct overlay_registers {
147 u32 RESERVED1; /* 0x6C */
160 u32 FASTHSCALE; /* 0xA0 */
161 u32 UVSCALEV; /* 0xA4 */
162 u32 RESERVEDC[(0x200 - 0xA8) / 4]; /* 0xA8 - 0x1FC */
163 u16 Y_VCOEFS[N_VERT_Y_TAPS * N_PHASES]; /* 0x200 */
164 u16 RESERVEDD[0x100 / 2 - N_VERT_Y_TAPS * N_PHASES];
165 u16 Y_HCOEFS[N_HORIZ_Y_TAPS * N_PHASES]; /* 0x300 */
166 u16 RESERVEDE[0x200 / 2 - N_HORIZ_Y_TAPS * N_PHASES];
167 u16 UV_VCOEFS[N_VERT_UV_TAPS * N_PHASES]; /* 0x500 */
168 u16 RESERVEDF[0x100 / 2 - N_VERT_UV_TAPS * N_PHASES];
169 u16 UV_HCOEFS[N_HORIZ_UV_TAPS * N_PHASES]; /* 0x600 */
170 u16 RESERVEDG[0x100 / 2 - N_HORIZ_UV_TAPS * N_PHASES];
173 struct intel_overlay {
174 struct drm_device *dev;
175 struct intel_crtc *crtc;
176 struct drm_i915_gem_object *vid_bo;
177 struct drm_i915_gem_object *old_vid_bo;
180 u32 pfit_vscale_ratio; /* shifted-point number, (1<<12) == 1.0 */
182 u32 brightness, contrast, saturation;
183 u32 old_xscale, old_yscale;
184 /* register access */
186 struct drm_i915_gem_object *reg_bo;
188 uint32_t last_flip_req;
191 #define NEEDS_WAIT_FOR_FLIP 2
192 #define RELEASE_OLD_VID 3
196 static struct overlay_registers *
197 intel_overlay_map_regs_atomic(struct intel_overlay *overlay,
200 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
201 struct overlay_registers *regs;
203 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
204 regs = overlay->reg_bo->phys_obj->handle->vaddr;
206 regs = io_mapping_map_atomic_wc(dev_priv->mm.gtt_mapping,
207 overlay->reg_bo->gtt_offset,
213 static void intel_overlay_unmap_regs_atomic(struct intel_overlay *overlay,
215 struct overlay_registers *regs)
217 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
218 io_mapping_unmap_atomic(regs, slot);
221 static struct overlay_registers *
222 intel_overlay_map_regs(struct intel_overlay *overlay)
224 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
225 struct overlay_registers *regs;
227 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
228 regs = overlay->reg_bo->phys_obj->handle->vaddr;
230 regs = io_mapping_map_wc(dev_priv->mm.gtt_mapping,
231 overlay->reg_bo->gtt_offset);
236 static void intel_overlay_unmap_regs(struct intel_overlay *overlay,
237 struct overlay_registers *regs)
239 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
240 io_mapping_unmap(regs);
243 static int intel_overlay_do_wait_request(struct intel_overlay *overlay,
244 struct drm_i915_gem_request *request,
248 struct drm_device *dev = overlay->dev;
249 drm_i915_private_t *dev_priv = dev->dev_private;
252 overlay->last_flip_req =
253 i915_add_request(dev, NULL, request, &dev_priv->render_ring);
254 if (overlay->last_flip_req == 0)
257 overlay->hw_wedged = stage;
258 ret = i915_do_wait_request(dev,
259 overlay->last_flip_req, true,
260 &dev_priv->render_ring);
264 overlay->hw_wedged = 0;
265 overlay->last_flip_req = 0;
269 /* Workaround for i830 bug where pipe a must be enable to change control regs */
271 i830_activate_pipe_a(struct drm_device *dev)
273 drm_i915_private_t *dev_priv = dev->dev_private;
274 struct intel_crtc *crtc;
275 struct drm_crtc_helper_funcs *crtc_funcs;
276 struct drm_display_mode vesa_640x480 = {
277 DRM_MODE("640x480", DRM_MODE_TYPE_DRIVER, 25175, 640, 656,
278 752, 800, 0, 480, 489, 492, 525, 0,
279 DRM_MODE_FLAG_NHSYNC | DRM_MODE_FLAG_NVSYNC)
282 crtc = to_intel_crtc(dev_priv->pipe_to_crtc_mapping[0]);
283 if (crtc->dpms_mode == DRM_MODE_DPMS_ON)
286 /* most i8xx have pipe a forced on, so don't trust dpms mode */
287 if (I915_READ(PIPEACONF) & PIPEACONF_ENABLE)
290 crtc_funcs = crtc->base.helper_private;
291 if (crtc_funcs->dpms == NULL)
294 DRM_DEBUG_DRIVER("Enabling pipe A in order to enable overlay\n");
296 mode = drm_mode_duplicate(dev, &vesa_640x480);
297 drm_mode_set_crtcinfo(mode, CRTC_INTERLACE_HALVE_V);
298 if(!drm_crtc_helper_set_mode(&crtc->base, mode,
299 crtc->base.x, crtc->base.y,
303 crtc_funcs->dpms(&crtc->base, DRM_MODE_DPMS_ON);
308 i830_deactivate_pipe_a(struct drm_device *dev)
310 drm_i915_private_t *dev_priv = dev->dev_private;
311 struct drm_crtc *crtc = dev_priv->pipe_to_crtc_mapping[0];
312 struct drm_crtc_helper_funcs *crtc_funcs = crtc->helper_private;
314 crtc_funcs->dpms(crtc, DRM_MODE_DPMS_OFF);
317 /* overlay needs to be disable in OCMD reg */
318 static int intel_overlay_on(struct intel_overlay *overlay)
320 struct drm_device *dev = overlay->dev;
321 struct drm_i915_gem_request *request;
322 int pipe_a_quirk = 0;
325 BUG_ON(overlay->active);
329 pipe_a_quirk = i830_activate_pipe_a(dev);
330 if (pipe_a_quirk < 0)
334 request = kzalloc(sizeof(*request), GFP_KERNEL);
335 if (request == NULL) {
341 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_ON);
342 OUT_RING(overlay->flip_addr | OFC_UPDATE);
343 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
347 ret = intel_overlay_do_wait_request(overlay, request, true,
348 NEEDS_WAIT_FOR_FLIP);
351 i830_deactivate_pipe_a(dev);
356 /* overlay needs to be enabled in OCMD reg */
357 static int intel_overlay_continue(struct intel_overlay *overlay,
358 bool load_polyphase_filter)
360 struct drm_device *dev = overlay->dev;
361 drm_i915_private_t *dev_priv = dev->dev_private;
362 struct drm_i915_gem_request *request;
363 u32 flip_addr = overlay->flip_addr;
366 BUG_ON(!overlay->active);
368 request = kzalloc(sizeof(*request), GFP_KERNEL);
372 if (load_polyphase_filter)
373 flip_addr |= OFC_UPDATE;
375 /* check for underruns */
376 tmp = I915_READ(DOVSTA);
378 DRM_DEBUG("overlay underrun, DOVSTA: %x\n", tmp);
381 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
385 overlay->last_flip_req =
386 i915_add_request(dev, NULL, request, &dev_priv->render_ring);
390 /* overlay needs to be disabled in OCMD reg */
391 static int intel_overlay_off(struct intel_overlay *overlay,
394 struct drm_device *dev = overlay->dev;
395 u32 flip_addr = overlay->flip_addr;
396 struct drm_i915_gem_request *request;
398 BUG_ON(!overlay->active);
400 request = kzalloc(sizeof(*request), GFP_KERNEL);
404 /* According to intel docs the overlay hw may hang (when switching
405 * off) without loading the filter coeffs. It is however unclear whether
406 * this applies to the disabling of the overlay or to the switching off
407 * of the hw. Do it in both cases */
408 flip_addr |= OFC_UPDATE;
411 /* wait for overlay to go idle */
412 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
414 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
415 /* turn overlay off */
416 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_OFF);
418 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
421 return intel_overlay_do_wait_request(overlay, request, interruptible,
425 static void intel_overlay_release_old_vid_tail(struct intel_overlay *overlay)
427 struct drm_gem_object *obj = &overlay->old_vid_bo->base;
429 i915_gem_object_unpin(obj);
430 drm_gem_object_unreference(obj);
432 overlay->old_vid_bo = NULL;
435 static void intel_overlay_off_tail(struct intel_overlay *overlay)
437 struct drm_gem_object *obj;
439 /* never have the overlay hw on without showing a frame */
440 BUG_ON(!overlay->vid_bo);
441 obj = &overlay->vid_bo->base;
443 i915_gem_object_unpin(obj);
444 drm_gem_object_unreference(obj);
445 overlay->vid_bo = NULL;
447 overlay->crtc->overlay = NULL;
448 overlay->crtc = NULL;
452 /* recover from an interruption due to a signal
453 * We have to be careful not to repeat work forever an make forward progess. */
454 static int intel_overlay_recover_from_interrupt(struct intel_overlay *overlay,
457 struct drm_device *dev = overlay->dev;
458 drm_i915_private_t *dev_priv = dev->dev_private;
461 if (overlay->hw_wedged == HW_WEDGED)
464 ret = i915_do_wait_request(dev, overlay->last_flip_req,
465 interruptible, &dev_priv->render_ring);
469 switch (overlay->hw_wedged) {
470 case RELEASE_OLD_VID:
471 intel_overlay_release_old_vid_tail(overlay);
475 intel_overlay_off_tail(overlay);
479 BUG_ON(overlay->hw_wedged != NEEDS_WAIT_FOR_FLIP);
482 overlay->hw_wedged = 0;
483 overlay->last_flip_req = 0;
487 /* Wait for pending overlay flip and release old frame.
488 * Needs to be called before the overlay register are changed
489 * via intel_overlay_(un)map_regs
491 static int intel_overlay_release_old_vid(struct intel_overlay *overlay)
493 struct drm_device *dev = overlay->dev;
494 drm_i915_private_t *dev_priv = dev->dev_private;
497 /* Only wait if there is actually an old frame to release to
498 * guarantee forward progress.
500 if (!overlay->old_vid_bo)
503 if (I915_READ(ISR) & I915_OVERLAY_PLANE_FLIP_PENDING_INTERRUPT) {
504 struct drm_i915_gem_request *request;
506 /* synchronous slowpath */
507 request = kzalloc(sizeof(*request), GFP_KERNEL);
512 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
516 ret = intel_overlay_do_wait_request(overlay, request, true,
522 intel_overlay_release_old_vid_tail(overlay);
526 struct put_image_params {
543 static int packed_depth_bytes(u32 format)
545 switch (format & I915_OVERLAY_DEPTH_MASK) {
546 case I915_OVERLAY_YUV422:
548 case I915_OVERLAY_YUV411:
549 /* return 6; not implemented */
555 static int packed_width_bytes(u32 format, short width)
557 switch (format & I915_OVERLAY_DEPTH_MASK) {
558 case I915_OVERLAY_YUV422:
565 static int uv_hsubsampling(u32 format)
567 switch (format & I915_OVERLAY_DEPTH_MASK) {
568 case I915_OVERLAY_YUV422:
569 case I915_OVERLAY_YUV420:
571 case I915_OVERLAY_YUV411:
572 case I915_OVERLAY_YUV410:
579 static int uv_vsubsampling(u32 format)
581 switch (format & I915_OVERLAY_DEPTH_MASK) {
582 case I915_OVERLAY_YUV420:
583 case I915_OVERLAY_YUV410:
585 case I915_OVERLAY_YUV422:
586 case I915_OVERLAY_YUV411:
593 static u32 calc_swidthsw(struct drm_device *dev, u32 offset, u32 width)
595 u32 mask, shift, ret;
603 ret = ((offset + width + mask) >> shift) - (offset >> shift);
610 static const u16 y_static_hcoeffs[N_HORIZ_Y_TAPS * N_PHASES] = {
611 0x3000, 0xb4a0, 0x1930, 0x1920, 0xb4a0,
612 0x3000, 0xb500, 0x19d0, 0x1880, 0xb440,
613 0x3000, 0xb540, 0x1a88, 0x2f80, 0xb3e0,
614 0x3000, 0xb580, 0x1b30, 0x2e20, 0xb380,
615 0x3000, 0xb5c0, 0x1bd8, 0x2cc0, 0xb320,
616 0x3020, 0xb5e0, 0x1c60, 0x2b80, 0xb2c0,
617 0x3020, 0xb5e0, 0x1cf8, 0x2a20, 0xb260,
618 0x3020, 0xb5e0, 0x1d80, 0x28e0, 0xb200,
619 0x3020, 0xb5c0, 0x1e08, 0x3f40, 0xb1c0,
620 0x3020, 0xb580, 0x1e78, 0x3ce0, 0xb160,
621 0x3040, 0xb520, 0x1ed8, 0x3aa0, 0xb120,
622 0x3040, 0xb4a0, 0x1f30, 0x3880, 0xb0e0,
623 0x3040, 0xb400, 0x1f78, 0x3680, 0xb0a0,
624 0x3020, 0xb340, 0x1fb8, 0x34a0, 0xb060,
625 0x3020, 0xb240, 0x1fe0, 0x32e0, 0xb040,
626 0x3020, 0xb140, 0x1ff8, 0x3160, 0xb020,
627 0xb000, 0x3000, 0x0800, 0x3000, 0xb000
630 static const u16 uv_static_hcoeffs[N_HORIZ_UV_TAPS * N_PHASES] = {
631 0x3000, 0x1800, 0x1800, 0xb000, 0x18d0, 0x2e60,
632 0xb000, 0x1990, 0x2ce0, 0xb020, 0x1a68, 0x2b40,
633 0xb040, 0x1b20, 0x29e0, 0xb060, 0x1bd8, 0x2880,
634 0xb080, 0x1c88, 0x3e60, 0xb0a0, 0x1d28, 0x3c00,
635 0xb0c0, 0x1db8, 0x39e0, 0xb0e0, 0x1e40, 0x37e0,
636 0xb100, 0x1eb8, 0x3620, 0xb100, 0x1f18, 0x34a0,
637 0xb100, 0x1f68, 0x3360, 0xb0e0, 0x1fa8, 0x3240,
638 0xb0c0, 0x1fe0, 0x3140, 0xb060, 0x1ff0, 0x30a0,
639 0x3000, 0x0800, 0x3000
642 static void update_polyphase_filter(struct overlay_registers *regs)
644 memcpy(regs->Y_HCOEFS, y_static_hcoeffs, sizeof(y_static_hcoeffs));
645 memcpy(regs->UV_HCOEFS, uv_static_hcoeffs, sizeof(uv_static_hcoeffs));
648 static bool update_scaling_factors(struct intel_overlay *overlay,
649 struct overlay_registers *regs,
650 struct put_image_params *params)
652 /* fixed point with a 12 bit shift */
653 u32 xscale, yscale, xscale_UV, yscale_UV;
655 #define FRACT_MASK 0xfff
656 bool scale_changed = false;
657 int uv_hscale = uv_hsubsampling(params->format);
658 int uv_vscale = uv_vsubsampling(params->format);
660 if (params->dst_w > 1)
661 xscale = ((params->src_scan_w - 1) << FP_SHIFT)
664 xscale = 1 << FP_SHIFT;
666 if (params->dst_h > 1)
667 yscale = ((params->src_scan_h - 1) << FP_SHIFT)
670 yscale = 1 << FP_SHIFT;
672 /*if (params->format & I915_OVERLAY_YUV_PLANAR) {*/
673 xscale_UV = xscale/uv_hscale;
674 yscale_UV = yscale/uv_vscale;
675 /* make the Y scale to UV scale ratio an exact multiply */
676 xscale = xscale_UV * uv_hscale;
677 yscale = yscale_UV * uv_vscale;
683 if (xscale != overlay->old_xscale || yscale != overlay->old_yscale)
684 scale_changed = true;
685 overlay->old_xscale = xscale;
686 overlay->old_yscale = yscale;
688 regs->YRGBSCALE = (((yscale & FRACT_MASK) << 20) |
689 ((xscale >> FP_SHIFT) << 16) |
690 ((xscale & FRACT_MASK) << 3));
692 regs->UVSCALE = (((yscale_UV & FRACT_MASK) << 20) |
693 ((xscale_UV >> FP_SHIFT) << 16) |
694 ((xscale_UV & FRACT_MASK) << 3));
696 regs->UVSCALEV = ((((yscale >> FP_SHIFT) << 16) |
697 ((yscale_UV >> FP_SHIFT) << 0)));
700 update_polyphase_filter(regs);
702 return scale_changed;
705 static void update_colorkey(struct intel_overlay *overlay,
706 struct overlay_registers *regs)
708 u32 key = overlay->color_key;
710 switch (overlay->crtc->base.fb->bits_per_pixel) {
713 regs->DCLRKM = CLK_RGB8I_MASK | DST_KEY_ENABLE;
717 if (overlay->crtc->base.fb->depth == 15) {
718 regs->DCLRKV = RGB15_TO_COLORKEY(key);
719 regs->DCLRKM = CLK_RGB15_MASK | DST_KEY_ENABLE;
721 regs->DCLRKV = RGB16_TO_COLORKEY(key);
722 regs->DCLRKM = CLK_RGB16_MASK | DST_KEY_ENABLE;
729 regs->DCLRKM = CLK_RGB24_MASK | DST_KEY_ENABLE;
734 static u32 overlay_cmd_reg(struct put_image_params *params)
736 u32 cmd = OCMD_ENABLE | OCMD_BUF_TYPE_FRAME | OCMD_BUFFER0;
738 if (params->format & I915_OVERLAY_YUV_PLANAR) {
739 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
740 case I915_OVERLAY_YUV422:
741 cmd |= OCMD_YUV_422_PLANAR;
743 case I915_OVERLAY_YUV420:
744 cmd |= OCMD_YUV_420_PLANAR;
746 case I915_OVERLAY_YUV411:
747 case I915_OVERLAY_YUV410:
748 cmd |= OCMD_YUV_410_PLANAR;
751 } else { /* YUV packed */
752 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
753 case I915_OVERLAY_YUV422:
754 cmd |= OCMD_YUV_422_PACKED;
756 case I915_OVERLAY_YUV411:
757 cmd |= OCMD_YUV_411_PACKED;
761 switch (params->format & I915_OVERLAY_SWAP_MASK) {
762 case I915_OVERLAY_NO_SWAP:
764 case I915_OVERLAY_UV_SWAP:
767 case I915_OVERLAY_Y_SWAP:
770 case I915_OVERLAY_Y_AND_UV_SWAP:
771 cmd |= OCMD_Y_AND_UV_SWAP;
779 static int intel_overlay_do_put_image(struct intel_overlay *overlay,
780 struct drm_gem_object *new_bo,
781 struct put_image_params *params)
784 struct overlay_registers *regs;
785 bool scale_changed = false;
786 struct drm_i915_gem_object *bo_priv = to_intel_bo(new_bo);
787 struct drm_device *dev = overlay->dev;
789 BUG_ON(!mutex_is_locked(&dev->struct_mutex));
790 BUG_ON(!mutex_is_locked(&dev->mode_config.mutex));
793 ret = intel_overlay_release_old_vid(overlay);
797 ret = i915_gem_object_pin(new_bo, PAGE_SIZE);
801 ret = i915_gem_object_set_to_gtt_domain(new_bo, 0);
805 if (!overlay->active) {
806 regs = intel_overlay_map_regs(overlay);
811 regs->OCONFIG = OCONF_CC_OUT_8BIT;
812 if (IS_I965GM(overlay->dev))
813 regs->OCONFIG |= OCONF_CSC_MODE_BT709;
814 regs->OCONFIG |= overlay->crtc->pipe == 0 ?
815 OCONF_PIPE_A : OCONF_PIPE_B;
816 intel_overlay_unmap_regs(overlay, regs);
818 ret = intel_overlay_on(overlay);
823 regs = intel_overlay_map_regs(overlay);
829 regs->DWINPOS = (params->dst_y << 16) | params->dst_x;
830 regs->DWINSZ = (params->dst_h << 16) | params->dst_w;
832 if (params->format & I915_OVERLAY_YUV_PACKED)
833 tmp_width = packed_width_bytes(params->format, params->src_w);
835 tmp_width = params->src_w;
837 regs->SWIDTH = params->src_w;
838 regs->SWIDTHSW = calc_swidthsw(overlay->dev,
839 params->offset_Y, tmp_width);
840 regs->SHEIGHT = params->src_h;
841 regs->OBUF_0Y = bo_priv->gtt_offset + params-> offset_Y;
842 regs->OSTRIDE = params->stride_Y;
844 if (params->format & I915_OVERLAY_YUV_PLANAR) {
845 int uv_hscale = uv_hsubsampling(params->format);
846 int uv_vscale = uv_vsubsampling(params->format);
848 regs->SWIDTH |= (params->src_w/uv_hscale) << 16;
849 tmp_U = calc_swidthsw(overlay->dev, params->offset_U,
850 params->src_w/uv_hscale);
851 tmp_V = calc_swidthsw(overlay->dev, params->offset_V,
852 params->src_w/uv_hscale);
853 regs->SWIDTHSW |= max_t(u32, tmp_U, tmp_V) << 16;
854 regs->SHEIGHT |= (params->src_h/uv_vscale) << 16;
855 regs->OBUF_0U = bo_priv->gtt_offset + params->offset_U;
856 regs->OBUF_0V = bo_priv->gtt_offset + params->offset_V;
857 regs->OSTRIDE |= params->stride_UV << 16;
860 scale_changed = update_scaling_factors(overlay, regs, params);
862 update_colorkey(overlay, regs);
864 regs->OCMD = overlay_cmd_reg(params);
866 intel_overlay_unmap_regs(overlay, regs);
868 ret = intel_overlay_continue(overlay, scale_changed);
872 overlay->old_vid_bo = overlay->vid_bo;
873 overlay->vid_bo = to_intel_bo(new_bo);
878 i915_gem_object_unpin(new_bo);
882 int intel_overlay_switch_off(struct intel_overlay *overlay,
885 struct overlay_registers *regs;
886 struct drm_device *dev = overlay->dev;
889 BUG_ON(!mutex_is_locked(&dev->struct_mutex));
890 BUG_ON(!mutex_is_locked(&dev->mode_config.mutex));
892 if (overlay->hw_wedged) {
893 ret = intel_overlay_recover_from_interrupt(overlay,
899 if (!overlay->active)
902 ret = intel_overlay_release_old_vid(overlay);
906 regs = intel_overlay_map_regs(overlay);
908 intel_overlay_unmap_regs(overlay, regs);
910 ret = intel_overlay_off(overlay, interruptible);
914 intel_overlay_off_tail(overlay);
919 static int check_overlay_possible_on_crtc(struct intel_overlay *overlay,
920 struct intel_crtc *crtc)
922 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
924 int pipeconf_reg = (crtc->pipe == 0) ? PIPEACONF : PIPEBCONF;
926 if (!crtc->base.enabled || crtc->dpms_mode != DRM_MODE_DPMS_ON)
929 pipeconf = I915_READ(pipeconf_reg);
931 /* can't use the overlay with double wide pipe */
932 if (!IS_I965G(overlay->dev) && pipeconf & PIPEACONF_DOUBLE_WIDE)
938 static void update_pfit_vscale_ratio(struct intel_overlay *overlay)
940 struct drm_device *dev = overlay->dev;
941 drm_i915_private_t *dev_priv = dev->dev_private;
942 u32 pfit_control = I915_READ(PFIT_CONTROL);
945 /* XXX: This is not the same logic as in the xorg driver, but more in
946 * line with the intel documentation for the i965
948 if (!IS_I965G(dev)) {
949 if (pfit_control & VERT_AUTO_SCALE)
950 ratio = I915_READ(PFIT_AUTO_RATIOS);
952 ratio = I915_READ(PFIT_PGM_RATIOS);
953 ratio >>= PFIT_VERT_SCALE_SHIFT;
954 } else { /* on i965 use the PGM reg to read out the autoscaler values */
955 ratio = I915_READ(PFIT_PGM_RATIOS) >> PFIT_VERT_SCALE_SHIFT_965;
958 overlay->pfit_vscale_ratio = ratio;
961 static int check_overlay_dst(struct intel_overlay *overlay,
962 struct drm_intel_overlay_put_image *rec)
964 struct drm_display_mode *mode = &overlay->crtc->base.mode;
966 if (rec->dst_x < mode->crtc_hdisplay &&
967 rec->dst_x + rec->dst_width <= mode->crtc_hdisplay &&
968 rec->dst_y < mode->crtc_vdisplay &&
969 rec->dst_y + rec->dst_height <= mode->crtc_vdisplay)
975 static int check_overlay_scaling(struct put_image_params *rec)
979 /* downscaling limit is 8.0 */
980 tmp = ((rec->src_scan_h << 16) / rec->dst_h) >> 16;
983 tmp = ((rec->src_scan_w << 16) / rec->dst_w) >> 16;
990 static int check_overlay_src(struct drm_device *dev,
991 struct drm_intel_overlay_put_image *rec,
992 struct drm_gem_object *new_bo)
994 int uv_hscale = uv_hsubsampling(rec->flags);
995 int uv_vscale = uv_vsubsampling(rec->flags);
996 u32 stride_mask, depth, tmp;
998 /* check src dimensions */
999 if (IS_845G(dev) || IS_I830(dev)) {
1000 if (rec->src_height > IMAGE_MAX_HEIGHT_LEGACY ||
1001 rec->src_width > IMAGE_MAX_WIDTH_LEGACY)
1004 if (rec->src_height > IMAGE_MAX_HEIGHT ||
1005 rec->src_width > IMAGE_MAX_WIDTH)
1009 /* better safe than sorry, use 4 as the maximal subsampling ratio */
1010 if (rec->src_height < N_VERT_Y_TAPS*4 ||
1011 rec->src_width < N_HORIZ_Y_TAPS*4)
1014 /* check alignment constraints */
1015 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
1016 case I915_OVERLAY_RGB:
1017 /* not implemented */
1020 case I915_OVERLAY_YUV_PACKED:
1024 depth = packed_depth_bytes(rec->flags);
1028 /* ignore UV planes */
1032 /* check pixel alignment */
1033 if (rec->offset_Y % depth)
1037 case I915_OVERLAY_YUV_PLANAR:
1038 if (uv_vscale < 0 || uv_hscale < 0)
1040 /* no offset restrictions for planar formats */
1047 if (rec->src_width % uv_hscale)
1050 /* stride checking */
1051 if (IS_I830(dev) || IS_845G(dev))
1056 if (rec->stride_Y & stride_mask || rec->stride_UV & stride_mask)
1058 if (IS_I965G(dev) && rec->stride_Y < 512)
1061 tmp = (rec->flags & I915_OVERLAY_TYPE_MASK) == I915_OVERLAY_YUV_PLANAR ?
1063 if (rec->stride_Y > tmp || rec->stride_UV > 2*1024)
1066 /* check buffer dimensions */
1067 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
1068 case I915_OVERLAY_RGB:
1069 case I915_OVERLAY_YUV_PACKED:
1070 /* always 4 Y values per depth pixels */
1071 if (packed_width_bytes(rec->flags, rec->src_width) > rec->stride_Y)
1074 tmp = rec->stride_Y*rec->src_height;
1075 if (rec->offset_Y + tmp > new_bo->size)
1079 case I915_OVERLAY_YUV_PLANAR:
1080 if (rec->src_width > rec->stride_Y)
1082 if (rec->src_width/uv_hscale > rec->stride_UV)
1085 tmp = rec->stride_Y * rec->src_height;
1086 if (rec->offset_Y + tmp > new_bo->size)
1089 tmp = rec->stride_UV * (rec->src_height / uv_vscale);
1090 if (rec->offset_U + tmp > new_bo->size ||
1091 rec->offset_V + tmp > new_bo->size)
1099 int intel_overlay_put_image(struct drm_device *dev, void *data,
1100 struct drm_file *file_priv)
1102 struct drm_intel_overlay_put_image *put_image_rec = data;
1103 drm_i915_private_t *dev_priv = dev->dev_private;
1104 struct intel_overlay *overlay;
1105 struct drm_mode_object *drmmode_obj;
1106 struct intel_crtc *crtc;
1107 struct drm_gem_object *new_bo;
1108 struct put_image_params *params;
1112 DRM_ERROR("called with no initialization\n");
1116 overlay = dev_priv->overlay;
1118 DRM_DEBUG("userspace bug: no overlay\n");
1122 if (!(put_image_rec->flags & I915_OVERLAY_ENABLE)) {
1123 mutex_lock(&dev->mode_config.mutex);
1124 mutex_lock(&dev->struct_mutex);
1126 ret = intel_overlay_switch_off(overlay, true);
1128 mutex_unlock(&dev->struct_mutex);
1129 mutex_unlock(&dev->mode_config.mutex);
1134 params = kmalloc(sizeof(struct put_image_params), GFP_KERNEL);
1138 drmmode_obj = drm_mode_object_find(dev, put_image_rec->crtc_id,
1139 DRM_MODE_OBJECT_CRTC);
1144 crtc = to_intel_crtc(obj_to_crtc(drmmode_obj));
1146 new_bo = drm_gem_object_lookup(dev, file_priv,
1147 put_image_rec->bo_handle);
1153 mutex_lock(&dev->mode_config.mutex);
1154 mutex_lock(&dev->struct_mutex);
1156 if (overlay->hw_wedged) {
1157 ret = intel_overlay_recover_from_interrupt(overlay, 1);
1162 if (overlay->crtc != crtc) {
1163 struct drm_display_mode *mode = &crtc->base.mode;
1164 ret = intel_overlay_switch_off(overlay, true);
1168 ret = check_overlay_possible_on_crtc(overlay, crtc);
1172 overlay->crtc = crtc;
1173 crtc->overlay = overlay;
1175 if (intel_panel_fitter_pipe(dev) == crtc->pipe
1176 /* and line to wide, i.e. one-line-mode */
1177 && mode->hdisplay > 1024) {
1178 overlay->pfit_active = 1;
1179 update_pfit_vscale_ratio(overlay);
1181 overlay->pfit_active = 0;
1184 ret = check_overlay_dst(overlay, put_image_rec);
1188 if (overlay->pfit_active) {
1189 params->dst_y = ((((u32)put_image_rec->dst_y) << 12) /
1190 overlay->pfit_vscale_ratio);
1191 /* shifting right rounds downwards, so add 1 */
1192 params->dst_h = ((((u32)put_image_rec->dst_height) << 12) /
1193 overlay->pfit_vscale_ratio) + 1;
1195 params->dst_y = put_image_rec->dst_y;
1196 params->dst_h = put_image_rec->dst_height;
1198 params->dst_x = put_image_rec->dst_x;
1199 params->dst_w = put_image_rec->dst_width;
1201 params->src_w = put_image_rec->src_width;
1202 params->src_h = put_image_rec->src_height;
1203 params->src_scan_w = put_image_rec->src_scan_width;
1204 params->src_scan_h = put_image_rec->src_scan_height;
1205 if (params->src_scan_h > params->src_h ||
1206 params->src_scan_w > params->src_w) {
1211 ret = check_overlay_src(dev, put_image_rec, new_bo);
1214 params->format = put_image_rec->flags & ~I915_OVERLAY_FLAGS_MASK;
1215 params->stride_Y = put_image_rec->stride_Y;
1216 params->stride_UV = put_image_rec->stride_UV;
1217 params->offset_Y = put_image_rec->offset_Y;
1218 params->offset_U = put_image_rec->offset_U;
1219 params->offset_V = put_image_rec->offset_V;
1221 /* Check scaling after src size to prevent a divide-by-zero. */
1222 ret = check_overlay_scaling(params);
1226 ret = intel_overlay_do_put_image(overlay, new_bo, params);
1230 mutex_unlock(&dev->struct_mutex);
1231 mutex_unlock(&dev->mode_config.mutex);
1238 mutex_unlock(&dev->struct_mutex);
1239 mutex_unlock(&dev->mode_config.mutex);
1240 drm_gem_object_unreference_unlocked(new_bo);
1247 static void update_reg_attrs(struct intel_overlay *overlay,
1248 struct overlay_registers *regs)
1250 regs->OCLRC0 = (overlay->contrast << 18) | (overlay->brightness & 0xff);
1251 regs->OCLRC1 = overlay->saturation;
1254 static bool check_gamma_bounds(u32 gamma1, u32 gamma2)
1258 if (gamma1 & 0xff000000 || gamma2 & 0xff000000)
1261 for (i = 0; i < 3; i++) {
1262 if (((gamma1 >> i*8) & 0xff) >= ((gamma2 >> i*8) & 0xff))
1269 static bool check_gamma5_errata(u32 gamma5)
1273 for (i = 0; i < 3; i++) {
1274 if (((gamma5 >> i*8) & 0xff) == 0x80)
1281 static int check_gamma(struct drm_intel_overlay_attrs *attrs)
1283 if (!check_gamma_bounds(0, attrs->gamma0) ||
1284 !check_gamma_bounds(attrs->gamma0, attrs->gamma1) ||
1285 !check_gamma_bounds(attrs->gamma1, attrs->gamma2) ||
1286 !check_gamma_bounds(attrs->gamma2, attrs->gamma3) ||
1287 !check_gamma_bounds(attrs->gamma3, attrs->gamma4) ||
1288 !check_gamma_bounds(attrs->gamma4, attrs->gamma5) ||
1289 !check_gamma_bounds(attrs->gamma5, 0x00ffffff))
1292 if (!check_gamma5_errata(attrs->gamma5))
1298 int intel_overlay_attrs(struct drm_device *dev, void *data,
1299 struct drm_file *file_priv)
1301 struct drm_intel_overlay_attrs *attrs = data;
1302 drm_i915_private_t *dev_priv = dev->dev_private;
1303 struct intel_overlay *overlay;
1304 struct overlay_registers *regs;
1308 DRM_ERROR("called with no initialization\n");
1312 overlay = dev_priv->overlay;
1314 DRM_DEBUG("userspace bug: no overlay\n");
1318 mutex_lock(&dev->mode_config.mutex);
1319 mutex_lock(&dev->struct_mutex);
1322 if (!(attrs->flags & I915_OVERLAY_UPDATE_ATTRS)) {
1323 attrs->color_key = overlay->color_key;
1324 attrs->brightness = overlay->brightness;
1325 attrs->contrast = overlay->contrast;
1326 attrs->saturation = overlay->saturation;
1329 attrs->gamma0 = I915_READ(OGAMC0);
1330 attrs->gamma1 = I915_READ(OGAMC1);
1331 attrs->gamma2 = I915_READ(OGAMC2);
1332 attrs->gamma3 = I915_READ(OGAMC3);
1333 attrs->gamma4 = I915_READ(OGAMC4);
1334 attrs->gamma5 = I915_READ(OGAMC5);
1337 if (attrs->brightness < -128 || attrs->brightness > 127)
1339 if (attrs->contrast > 255)
1341 if (attrs->saturation > 1023)
1344 overlay->color_key = attrs->color_key;
1345 overlay->brightness = attrs->brightness;
1346 overlay->contrast = attrs->contrast;
1347 overlay->saturation = attrs->saturation;
1349 regs = intel_overlay_map_regs(overlay);
1355 update_reg_attrs(overlay, regs);
1357 intel_overlay_unmap_regs(overlay, regs);
1359 if (attrs->flags & I915_OVERLAY_UPDATE_GAMMA) {
1363 if (overlay->active) {
1368 ret = check_gamma(attrs);
1372 I915_WRITE(OGAMC0, attrs->gamma0);
1373 I915_WRITE(OGAMC1, attrs->gamma1);
1374 I915_WRITE(OGAMC2, attrs->gamma2);
1375 I915_WRITE(OGAMC3, attrs->gamma3);
1376 I915_WRITE(OGAMC4, attrs->gamma4);
1377 I915_WRITE(OGAMC5, attrs->gamma5);
1383 mutex_unlock(&dev->struct_mutex);
1384 mutex_unlock(&dev->mode_config.mutex);
1389 void intel_setup_overlay(struct drm_device *dev)
1391 drm_i915_private_t *dev_priv = dev->dev_private;
1392 struct intel_overlay *overlay;
1393 struct drm_gem_object *reg_bo;
1394 struct overlay_registers *regs;
1397 if (!HAS_OVERLAY(dev))
1400 overlay = kzalloc(sizeof(struct intel_overlay), GFP_KERNEL);
1405 reg_bo = i915_gem_alloc_object(dev, PAGE_SIZE);
1408 overlay->reg_bo = to_intel_bo(reg_bo);
1410 if (OVERLAY_NEEDS_PHYSICAL(dev)) {
1411 ret = i915_gem_attach_phys_object(dev, reg_bo,
1412 I915_GEM_PHYS_OVERLAY_REGS,
1415 DRM_ERROR("failed to attach phys overlay regs\n");
1418 overlay->flip_addr = overlay->reg_bo->phys_obj->handle->busaddr;
1420 ret = i915_gem_object_pin(reg_bo, PAGE_SIZE);
1422 DRM_ERROR("failed to pin overlay register bo\n");
1425 overlay->flip_addr = overlay->reg_bo->gtt_offset;
1427 ret = i915_gem_object_set_to_gtt_domain(reg_bo, true);
1429 DRM_ERROR("failed to move overlay register bo into the GTT\n");
1434 /* init all values */
1435 overlay->color_key = 0x0101fe;
1436 overlay->brightness = -19;
1437 overlay->contrast = 75;
1438 overlay->saturation = 146;
1440 regs = intel_overlay_map_regs(overlay);
1444 memset(regs, 0, sizeof(struct overlay_registers));
1445 update_polyphase_filter(regs);
1446 update_reg_attrs(overlay, regs);
1448 intel_overlay_unmap_regs(overlay, regs);
1450 dev_priv->overlay = overlay;
1451 DRM_INFO("initialized overlay support\n");
1455 i915_gem_object_unpin(reg_bo);
1457 drm_gem_object_unreference(reg_bo);
1463 void intel_cleanup_overlay(struct drm_device *dev)
1465 drm_i915_private_t *dev_priv = dev->dev_private;
1467 if (!dev_priv->overlay)
1470 /* The bo's should be free'd by the generic code already.
1471 * Furthermore modesetting teardown happens beforehand so the
1472 * hardware should be off already */
1473 BUG_ON(dev_priv->overlay->active);
1475 drm_gem_object_unreference_unlocked(&dev_priv->overlay->reg_bo->base);
1476 kfree(dev_priv->overlay);
1479 struct intel_overlay_error_state {
1480 struct overlay_registers regs;
1486 struct intel_overlay_error_state *
1487 intel_overlay_capture_error_state(struct drm_device *dev)
1489 drm_i915_private_t *dev_priv = dev->dev_private;
1490 struct intel_overlay *overlay = dev_priv->overlay;
1491 struct intel_overlay_error_state *error;
1492 struct overlay_registers __iomem *regs;
1494 if (!overlay || !overlay->active)
1497 error = kmalloc(sizeof(*error), GFP_ATOMIC);
1501 error->dovsta = I915_READ(DOVSTA);
1502 error->isr = I915_READ(ISR);
1503 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1504 error->base = (long) overlay->reg_bo->phys_obj->handle->vaddr;
1506 error->base = (long) overlay->reg_bo->gtt_offset;
1508 regs = intel_overlay_map_regs_atomic(overlay, KM_IRQ0);
1512 memcpy_fromio(&error->regs, regs, sizeof(struct overlay_registers));
1513 intel_overlay_unmap_regs_atomic(overlay, KM_IRQ0, regs);
1523 intel_overlay_print_error_state(struct seq_file *m, struct intel_overlay_error_state *error)
1525 seq_printf(m, "Overlay, status: 0x%08x, interrupt: 0x%08x\n",
1526 error->dovsta, error->isr);
1527 seq_printf(m, " Register file at 0x%08lx:\n",
1530 #define P(x) seq_printf(m, " " #x ": 0x%08x\n", error->regs.x)