4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Daniel Vetter <daniel@ffwll.ch>
26 * Derived from Xorg ddx, xf86-video-intel, src/i830_video.c
29 #include <linux/seq_file.h>
35 #include "intel_drv.h"
37 /* Limits for overlay size. According to the Intel docs, the real limits are:
38 * Y width: 4095, UV width (planar): 2047, Y height: 2047,
39 * UV height (planar): 1023. But the Xorg driver assumes 2048 for height and
40 * width. Use the minimum of both. */
/* Upper bounds for the source image on everything except 830/845;
 * check_overlay_src() compares src_width/src_height against them. */
41 #define IMAGE_MAX_WIDTH 2048
42 #define IMAGE_MAX_HEIGHT 2046 /* 2 * 1023 */
43 /* on 830 and 845 these large limits result in the card hanging */
/* check_overlay_src() uses the _LEGACY pair when IS_845G() or IS_I830()
 * is true for the device. */
44 #define IMAGE_MAX_WIDTH_LEGACY 1024
45 #define IMAGE_MAX_HEIGHT_LEGACY 1088
47 /* overlay register definitions
 *
 * Bit fields of the OCMD (overlay command) register. overlay_cmd_reg()
 * starts from OCMD_ENABLE | OCMD_BUF_TYPE_FRAME | OCMD_BUFFER0 and ORs in
 * one of the source-format values (and byte-swap bits) chosen from the
 * put-image format; the result is stored in regs->OCMD.
 */
/* bit 19: tiled source surface */
49 #define OCMD_TILED_SURFACE (0x1<<19)
/* bits 18:17: mirroring */
50 #define OCMD_MIRROR_MASK (0x3<<17)
51 #define OCMD_MIRROR_MODE (0x3<<17)
52 #define OCMD_MIRROR_HORIZONTAL (0x1<<17)
53 #define OCMD_MIRROR_VERTICAL (0x2<<17)
54 #define OCMD_MIRROR_BOTH (0x3<<17)
/* bits 15:14: byte order of packed YUV data */
55 #define OCMD_BYTEORDER_MASK (0x3<<14) /* zero for YUYV or FOURCC YUY2 */
56 #define OCMD_UV_SWAP (0x1<<14) /* YVYU */
57 #define OCMD_Y_SWAP (0x2<<14) /* UYVY or FOURCC UYVY */
58 #define OCMD_Y_AND_UV_SWAP (0x3<<14) /* VYUY */
/* bits 13:10: source pixel format */
59 #define OCMD_SOURCE_FORMAT_MASK (0xf<<10)
60 #define OCMD_RGB_888 (0x1<<10) /* not in i965 Intel docs */
61 #define OCMD_RGB_555 (0x2<<10) /* not in i965 Intel docs */
62 #define OCMD_RGB_565 (0x3<<10) /* not in i965 Intel docs */
63 #define OCMD_YUV_422_PACKED (0x8<<10)
64 #define OCMD_YUV_411_PACKED (0x9<<10) /* not in i965 Intel docs */
65 #define OCMD_YUV_420_PLANAR (0xc<<10)
66 #define OCMD_YUV_422_PLANAR (0xd<<10)
/* overlay_cmd_reg() selects this value for both planar YUV411 and YUV410 */
67 #define OCMD_YUV_410_PLANAR (0xe<<10) /* also 411 */
68 #define OCMD_TVSYNCFLIP_PARITY (0x1<<9)
69 #define OCMD_TVSYNCFLIP_ENABLE (0x1<<7)
/* bit 5: frame vs. field buffer type */
70 #define OCMD_BUF_TYPE_MASK (0x1<<5)
71 #define OCMD_BUF_TYPE_FRAME (0x0<<5)
72 #define OCMD_BUF_TYPE_FIELD (0x1<<5)
73 #define OCMD_TEST_MODE (0x1<<4)
/* bits 3:2: buffer select */
74 #define OCMD_BUFFER_SELECT (0x3<<2)
75 #define OCMD_BUFFER0 (0x0<<2)
76 #define OCMD_BUFFER1 (0x1<<2)
/* NOTE(review): OCMD_FIELD0/OCMD_FIELD1 below are encoded at bit 1, but this
 * mask is bit 2 and therefore equal to OCMD_BUFFER1 -- it looks like it
 * should be (0x1<<1). Confirm against the hardware docs before using it. */
77 #define OCMD_FIELD_SELECT (0x1<<2)
78 #define OCMD_FIELD0 (0x0<<1)
79 #define OCMD_FIELD1 (0x1<<1)
/* bit 0: overlay enable */
80 #define OCMD_ENABLE (0x1<<0)
82 /* OCONFIG register
 *
 * intel_overlay_do_put_image() programs regs->OCONFIG while the overlay is
 * still inactive: it starts from OCONF_CC_OUT_8BIT, adds
 * OCONF_CSC_MODE_BT709 when IS_I965GM() is true, and ORs in OCONF_PIPE_A
 * or OCONF_PIPE_B depending on whether crtc->pipe is 0.
 */
/* bit 18: pipe the overlay is attached to */
83 #define OCONF_PIPE_MASK (0x1<<18)
84 #define OCONF_PIPE_A (0x0<<18)
85 #define OCONF_PIPE_B (0x1<<18)
86 #define OCONF_GAMMA2_ENABLE (0x1<<16)
/* bit 5: colour-space-conversion mode */
87 #define OCONF_CSC_MODE_BT601 (0x0<<5)
88 #define OCONF_CSC_MODE_BT709 (0x1<<5)
89 #define OCONF_CSC_BYPASS (0x1<<4)
90 #define OCONF_CC_OUT_8BIT (0x1<<3)
91 #define OCONF_TEST_MODE (0x1<<2)
/* bit 0: line-buffer configuration */
92 #define OCONF_THREE_LINE_BUFFER (0x1<<0)
93 #define OCONF_TWO_LINE_BUFFER (0x0<<0)
/*
 * DCLRKM (dst-key) register.
 *
 * DST_KEY_ENABLE is bit 31. It is spelled with an unsigned constant because
 * shifting a signed 1 into the sign bit is undefined behaviour in C; the
 * resulting bit pattern is unchanged.
 *
 * update_colorkey() writes one of the CLK_*_MASK values, OR-ed with
 * DST_KEY_ENABLE, into regs->DCLRKM depending on the framebuffer's
 * bits_per_pixel/depth.
 */
#define DST_KEY_ENABLE		(0x1u<<31)
#define CLK_RGB24_MASK		0x0
#define CLK_RGB16_MASK		0x070307
#define CLK_RGB15_MASK		0x070707
#define CLK_RGB8I_MASK		0xffffff

/*
 * Spread a 16-bit (5:6:5) or 15-bit (5:5:5) pixel value over three bytes,
 * placing each channel in the top bits of its byte; update_colorkey()
 * stores the result in regs->DCLRKV.
 *
 * The argument is parenthesized so that expressions such as `a | b` are
 * masked as a whole. Note that `c` is still evaluated three times, so it
 * must not have side effects.
 */
#define RGB16_TO_COLORKEY(c)	\
	((((c) & 0xF800) << 8) | (((c) & 0x07E0) << 5) | (((c) & 0x001F) << 3))
#define RGB15_TO_COLORKEY(c)	\
	((((c) & 0x7c00) << 9) | (((c) & 0x03E0) << 6) | (((c) & 0x001F) << 3))
107 /* overlay flip addr flag
 *
 * OR-ed into the flip address that is emitted to the ring after an
 * MI_OVERLAY_FLIP command. intel_overlay_on() and intel_overlay_off()
 * always set it; intel_overlay_continue() sets it only when
 * load_polyphase_filter is true.
 */
108 #define OFC_UPDATE 0x1
110 /* polyphase filter coefficients
 *
 * Tap counts per filter direction and plane. Multiplied by N_PHASES they
 * give the lengths of the Y_/UV_ VCOEFS/HCOEFS arrays in
 * struct overlay_registers and of the static coefficient tables.
 */
111 #define N_HORIZ_Y_TAPS 5
112 #define N_VERT_Y_TAPS 3
113 #define N_HORIZ_UV_TAPS 3
114 #define N_VERT_UV_TAPS 3
118 /* memory-buffered overlay registers */
119 struct overlay_registers
{
147 u32 RESERVED1
; /* 0x6C */
160 u32 FASTHSCALE
; /* 0xA0 */
161 u32 UVSCALEV
; /* 0xA4 */
162 u32 RESERVEDC
[(0x200 - 0xA8) / 4]; /* 0xA8 - 0x1FC */
163 u16 Y_VCOEFS
[N_VERT_Y_TAPS
* N_PHASES
]; /* 0x200 */
164 u16 RESERVEDD
[0x100 / 2 - N_VERT_Y_TAPS
* N_PHASES
];
165 u16 Y_HCOEFS
[N_HORIZ_Y_TAPS
* N_PHASES
]; /* 0x300 */
166 u16 RESERVEDE
[0x200 / 2 - N_HORIZ_Y_TAPS
* N_PHASES
];
167 u16 UV_VCOEFS
[N_VERT_UV_TAPS
* N_PHASES
]; /* 0x500 */
168 u16 RESERVEDF
[0x100 / 2 - N_VERT_UV_TAPS
* N_PHASES
];
169 u16 UV_HCOEFS
[N_HORIZ_UV_TAPS
* N_PHASES
]; /* 0x600 */
170 u16 RESERVEDG
[0x100 / 2 - N_HORIZ_UV_TAPS
* N_PHASES
];
173 static struct overlay_registers
*
174 intel_overlay_map_regs_atomic(struct intel_overlay
*overlay
,
177 drm_i915_private_t
*dev_priv
= overlay
->dev
->dev_private
;
178 struct overlay_registers
*regs
;
180 if (OVERLAY_NEEDS_PHYSICAL(overlay
->dev
))
181 regs
= overlay
->reg_bo
->phys_obj
->handle
->vaddr
;
183 regs
= io_mapping_map_atomic_wc(dev_priv
->mm
.gtt_mapping
,
184 overlay
->reg_bo
->gtt_offset
,
190 static void intel_overlay_unmap_regs_atomic(struct intel_overlay
*overlay
,
192 struct overlay_registers
*regs
)
194 if (!OVERLAY_NEEDS_PHYSICAL(overlay
->dev
))
195 io_mapping_unmap_atomic(regs
, slot
);
198 static struct overlay_registers
*
199 intel_overlay_map_regs(struct intel_overlay
*overlay
)
201 drm_i915_private_t
*dev_priv
= overlay
->dev
->dev_private
;
202 struct overlay_registers
*regs
;
204 if (OVERLAY_NEEDS_PHYSICAL(overlay
->dev
))
205 regs
= overlay
->reg_bo
->phys_obj
->handle
->vaddr
;
207 regs
= io_mapping_map_wc(dev_priv
->mm
.gtt_mapping
,
208 overlay
->reg_bo
->gtt_offset
);
213 static void intel_overlay_unmap_regs(struct intel_overlay
*overlay
,
214 struct overlay_registers
*regs
)
216 if (!OVERLAY_NEEDS_PHYSICAL(overlay
->dev
))
217 io_mapping_unmap(regs
);
220 static int intel_overlay_do_wait_request(struct intel_overlay
*overlay
,
224 struct drm_device
*dev
= overlay
->dev
;
225 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
228 overlay
->last_flip_req
=
229 i915_add_request(dev
, NULL
, &dev_priv
->render_ring
);
230 if (overlay
->last_flip_req
== 0)
233 overlay
->hw_wedged
= stage
;
234 ret
= i915_do_wait_request(dev
,
235 overlay
->last_flip_req
, true,
236 &dev_priv
->render_ring
);
240 overlay
->hw_wedged
= 0;
241 overlay
->last_flip_req
= 0;
245 /* overlay needs to be disabled in OCMD reg */
246 static int intel_overlay_on(struct intel_overlay
*overlay
)
248 struct drm_device
*dev
= overlay
->dev
;
250 BUG_ON(overlay
->active
);
255 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_ON
);
256 OUT_RING(overlay
->flip_addr
| OFC_UPDATE
);
257 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
261 return intel_overlay_do_wait_request(overlay
, true,
262 NEEDS_WAIT_FOR_FLIP
);
265 /* overlay needs to be enabled in OCMD reg */
266 static void intel_overlay_continue(struct intel_overlay
*overlay
,
267 bool load_polyphase_filter
)
269 struct drm_device
*dev
= overlay
->dev
;
270 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
271 u32 flip_addr
= overlay
->flip_addr
;
274 BUG_ON(!overlay
->active
);
276 if (load_polyphase_filter
)
277 flip_addr
|= OFC_UPDATE
;
279 /* check for underruns */
280 tmp
= I915_READ(DOVSTA
);
282 DRM_DEBUG("overlay underrun, DOVSTA: %x\n", tmp
);
285 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_CONTINUE
);
289 overlay
->last_flip_req
=
290 i915_add_request(dev
, NULL
, &dev_priv
->render_ring
);
293 static int intel_overlay_wait_flip(struct intel_overlay
*overlay
)
295 struct drm_device
*dev
= overlay
->dev
;
296 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
300 if (overlay
->last_flip_req
!= 0) {
301 ret
= i915_do_wait_request(dev
,
302 overlay
->last_flip_req
, true,
303 &dev_priv
->render_ring
);
305 overlay
->last_flip_req
= 0;
307 tmp
= I915_READ(ISR
);
309 if (!(tmp
& I915_OVERLAY_PLANE_FLIP_PENDING_INTERRUPT
))
314 /* synchronous slowpath */
316 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
320 return intel_overlay_do_wait_request(overlay
, true, RELEASE_OLD_VID
);
323 /* overlay needs to be disabled in OCMD reg */
324 static int intel_overlay_off(struct intel_overlay
*overlay
)
326 u32 flip_addr
= overlay
->flip_addr
;
327 struct drm_device
*dev
= overlay
->dev
;
330 BUG_ON(!overlay
->active
);
332 /* According to intel docs the overlay hw may hang (when switching
333 * off) without loading the filter coeffs. It is however unclear whether
334 * this applies to the disabling of the overlay or to the switching off
335 * of the hw. Do it in both cases */
336 flip_addr
|= OFC_UPDATE
;
338 /* wait for overlay to go idle */
340 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_CONTINUE
);
342 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
346 ret
= intel_overlay_do_wait_request(overlay
, true,
351 /* turn overlay off */
353 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_OFF
);
355 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
359 return intel_overlay_do_wait_request(overlay
, true,
363 static void intel_overlay_off_tail(struct intel_overlay
*overlay
)
365 struct drm_gem_object
*obj
;
367 /* never have the overlay hw on without showing a frame */
368 BUG_ON(!overlay
->vid_bo
);
369 obj
= &overlay
->vid_bo
->base
;
371 i915_gem_object_unpin(obj
);
372 drm_gem_object_unreference(obj
);
373 overlay
->vid_bo
= NULL
;
375 overlay
->crtc
->overlay
= NULL
;
376 overlay
->crtc
= NULL
;
380 /* Recover from an interruption due to a signal.
381 * We have to be careful not to repeat work forever and to make forward progress. */
382 int intel_overlay_recover_from_interrupt(struct intel_overlay
*overlay
,
385 struct drm_device
*dev
= overlay
->dev
;
386 struct drm_gem_object
*obj
;
387 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
391 if (overlay
->hw_wedged
== HW_WEDGED
)
394 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
,
395 interruptible
, &dev_priv
->render_ring
);
399 switch (overlay
->hw_wedged
) {
400 case RELEASE_OLD_VID
:
401 obj
= &overlay
->old_vid_bo
->base
;
402 i915_gem_object_unpin(obj
);
403 drm_gem_object_unreference(obj
);
404 overlay
->old_vid_bo
= NULL
;
407 case SWITCH_OFF_STAGE_1
:
408 flip_addr
= overlay
->flip_addr
;
409 flip_addr
|= OFC_UPDATE
;
412 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_OFF
);
414 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
418 ret
= intel_overlay_do_wait_request(overlay
, interruptible
,
423 case SWITCH_OFF_STAGE_2
:
424 intel_overlay_off_tail(overlay
);
427 BUG_ON(overlay
->hw_wedged
!= NEEDS_WAIT_FOR_FLIP
);
430 overlay
->hw_wedged
= 0;
431 overlay
->last_flip_req
= 0;
435 /* Wait for pending overlay flip and release old frame.
436 * Needs to be called before the overlay registers are changed
437 * via intel_overlay_(un)map_regs
439 static int intel_overlay_release_old_vid(struct intel_overlay
*overlay
)
442 struct drm_gem_object
*obj
;
444 /* only wait if there is actually an old frame to release to
445 * guarantee forward progress */
446 if (!overlay
->old_vid_bo
)
449 ret
= intel_overlay_wait_flip(overlay
);
453 obj
= &overlay
->old_vid_bo
->base
;
454 i915_gem_object_unpin(obj
);
455 drm_gem_object_unreference(obj
);
456 overlay
->old_vid_bo
= NULL
;
461 struct put_image_params
{
478 static int packed_depth_bytes(u32 format
)
480 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
481 case I915_OVERLAY_YUV422
:
483 case I915_OVERLAY_YUV411
:
484 /* return 6; not implemented */
490 static int packed_width_bytes(u32 format
, short width
)
492 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
493 case I915_OVERLAY_YUV422
:
500 static int uv_hsubsampling(u32 format
)
502 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
503 case I915_OVERLAY_YUV422
:
504 case I915_OVERLAY_YUV420
:
506 case I915_OVERLAY_YUV411
:
507 case I915_OVERLAY_YUV410
:
514 static int uv_vsubsampling(u32 format
)
516 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
517 case I915_OVERLAY_YUV420
:
518 case I915_OVERLAY_YUV410
:
520 case I915_OVERLAY_YUV422
:
521 case I915_OVERLAY_YUV411
:
528 static u32
calc_swidthsw(struct drm_device
*dev
, u32 offset
, u32 width
)
530 u32 mask
, shift
, ret
;
538 ret
= ((offset
+ width
+ mask
) >> shift
) - (offset
>> shift
);
545 static const u16 y_static_hcoeffs
[N_HORIZ_Y_TAPS
* N_PHASES
] = {
546 0x3000, 0xb4a0, 0x1930, 0x1920, 0xb4a0,
547 0x3000, 0xb500, 0x19d0, 0x1880, 0xb440,
548 0x3000, 0xb540, 0x1a88, 0x2f80, 0xb3e0,
549 0x3000, 0xb580, 0x1b30, 0x2e20, 0xb380,
550 0x3000, 0xb5c0, 0x1bd8, 0x2cc0, 0xb320,
551 0x3020, 0xb5e0, 0x1c60, 0x2b80, 0xb2c0,
552 0x3020, 0xb5e0, 0x1cf8, 0x2a20, 0xb260,
553 0x3020, 0xb5e0, 0x1d80, 0x28e0, 0xb200,
554 0x3020, 0xb5c0, 0x1e08, 0x3f40, 0xb1c0,
555 0x3020, 0xb580, 0x1e78, 0x3ce0, 0xb160,
556 0x3040, 0xb520, 0x1ed8, 0x3aa0, 0xb120,
557 0x3040, 0xb4a0, 0x1f30, 0x3880, 0xb0e0,
558 0x3040, 0xb400, 0x1f78, 0x3680, 0xb0a0,
559 0x3020, 0xb340, 0x1fb8, 0x34a0, 0xb060,
560 0x3020, 0xb240, 0x1fe0, 0x32e0, 0xb040,
561 0x3020, 0xb140, 0x1ff8, 0x3160, 0xb020,
562 0xb000, 0x3000, 0x0800, 0x3000, 0xb000
565 static const u16 uv_static_hcoeffs
[N_HORIZ_UV_TAPS
* N_PHASES
] = {
566 0x3000, 0x1800, 0x1800, 0xb000, 0x18d0, 0x2e60,
567 0xb000, 0x1990, 0x2ce0, 0xb020, 0x1a68, 0x2b40,
568 0xb040, 0x1b20, 0x29e0, 0xb060, 0x1bd8, 0x2880,
569 0xb080, 0x1c88, 0x3e60, 0xb0a0, 0x1d28, 0x3c00,
570 0xb0c0, 0x1db8, 0x39e0, 0xb0e0, 0x1e40, 0x37e0,
571 0xb100, 0x1eb8, 0x3620, 0xb100, 0x1f18, 0x34a0,
572 0xb100, 0x1f68, 0x3360, 0xb0e0, 0x1fa8, 0x3240,
573 0xb0c0, 0x1fe0, 0x3140, 0xb060, 0x1ff0, 0x30a0,
574 0x3000, 0x0800, 0x3000
577 static void update_polyphase_filter(struct overlay_registers
*regs
)
579 memcpy(regs
->Y_HCOEFS
, y_static_hcoeffs
, sizeof(y_static_hcoeffs
));
580 memcpy(regs
->UV_HCOEFS
, uv_static_hcoeffs
, sizeof(uv_static_hcoeffs
));
583 static bool update_scaling_factors(struct intel_overlay
*overlay
,
584 struct overlay_registers
*regs
,
585 struct put_image_params
*params
)
587 /* fixed point with a 12 bit shift */
588 u32 xscale
, yscale
, xscale_UV
, yscale_UV
;
590 #define FRACT_MASK 0xfff
591 bool scale_changed
= false;
592 int uv_hscale
= uv_hsubsampling(params
->format
);
593 int uv_vscale
= uv_vsubsampling(params
->format
);
595 if (params
->dst_w
> 1)
596 xscale
= ((params
->src_scan_w
- 1) << FP_SHIFT
)
599 xscale
= 1 << FP_SHIFT
;
601 if (params
->dst_h
> 1)
602 yscale
= ((params
->src_scan_h
- 1) << FP_SHIFT
)
605 yscale
= 1 << FP_SHIFT
;
607 /*if (params->format & I915_OVERLAY_YUV_PLANAR) {*/
608 xscale_UV
= xscale
/uv_hscale
;
609 yscale_UV
= yscale
/uv_vscale
;
610 /* make the Y scale to UV scale ratio an exact multiply */
611 xscale
= xscale_UV
* uv_hscale
;
612 yscale
= yscale_UV
* uv_vscale
;
618 if (xscale
!= overlay
->old_xscale
|| yscale
!= overlay
->old_yscale
)
619 scale_changed
= true;
620 overlay
->old_xscale
= xscale
;
621 overlay
->old_yscale
= yscale
;
623 regs
->YRGBSCALE
= (((yscale
& FRACT_MASK
) << 20) |
624 ((xscale
>> FP_SHIFT
) << 16) |
625 ((xscale
& FRACT_MASK
) << 3));
627 regs
->UVSCALE
= (((yscale_UV
& FRACT_MASK
) << 20) |
628 ((xscale_UV
>> FP_SHIFT
) << 16) |
629 ((xscale_UV
& FRACT_MASK
) << 3));
631 regs
->UVSCALEV
= ((((yscale
>> FP_SHIFT
) << 16) |
632 ((yscale_UV
>> FP_SHIFT
) << 0)));
635 update_polyphase_filter(regs
);
637 return scale_changed
;
640 static void update_colorkey(struct intel_overlay
*overlay
,
641 struct overlay_registers
*regs
)
643 u32 key
= overlay
->color_key
;
645 switch (overlay
->crtc
->base
.fb
->bits_per_pixel
) {
648 regs
->DCLRKM
= CLK_RGB8I_MASK
| DST_KEY_ENABLE
;
652 if (overlay
->crtc
->base
.fb
->depth
== 15) {
653 regs
->DCLRKV
= RGB15_TO_COLORKEY(key
);
654 regs
->DCLRKM
= CLK_RGB15_MASK
| DST_KEY_ENABLE
;
656 regs
->DCLRKV
= RGB16_TO_COLORKEY(key
);
657 regs
->DCLRKM
= CLK_RGB16_MASK
| DST_KEY_ENABLE
;
664 regs
->DCLRKM
= CLK_RGB24_MASK
| DST_KEY_ENABLE
;
669 static u32
overlay_cmd_reg(struct put_image_params
*params
)
671 u32 cmd
= OCMD_ENABLE
| OCMD_BUF_TYPE_FRAME
| OCMD_BUFFER0
;
673 if (params
->format
& I915_OVERLAY_YUV_PLANAR
) {
674 switch (params
->format
& I915_OVERLAY_DEPTH_MASK
) {
675 case I915_OVERLAY_YUV422
:
676 cmd
|= OCMD_YUV_422_PLANAR
;
678 case I915_OVERLAY_YUV420
:
679 cmd
|= OCMD_YUV_420_PLANAR
;
681 case I915_OVERLAY_YUV411
:
682 case I915_OVERLAY_YUV410
:
683 cmd
|= OCMD_YUV_410_PLANAR
;
686 } else { /* YUV packed */
687 switch (params
->format
& I915_OVERLAY_DEPTH_MASK
) {
688 case I915_OVERLAY_YUV422
:
689 cmd
|= OCMD_YUV_422_PACKED
;
691 case I915_OVERLAY_YUV411
:
692 cmd
|= OCMD_YUV_411_PACKED
;
696 switch (params
->format
& I915_OVERLAY_SWAP_MASK
) {
697 case I915_OVERLAY_NO_SWAP
:
699 case I915_OVERLAY_UV_SWAP
:
702 case I915_OVERLAY_Y_SWAP
:
705 case I915_OVERLAY_Y_AND_UV_SWAP
:
706 cmd
|= OCMD_Y_AND_UV_SWAP
;
714 int intel_overlay_do_put_image(struct intel_overlay
*overlay
,
715 struct drm_gem_object
*new_bo
,
716 struct put_image_params
*params
)
719 struct overlay_registers
*regs
;
720 bool scale_changed
= false;
721 struct drm_i915_gem_object
*bo_priv
= to_intel_bo(new_bo
);
722 struct drm_device
*dev
= overlay
->dev
;
724 BUG_ON(!mutex_is_locked(&dev
->struct_mutex
));
725 BUG_ON(!mutex_is_locked(&dev
->mode_config
.mutex
));
728 ret
= intel_overlay_release_old_vid(overlay
);
732 ret
= i915_gem_object_pin(new_bo
, PAGE_SIZE
);
736 ret
= i915_gem_object_set_to_gtt_domain(new_bo
, 0);
740 if (!overlay
->active
) {
741 regs
= intel_overlay_map_regs(overlay
);
746 regs
->OCONFIG
= OCONF_CC_OUT_8BIT
;
747 if (IS_I965GM(overlay
->dev
))
748 regs
->OCONFIG
|= OCONF_CSC_MODE_BT709
;
749 regs
->OCONFIG
|= overlay
->crtc
->pipe
== 0 ?
750 OCONF_PIPE_A
: OCONF_PIPE_B
;
751 intel_overlay_unmap_regs(overlay
, regs
);
753 ret
= intel_overlay_on(overlay
);
758 regs
= intel_overlay_map_regs(overlay
);
764 regs
->DWINPOS
= (params
->dst_y
<< 16) | params
->dst_x
;
765 regs
->DWINSZ
= (params
->dst_h
<< 16) | params
->dst_w
;
767 if (params
->format
& I915_OVERLAY_YUV_PACKED
)
768 tmp_width
= packed_width_bytes(params
->format
, params
->src_w
);
770 tmp_width
= params
->src_w
;
772 regs
->SWIDTH
= params
->src_w
;
773 regs
->SWIDTHSW
= calc_swidthsw(overlay
->dev
,
774 params
->offset_Y
, tmp_width
);
775 regs
->SHEIGHT
= params
->src_h
;
776 regs
->OBUF_0Y
= bo_priv
->gtt_offset
+ params
-> offset_Y
;
777 regs
->OSTRIDE
= params
->stride_Y
;
779 if (params
->format
& I915_OVERLAY_YUV_PLANAR
) {
780 int uv_hscale
= uv_hsubsampling(params
->format
);
781 int uv_vscale
= uv_vsubsampling(params
->format
);
783 regs
->SWIDTH
|= (params
->src_w
/uv_hscale
) << 16;
784 tmp_U
= calc_swidthsw(overlay
->dev
, params
->offset_U
,
785 params
->src_w
/uv_hscale
);
786 tmp_V
= calc_swidthsw(overlay
->dev
, params
->offset_V
,
787 params
->src_w
/uv_hscale
);
788 regs
->SWIDTHSW
|= max_t(u32
, tmp_U
, tmp_V
) << 16;
789 regs
->SHEIGHT
|= (params
->src_h
/uv_vscale
) << 16;
790 regs
->OBUF_0U
= bo_priv
->gtt_offset
+ params
->offset_U
;
791 regs
->OBUF_0V
= bo_priv
->gtt_offset
+ params
->offset_V
;
792 regs
->OSTRIDE
|= params
->stride_UV
<< 16;
795 scale_changed
= update_scaling_factors(overlay
, regs
, params
);
797 update_colorkey(overlay
, regs
);
799 regs
->OCMD
= overlay_cmd_reg(params
);
801 intel_overlay_unmap_regs(overlay
, regs
);
803 intel_overlay_continue(overlay
, scale_changed
);
805 overlay
->old_vid_bo
= overlay
->vid_bo
;
806 overlay
->vid_bo
= to_intel_bo(new_bo
);
811 i915_gem_object_unpin(new_bo
);
815 int intel_overlay_switch_off(struct intel_overlay
*overlay
)
818 struct overlay_registers
*regs
;
819 struct drm_device
*dev
= overlay
->dev
;
821 BUG_ON(!mutex_is_locked(&dev
->struct_mutex
));
822 BUG_ON(!mutex_is_locked(&dev
->mode_config
.mutex
));
824 if (overlay
->hw_wedged
) {
825 ret
= intel_overlay_recover_from_interrupt(overlay
, 1);
830 if (!overlay
->active
)
833 ret
= intel_overlay_release_old_vid(overlay
);
837 regs
= intel_overlay_map_regs(overlay
);
839 intel_overlay_unmap_regs(overlay
, regs
);
841 ret
= intel_overlay_off(overlay
);
845 intel_overlay_off_tail(overlay
);
850 static int check_overlay_possible_on_crtc(struct intel_overlay
*overlay
,
851 struct intel_crtc
*crtc
)
853 drm_i915_private_t
*dev_priv
= overlay
->dev
->dev_private
;
855 int pipeconf_reg
= (crtc
->pipe
== 0) ? PIPEACONF
: PIPEBCONF
;
857 if (!crtc
->base
.enabled
|| crtc
->dpms_mode
!= DRM_MODE_DPMS_ON
)
860 pipeconf
= I915_READ(pipeconf_reg
);
862 /* can't use the overlay with double wide pipe */
863 if (!IS_I965G(overlay
->dev
) && pipeconf
& PIPEACONF_DOUBLE_WIDE
)
869 static void update_pfit_vscale_ratio(struct intel_overlay
*overlay
)
871 struct drm_device
*dev
= overlay
->dev
;
872 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
873 u32 pfit_control
= I915_READ(PFIT_CONTROL
);
876 /* XXX: This is not the same logic as in the xorg driver, but more in
877 * line with the intel documentation for the i965
879 if (!IS_I965G(dev
)) {
880 if (pfit_control
& VERT_AUTO_SCALE
)
881 ratio
= I915_READ(PFIT_AUTO_RATIOS
);
883 ratio
= I915_READ(PFIT_PGM_RATIOS
);
884 ratio
>>= PFIT_VERT_SCALE_SHIFT
;
885 } else { /* on i965 use the PGM reg to read out the autoscaler values */
886 ratio
= I915_READ(PFIT_PGM_RATIOS
) >> PFIT_VERT_SCALE_SHIFT_965
;
889 overlay
->pfit_vscale_ratio
= ratio
;
892 static int check_overlay_dst(struct intel_overlay
*overlay
,
893 struct drm_intel_overlay_put_image
*rec
)
895 struct drm_display_mode
*mode
= &overlay
->crtc
->base
.mode
;
897 if (rec
->dst_x
< mode
->crtc_hdisplay
&&
898 rec
->dst_x
+ rec
->dst_width
<= mode
->crtc_hdisplay
&&
899 rec
->dst_y
< mode
->crtc_vdisplay
&&
900 rec
->dst_y
+ rec
->dst_height
<= mode
->crtc_vdisplay
)
906 static int check_overlay_scaling(struct put_image_params
*rec
)
910 /* downscaling limit is 8.0 */
911 tmp
= ((rec
->src_scan_h
<< 16) / rec
->dst_h
) >> 16;
914 tmp
= ((rec
->src_scan_w
<< 16) / rec
->dst_w
) >> 16;
921 static int check_overlay_src(struct drm_device
*dev
,
922 struct drm_intel_overlay_put_image
*rec
,
923 struct drm_gem_object
*new_bo
)
925 int uv_hscale
= uv_hsubsampling(rec
->flags
);
926 int uv_vscale
= uv_vsubsampling(rec
->flags
);
927 u32 stride_mask
, depth
, tmp
;
929 /* check src dimensions */
930 if (IS_845G(dev
) || IS_I830(dev
)) {
931 if (rec
->src_height
> IMAGE_MAX_HEIGHT_LEGACY
||
932 rec
->src_width
> IMAGE_MAX_WIDTH_LEGACY
)
935 if (rec
->src_height
> IMAGE_MAX_HEIGHT
||
936 rec
->src_width
> IMAGE_MAX_WIDTH
)
940 /* better safe than sorry, use 4 as the maximal subsampling ratio */
941 if (rec
->src_height
< N_VERT_Y_TAPS
*4 ||
942 rec
->src_width
< N_HORIZ_Y_TAPS
*4)
945 /* check alignment constraints */
946 switch (rec
->flags
& I915_OVERLAY_TYPE_MASK
) {
947 case I915_OVERLAY_RGB
:
948 /* not implemented */
951 case I915_OVERLAY_YUV_PACKED
:
955 depth
= packed_depth_bytes(rec
->flags
);
959 /* ignore UV planes */
963 /* check pixel alignment */
964 if (rec
->offset_Y
% depth
)
968 case I915_OVERLAY_YUV_PLANAR
:
969 if (uv_vscale
< 0 || uv_hscale
< 0)
971 /* no offset restrictions for planar formats */
978 if (rec
->src_width
% uv_hscale
)
981 /* stride checking */
982 if (IS_I830(dev
) || IS_845G(dev
))
987 if (rec
->stride_Y
& stride_mask
|| rec
->stride_UV
& stride_mask
)
989 if (IS_I965G(dev
) && rec
->stride_Y
< 512)
992 tmp
= (rec
->flags
& I915_OVERLAY_TYPE_MASK
) == I915_OVERLAY_YUV_PLANAR
?
994 if (rec
->stride_Y
> tmp
|| rec
->stride_UV
> 2*1024)
997 /* check buffer dimensions */
998 switch (rec
->flags
& I915_OVERLAY_TYPE_MASK
) {
999 case I915_OVERLAY_RGB
:
1000 case I915_OVERLAY_YUV_PACKED
:
1001 /* always 4 Y values per depth pixels */
1002 if (packed_width_bytes(rec
->flags
, rec
->src_width
) > rec
->stride_Y
)
1005 tmp
= rec
->stride_Y
*rec
->src_height
;
1006 if (rec
->offset_Y
+ tmp
> new_bo
->size
)
1010 case I915_OVERLAY_YUV_PLANAR
:
1011 if (rec
->src_width
> rec
->stride_Y
)
1013 if (rec
->src_width
/uv_hscale
> rec
->stride_UV
)
1016 tmp
= rec
->stride_Y
* rec
->src_height
;
1017 if (rec
->offset_Y
+ tmp
> new_bo
->size
)
1020 tmp
= rec
->stride_UV
* (rec
->src_height
/ uv_vscale
);
1021 if (rec
->offset_U
+ tmp
> new_bo
->size
||
1022 rec
->offset_V
+ tmp
> new_bo
->size
)
1030 int intel_overlay_put_image(struct drm_device
*dev
, void *data
,
1031 struct drm_file
*file_priv
)
1033 struct drm_intel_overlay_put_image
*put_image_rec
= data
;
1034 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1035 struct intel_overlay
*overlay
;
1036 struct drm_mode_object
*drmmode_obj
;
1037 struct intel_crtc
*crtc
;
1038 struct drm_gem_object
*new_bo
;
1039 struct put_image_params
*params
;
1043 DRM_ERROR("called with no initialization\n");
1047 overlay
= dev_priv
->overlay
;
1049 DRM_DEBUG("userspace bug: no overlay\n");
1053 if (!(put_image_rec
->flags
& I915_OVERLAY_ENABLE
)) {
1054 mutex_lock(&dev
->mode_config
.mutex
);
1055 mutex_lock(&dev
->struct_mutex
);
1057 ret
= intel_overlay_switch_off(overlay
);
1059 mutex_unlock(&dev
->struct_mutex
);
1060 mutex_unlock(&dev
->mode_config
.mutex
);
1065 params
= kmalloc(sizeof(struct put_image_params
), GFP_KERNEL
);
1069 drmmode_obj
= drm_mode_object_find(dev
, put_image_rec
->crtc_id
,
1070 DRM_MODE_OBJECT_CRTC
);
1075 crtc
= to_intel_crtc(obj_to_crtc(drmmode_obj
));
1077 new_bo
= drm_gem_object_lookup(dev
, file_priv
,
1078 put_image_rec
->bo_handle
);
1084 mutex_lock(&dev
->mode_config
.mutex
);
1085 mutex_lock(&dev
->struct_mutex
);
1087 if (overlay
->hw_wedged
) {
1088 ret
= intel_overlay_recover_from_interrupt(overlay
, 1);
1093 if (overlay
->crtc
!= crtc
) {
1094 struct drm_display_mode
*mode
= &crtc
->base
.mode
;
1095 ret
= intel_overlay_switch_off(overlay
);
1099 ret
= check_overlay_possible_on_crtc(overlay
, crtc
);
1103 overlay
->crtc
= crtc
;
1104 crtc
->overlay
= overlay
;
1106 if (intel_panel_fitter_pipe(dev
) == crtc
->pipe
1107 /* and line too wide, i.e. one-line-mode */
1108 && mode
->hdisplay
> 1024) {
1109 overlay
->pfit_active
= 1;
1110 update_pfit_vscale_ratio(overlay
);
1112 overlay
->pfit_active
= 0;
1115 ret
= check_overlay_dst(overlay
, put_image_rec
);
1119 if (overlay
->pfit_active
) {
1120 params
->dst_y
= ((((u32
)put_image_rec
->dst_y
) << 12) /
1121 overlay
->pfit_vscale_ratio
);
1122 /* shifting right rounds downwards, so add 1 */
1123 params
->dst_h
= ((((u32
)put_image_rec
->dst_height
) << 12) /
1124 overlay
->pfit_vscale_ratio
) + 1;
1126 params
->dst_y
= put_image_rec
->dst_y
;
1127 params
->dst_h
= put_image_rec
->dst_height
;
1129 params
->dst_x
= put_image_rec
->dst_x
;
1130 params
->dst_w
= put_image_rec
->dst_width
;
1132 params
->src_w
= put_image_rec
->src_width
;
1133 params
->src_h
= put_image_rec
->src_height
;
1134 params
->src_scan_w
= put_image_rec
->src_scan_width
;
1135 params
->src_scan_h
= put_image_rec
->src_scan_height
;
1136 if (params
->src_scan_h
> params
->src_h
||
1137 params
->src_scan_w
> params
->src_w
) {
1142 ret
= check_overlay_src(dev
, put_image_rec
, new_bo
);
1145 params
->format
= put_image_rec
->flags
& ~I915_OVERLAY_FLAGS_MASK
;
1146 params
->stride_Y
= put_image_rec
->stride_Y
;
1147 params
->stride_UV
= put_image_rec
->stride_UV
;
1148 params
->offset_Y
= put_image_rec
->offset_Y
;
1149 params
->offset_U
= put_image_rec
->offset_U
;
1150 params
->offset_V
= put_image_rec
->offset_V
;
1152 /* Check scaling after src size to prevent a divide-by-zero. */
1153 ret
= check_overlay_scaling(params
);
1157 ret
= intel_overlay_do_put_image(overlay
, new_bo
, params
);
1161 mutex_unlock(&dev
->struct_mutex
);
1162 mutex_unlock(&dev
->mode_config
.mutex
);
1169 mutex_unlock(&dev
->struct_mutex
);
1170 mutex_unlock(&dev
->mode_config
.mutex
);
1171 drm_gem_object_unreference_unlocked(new_bo
);
1178 static void update_reg_attrs(struct intel_overlay
*overlay
,
1179 struct overlay_registers
*regs
)
1181 regs
->OCLRC0
= (overlay
->contrast
<< 18) | (overlay
->brightness
& 0xff);
1182 regs
->OCLRC1
= overlay
->saturation
;
1185 static bool check_gamma_bounds(u32 gamma1
, u32 gamma2
)
1189 if (gamma1
& 0xff000000 || gamma2
& 0xff000000)
1192 for (i
= 0; i
< 3; i
++) {
1193 if (((gamma1
>> i
*8) & 0xff) >= ((gamma2
>> i
*8) & 0xff))
1200 static bool check_gamma5_errata(u32 gamma5
)
1204 for (i
= 0; i
< 3; i
++) {
1205 if (((gamma5
>> i
*8) & 0xff) == 0x80)
1212 static int check_gamma(struct drm_intel_overlay_attrs
*attrs
)
1214 if (!check_gamma_bounds(0, attrs
->gamma0
) ||
1215 !check_gamma_bounds(attrs
->gamma0
, attrs
->gamma1
) ||
1216 !check_gamma_bounds(attrs
->gamma1
, attrs
->gamma2
) ||
1217 !check_gamma_bounds(attrs
->gamma2
, attrs
->gamma3
) ||
1218 !check_gamma_bounds(attrs
->gamma3
, attrs
->gamma4
) ||
1219 !check_gamma_bounds(attrs
->gamma4
, attrs
->gamma5
) ||
1220 !check_gamma_bounds(attrs
->gamma5
, 0x00ffffff))
1223 if (!check_gamma5_errata(attrs
->gamma5
))
1229 int intel_overlay_attrs(struct drm_device
*dev
, void *data
,
1230 struct drm_file
*file_priv
)
1232 struct drm_intel_overlay_attrs
*attrs
= data
;
1233 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1234 struct intel_overlay
*overlay
;
1235 struct overlay_registers
*regs
;
1239 DRM_ERROR("called with no initialization\n");
1243 overlay
= dev_priv
->overlay
;
1245 DRM_DEBUG("userspace bug: no overlay\n");
1249 mutex_lock(&dev
->mode_config
.mutex
);
1250 mutex_lock(&dev
->struct_mutex
);
1253 if (!(attrs
->flags
& I915_OVERLAY_UPDATE_ATTRS
)) {
1254 attrs
->color_key
= overlay
->color_key
;
1255 attrs
->brightness
= overlay
->brightness
;
1256 attrs
->contrast
= overlay
->contrast
;
1257 attrs
->saturation
= overlay
->saturation
;
1260 attrs
->gamma0
= I915_READ(OGAMC0
);
1261 attrs
->gamma1
= I915_READ(OGAMC1
);
1262 attrs
->gamma2
= I915_READ(OGAMC2
);
1263 attrs
->gamma3
= I915_READ(OGAMC3
);
1264 attrs
->gamma4
= I915_READ(OGAMC4
);
1265 attrs
->gamma5
= I915_READ(OGAMC5
);
1268 if (attrs
->brightness
< -128 || attrs
->brightness
> 127)
1270 if (attrs
->contrast
> 255)
1272 if (attrs
->saturation
> 1023)
1275 overlay
->color_key
= attrs
->color_key
;
1276 overlay
->brightness
= attrs
->brightness
;
1277 overlay
->contrast
= attrs
->contrast
;
1278 overlay
->saturation
= attrs
->saturation
;
1280 regs
= intel_overlay_map_regs(overlay
);
1286 update_reg_attrs(overlay
, regs
);
1288 intel_overlay_unmap_regs(overlay
, regs
);
1290 if (attrs
->flags
& I915_OVERLAY_UPDATE_GAMMA
) {
1294 if (overlay
->active
) {
1299 ret
= check_gamma(attrs
);
1303 I915_WRITE(OGAMC0
, attrs
->gamma0
);
1304 I915_WRITE(OGAMC1
, attrs
->gamma1
);
1305 I915_WRITE(OGAMC2
, attrs
->gamma2
);
1306 I915_WRITE(OGAMC3
, attrs
->gamma3
);
1307 I915_WRITE(OGAMC4
, attrs
->gamma4
);
1308 I915_WRITE(OGAMC5
, attrs
->gamma5
);
1314 mutex_unlock(&dev
->struct_mutex
);
1315 mutex_unlock(&dev
->mode_config
.mutex
);
1320 void intel_setup_overlay(struct drm_device
*dev
)
1322 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1323 struct intel_overlay
*overlay
;
1324 struct drm_gem_object
*reg_bo
;
1325 struct overlay_registers
*regs
;
1328 if (!HAS_OVERLAY(dev
))
1331 overlay
= kzalloc(sizeof(struct intel_overlay
), GFP_KERNEL
);
1336 reg_bo
= i915_gem_alloc_object(dev
, PAGE_SIZE
);
1339 overlay
->reg_bo
= to_intel_bo(reg_bo
);
1341 if (OVERLAY_NEEDS_PHYSICAL(dev
)) {
1342 ret
= i915_gem_attach_phys_object(dev
, reg_bo
,
1343 I915_GEM_PHYS_OVERLAY_REGS
,
1346 DRM_ERROR("failed to attach phys overlay regs\n");
1349 overlay
->flip_addr
= overlay
->reg_bo
->phys_obj
->handle
->busaddr
;
1351 ret
= i915_gem_object_pin(reg_bo
, PAGE_SIZE
);
1353 DRM_ERROR("failed to pin overlay register bo\n");
1356 overlay
->flip_addr
= overlay
->reg_bo
->gtt_offset
;
1358 ret
= i915_gem_object_set_to_gtt_domain(reg_bo
, true);
1360 DRM_ERROR("failed to move overlay register bo into the GTT\n");
1365 /* init all values */
1366 overlay
->color_key
= 0x0101fe;
1367 overlay
->brightness
= -19;
1368 overlay
->contrast
= 75;
1369 overlay
->saturation
= 146;
1371 regs
= intel_overlay_map_regs(overlay
);
1375 memset(regs
, 0, sizeof(struct overlay_registers
));
1376 update_polyphase_filter(regs
);
1377 update_reg_attrs(overlay
, regs
);
1379 intel_overlay_unmap_regs(overlay
, regs
);
1381 dev_priv
->overlay
= overlay
;
1382 DRM_INFO("initialized overlay support\n");
1386 i915_gem_object_unpin(reg_bo
);
1388 drm_gem_object_unreference(reg_bo
);
1394 void intel_cleanup_overlay(struct drm_device
*dev
)
1396 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1398 if (!dev_priv
->overlay
)
1401 /* The bo's should be free'd by the generic code already.
1402 * Furthermore modesetting teardown happens beforehand so the
1403 * hardware should be off already */
1404 BUG_ON(dev_priv
->overlay
->active
);
1406 drm_gem_object_unreference_unlocked(&dev_priv
->overlay
->reg_bo
->base
);
1407 kfree(dev_priv
->overlay
);
1410 struct intel_overlay_error_state
{
1411 struct overlay_registers regs
;
1417 struct intel_overlay_error_state
*
1418 intel_overlay_capture_error_state(struct drm_device
*dev
)
1420 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1421 struct intel_overlay
*overlay
= dev_priv
->overlay
;
1422 struct intel_overlay_error_state
*error
;
1423 struct overlay_registers __iomem
*regs
;
1425 if (!overlay
|| !overlay
->active
)
1428 error
= kmalloc(sizeof(*error
), GFP_ATOMIC
);
1432 error
->dovsta
= I915_READ(DOVSTA
);
1433 error
->isr
= I915_READ(ISR
);
1434 if (OVERLAY_NEEDS_PHYSICAL(overlay
->dev
))
1435 error
->base
= (long) overlay
->reg_bo
->phys_obj
->handle
->vaddr
;
1437 error
->base
= (long) overlay
->reg_bo
->gtt_offset
;
1439 regs
= intel_overlay_map_regs_atomic(overlay
, KM_IRQ0
);
1443 memcpy_fromio(&error
->regs
, regs
, sizeof(struct overlay_registers
));
1444 intel_overlay_unmap_regs_atomic(overlay
, KM_IRQ0
, regs
);
1454 intel_overlay_print_error_state(struct seq_file
*m
, struct intel_overlay_error_state
*error
)
1456 seq_printf(m
, "Overlay, status: 0x%08x, interrupt: 0x%08x\n",
1457 error
->dovsta
, error
->isr
);
1458 seq_printf(m
, " Register file at 0x%08lx:\n",
1461 #define P(x) seq_printf(m, " " #x ": 0x%08x\n", error->regs.x)