4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Daniel Vetter <daniel@ffwll.ch>
26 * Derived from Xorg ddx, xf86-video-intel, src/i830_video.c
33 #include "intel_drv.h"
35 /* Limits for overlay size. According to intel doc, the real limits are:
36 * Y width: 4095, UV width (planar): 2047, Y height: 2047,
37 * UV height (planar): 1023. But the Xorg driver uses 2048 for height and
38 * width. Use the minimum of both. */
39 #define IMAGE_MAX_WIDTH 2048
40 #define IMAGE_MAX_HEIGHT 2046 /* 2 * 1023 */
41 /* on 830 and 845 these large limits result in the card hanging */
42 #define IMAGE_MAX_WIDTH_LEGACY 1024
43 #define IMAGE_MAX_HEIGHT_LEGACY 1088
/* overlay register definitions */

/*
 * OCMD (overlay command) register bit fields.
 *
 * Each *_MASK macro covers the bits of one field; the macros that follow it
 * are the values that field can take.
 */
#define OCMD_TILED_SURFACE	(0x1<<19)
#define OCMD_MIRROR_MASK	(0x3<<17)
#define OCMD_MIRROR_MODE	(0x3<<17)
#define OCMD_MIRROR_HORIZONTAL	(0x1<<17)
#define OCMD_MIRROR_VERTICAL	(0x2<<17)
#define OCMD_MIRROR_BOTH	(0x3<<17)
#define OCMD_BYTEORDER_MASK	(0x3<<14) /* zero for YUYV or FOURCC YUY2 */
#define OCMD_UV_SWAP		(0x1<<14) /* YVYU */
#define OCMD_Y_SWAP		(0x2<<14) /* UYVY or FOURCC UYVY */
#define OCMD_Y_AND_UV_SWAP	(0x3<<14) /* VYUY */
#define OCMD_SOURCE_FORMAT_MASK	(0xf<<10)
#define OCMD_RGB_888		(0x1<<10) /* not in i965 Intel docs */
#define OCMD_RGB_555		(0x2<<10) /* not in i965 Intel docs */
#define OCMD_RGB_565		(0x3<<10) /* not in i965 Intel docs */
#define OCMD_YUV_422_PACKED	(0x8<<10)
#define OCMD_YUV_411_PACKED	(0x9<<10) /* not in i965 Intel docs */
#define OCMD_YUV_420_PLANAR	(0xc<<10)
#define OCMD_YUV_422_PLANAR	(0xd<<10)
#define OCMD_YUV_410_PLANAR	(0xe<<10) /* also 411 */
#define OCMD_TVSYNCFLIP_PARITY	(0x1<<9)
#define OCMD_TVSYNCFLIP_ENABLE	(0x1<<7)
/* Was spelled "Ox1" (capital letter O), which is not a numeric constant. */
#define OCMD_BUF_TYPE_MASK	(0x1<<5)
#define OCMD_BUF_TYPE_FRAME	(0x0<<5)
#define OCMD_BUF_TYPE_FIELD	(0x1<<5)
#define OCMD_TEST_MODE		(0x1<<4)
#define OCMD_BUFFER_SELECT	(0x3<<2)
#define OCMD_BUFFER0		(0x0<<2)
#define OCMD_BUFFER1		(0x1<<2)
/*
 * NOTE(review): this mask sits at bit 2 (same value as OCMD_BUFFER1) while
 * OCMD_FIELD0/OCMD_FIELD1 are encoded at bit 1 -- confirm against the
 * hardware documentation before relying on it.
 */
#define OCMD_FIELD_SELECT	(0x1<<2)
#define OCMD_FIELD0		(0x0<<1)
#define OCMD_FIELD1		(0x1<<1)
#define OCMD_ENABLE		(0x1<<0)
80 /* OCONFIG register */
81 #define OCONF_PIPE_MASK (0x1<<18)
82 #define OCONF_PIPE_A (0x0<<18)
83 #define OCONF_PIPE_B (0x1<<18)
84 #define OCONF_GAMMA2_ENABLE (0x1<<16)
85 #define OCONF_CSC_MODE_BT601 (0x0<<5)
86 #define OCONF_CSC_MODE_BT709 (0x1<<5)
87 #define OCONF_CSC_BYPASS (0x1<<4)
88 #define OCONF_CC_OUT_8BIT (0x1<<3)
89 #define OCONF_TEST_MODE (0x1<<2)
90 #define OCONF_THREE_LINE_BUFFER (0x1<<0)
91 #define OCONF_TWO_LINE_BUFFER (0x0<<0)
/* DCLRKM (dst-key) register */
/*
 * Bit 31 enables destination colour keying. The constant is unsigned because
 * shifting a signed 1 into the sign bit is undefined behaviour in C; the
 * resulting bit pattern is unchanged.
 */
#define DST_KEY_ENABLE		(0x1u<<31)
#define CLK_RGB24_MASK		0x0
#define CLK_RGB16_MASK		0x070307
#define CLK_RGB15_MASK		0x070707
#define CLK_RGB8I_MASK		0xffffff

/*
 * Spread a packed 16-bit (5:6:5) or 15-bit (5:5:5) pixel value over three
 * bytes: each colour component is moved to the most significant bits of its
 * own byte (red in bits 23..16, green in bits 15..8, blue in bits 7..0).
 *
 * The argument is parenthesised so that an expression such as `a | b` is
 * masked as a whole instead of being torn apart by operator precedence.
 * Note that `c` is evaluated three times; do not pass expressions with side
 * effects.
 */
#define RGB16_TO_COLORKEY(c) \
	((((c) & 0xF800) << 8) | (((c) & 0x07E0) << 5) | (((c) & 0x001F) << 3))
#define RGB15_TO_COLORKEY(c) \
	((((c) & 0x7c00) << 9) | (((c) & 0x03E0) << 6) | (((c) & 0x001F) << 3))
105 /* overlay flip addr flag */
106 #define OFC_UPDATE 0x1
108 /* polyphase filter coefficients */
109 #define N_HORIZ_Y_TAPS 5
110 #define N_VERT_Y_TAPS 3
111 #define N_HORIZ_UV_TAPS 3
112 #define N_VERT_UV_TAPS 3
116 /* memory-buffered overlay registers */
117 struct overlay_registers
{
145 u32 RESERVED1
; /* 0x6C */
158 u32 FASTHSCALE
; /* 0xA0 */
159 u32 UVSCALEV
; /* 0xA4 */
160 u32 RESERVEDC
[(0x200 - 0xA8) / 4]; /* 0xA8 - 0x1FC */
161 u16 Y_VCOEFS
[N_VERT_Y_TAPS
* N_PHASES
]; /* 0x200 */
162 u16 RESERVEDD
[0x100 / 2 - N_VERT_Y_TAPS
* N_PHASES
];
163 u16 Y_HCOEFS
[N_HORIZ_Y_TAPS
* N_PHASES
]; /* 0x300 */
164 u16 RESERVEDE
[0x200 / 2 - N_HORIZ_Y_TAPS
* N_PHASES
];
165 u16 UV_VCOEFS
[N_VERT_UV_TAPS
* N_PHASES
]; /* 0x500 */
166 u16 RESERVEDF
[0x100 / 2 - N_VERT_UV_TAPS
* N_PHASES
];
167 u16 UV_HCOEFS
[N_HORIZ_UV_TAPS
* N_PHASES
]; /* 0x600 */
168 u16 RESERVEDG
[0x100 / 2 - N_HORIZ_UV_TAPS
* N_PHASES
];
171 /* overlay flip addr flag */
172 #define OFC_UPDATE 0x1
174 #define OVERLAY_NONPHYSICAL(dev) (IS_G33(dev) || IS_I965G(dev))
175 #define OVERLAY_EXISTS(dev) (!IS_G4X(dev) && !IS_IRONLAKE(dev) && !IS_GEN6(dev))
178 static struct overlay_registers
*intel_overlay_map_regs_atomic(struct intel_overlay
*overlay
)
180 drm_i915_private_t
*dev_priv
= overlay
->dev
->dev_private
;
181 struct overlay_registers
*regs
;
183 /* no recursive mappings */
184 BUG_ON(overlay
->virt_addr
);
186 if (OVERLAY_NONPHYSICAL(overlay
->dev
)) {
187 regs
= io_mapping_map_atomic_wc(dev_priv
->mm
.gtt_mapping
,
188 overlay
->reg_bo
->gtt_offset
);
191 DRM_ERROR("failed to map overlay regs in GTT\n");
195 regs
= overlay
->reg_bo
->phys_obj
->handle
->vaddr
;
197 return overlay
->virt_addr
= regs
;
200 static void intel_overlay_unmap_regs_atomic(struct intel_overlay
*overlay
)
202 if (OVERLAY_NONPHYSICAL(overlay
->dev
))
203 io_mapping_unmap_atomic(overlay
->virt_addr
);
205 overlay
->virt_addr
= NULL
;
210 /* overlay needs to be disabled in OCMD reg */
211 static int intel_overlay_on(struct intel_overlay
*overlay
)
213 struct drm_device
*dev
= overlay
->dev
;
214 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
218 BUG_ON(overlay
->active
);
221 overlay
->hw_wedged
= NEEDS_WAIT_FOR_FLIP
;
224 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_ON
);
225 OUT_RING(overlay
->flip_addr
| OFC_UPDATE
);
226 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
230 overlay
->last_flip_req
= i915_add_request(dev
, NULL
, 0);
231 if (overlay
->last_flip_req
== 0)
234 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
, 1);
238 overlay
->hw_wedged
= 0;
239 overlay
->last_flip_req
= 0;
243 /* overlay needs to be enabled in OCMD reg */
244 static void intel_overlay_continue(struct intel_overlay
*overlay
,
245 bool load_polyphase_filter
)
247 struct drm_device
*dev
= overlay
->dev
;
248 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
249 u32 flip_addr
= overlay
->flip_addr
;
253 BUG_ON(!overlay
->active
);
255 if (load_polyphase_filter
)
256 flip_addr
|= OFC_UPDATE
;
258 /* check for underruns */
259 tmp
= I915_READ(DOVSTA
);
261 DRM_DEBUG("overlay underrun, DOVSTA: %x\n", tmp
);
264 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_CONTINUE
);
268 overlay
->last_flip_req
= i915_add_request(dev
, NULL
, 0);
271 static int intel_overlay_wait_flip(struct intel_overlay
*overlay
)
273 struct drm_device
*dev
= overlay
->dev
;
274 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
279 if (overlay
->last_flip_req
!= 0) {
280 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
, 1);
282 overlay
->last_flip_req
= 0;
284 tmp
= I915_READ(ISR
);
286 if (!(tmp
& I915_OVERLAY_PLANE_FLIP_PENDING_INTERRUPT
))
291 /* synchronous slowpath */
292 overlay
->hw_wedged
= RELEASE_OLD_VID
;
295 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
299 overlay
->last_flip_req
= i915_add_request(dev
, NULL
, 0);
300 if (overlay
->last_flip_req
== 0)
303 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
, 1);
307 overlay
->hw_wedged
= 0;
308 overlay
->last_flip_req
= 0;
312 /* overlay needs to be disabled in OCMD reg */
313 static int intel_overlay_off(struct intel_overlay
*overlay
)
315 u32 flip_addr
= overlay
->flip_addr
;
316 struct drm_device
*dev
= overlay
->dev
;
317 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
321 BUG_ON(!overlay
->active
);
323 /* According to intel docs the overlay hw may hang (when switching
324 * off) without loading the filter coeffs. It is however unclear whether
325 * this applies to the disabling of the overlay or to the switching off
326 * of the hw. Do it in both cases */
327 flip_addr
|= OFC_UPDATE
;
329 /* wait for overlay to go idle */
330 overlay
->hw_wedged
= SWITCH_OFF_STAGE_1
;
333 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_CONTINUE
);
335 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
339 overlay
->last_flip_req
= i915_add_request(dev
, NULL
, 0);
340 if (overlay
->last_flip_req
== 0)
343 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
, 1);
347 /* turn overlay off */
348 overlay
->hw_wedged
= SWITCH_OFF_STAGE_2
;
351 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_OFF
);
353 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
357 overlay
->last_flip_req
= i915_add_request(dev
, NULL
, 0);
358 if (overlay
->last_flip_req
== 0)
361 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
, 1);
365 overlay
->hw_wedged
= 0;
366 overlay
->last_flip_req
= 0;
370 static void intel_overlay_off_tail(struct intel_overlay
*overlay
)
372 struct drm_gem_object
*obj
;
374 /* never have the overlay hw on without showing a frame */
375 BUG_ON(!overlay
->vid_bo
);
376 obj
= overlay
->vid_bo
->obj
;
378 i915_gem_object_unpin(obj
);
379 drm_gem_object_unreference(obj
);
380 overlay
->vid_bo
= NULL
;
382 overlay
->crtc
->overlay
= NULL
;
383 overlay
->crtc
= NULL
;
387 /* recover from an interruption due to a signal
388 * We have to be careful not to repeat work forever and make forward progress. */
389 int intel_overlay_recover_from_interrupt(struct intel_overlay
*overlay
,
392 struct drm_device
*dev
= overlay
->dev
;
393 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
394 struct drm_gem_object
*obj
;
399 if (overlay
->hw_wedged
== HW_WEDGED
)
402 if (overlay
->last_flip_req
== 0) {
403 overlay
->last_flip_req
= i915_add_request(dev
, NULL
, 0);
404 if (overlay
->last_flip_req
== 0)
408 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
, interruptible
);
412 switch (overlay
->hw_wedged
) {
413 case RELEASE_OLD_VID
:
414 obj
= overlay
->old_vid_bo
->obj
;
415 i915_gem_object_unpin(obj
);
416 drm_gem_object_unreference(obj
);
417 overlay
->old_vid_bo
= NULL
;
419 case SWITCH_OFF_STAGE_1
:
420 flip_addr
= overlay
->flip_addr
;
421 flip_addr
|= OFC_UPDATE
;
423 overlay
->hw_wedged
= SWITCH_OFF_STAGE_2
;
426 OUT_RING(MI_OVERLAY_FLIP
| MI_OVERLAY_OFF
);
428 OUT_RING(MI_WAIT_FOR_EVENT
| MI_WAIT_FOR_OVERLAY_FLIP
);
432 overlay
->last_flip_req
= i915_add_request(dev
, NULL
, 0);
433 if (overlay
->last_flip_req
== 0)
436 ret
= i915_do_wait_request(dev
, overlay
->last_flip_req
,
441 case SWITCH_OFF_STAGE_2
:
442 intel_overlay_off_tail(overlay
);
445 BUG_ON(overlay
->hw_wedged
!= NEEDS_WAIT_FOR_FLIP
);
448 overlay
->hw_wedged
= 0;
449 overlay
->last_flip_req
= 0;
453 /* Wait for pending overlay flip and release old frame.
454 * Needs to be called before the overlay registers are changed
455 * via intel_overlay_(un)map_regs_atomic */
456 static int intel_overlay_release_old_vid(struct intel_overlay
*overlay
)
459 struct drm_gem_object
*obj
;
461 /* only wait if there is actually an old frame to release to
462 * guarantee forward progress */
463 if (!overlay
->old_vid_bo
)
466 ret
= intel_overlay_wait_flip(overlay
);
470 obj
= overlay
->old_vid_bo
->obj
;
471 i915_gem_object_unpin(obj
);
472 drm_gem_object_unreference(obj
);
473 overlay
->old_vid_bo
= NULL
;
478 struct put_image_params
{
495 static int packed_depth_bytes(u32 format
)
497 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
498 case I915_OVERLAY_YUV422
:
500 case I915_OVERLAY_YUV411
:
501 /* return 6; not implemented */
507 static int packed_width_bytes(u32 format
, short width
)
509 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
510 case I915_OVERLAY_YUV422
:
517 static int uv_hsubsampling(u32 format
)
519 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
520 case I915_OVERLAY_YUV422
:
521 case I915_OVERLAY_YUV420
:
523 case I915_OVERLAY_YUV411
:
524 case I915_OVERLAY_YUV410
:
531 static int uv_vsubsampling(u32 format
)
533 switch (format
& I915_OVERLAY_DEPTH_MASK
) {
534 case I915_OVERLAY_YUV420
:
535 case I915_OVERLAY_YUV410
:
537 case I915_OVERLAY_YUV422
:
538 case I915_OVERLAY_YUV411
:
545 static u32
calc_swidthsw(struct drm_device
*dev
, u32 offset
, u32 width
)
547 u32 mask
, shift
, ret
;
555 ret
= ((offset
+ width
+ mask
) >> shift
) - (offset
>> shift
);
562 static const u16 y_static_hcoeffs
[N_HORIZ_Y_TAPS
* N_PHASES
] = {
563 0x3000, 0xb4a0, 0x1930, 0x1920, 0xb4a0,
564 0x3000, 0xb500, 0x19d0, 0x1880, 0xb440,
565 0x3000, 0xb540, 0x1a88, 0x2f80, 0xb3e0,
566 0x3000, 0xb580, 0x1b30, 0x2e20, 0xb380,
567 0x3000, 0xb5c0, 0x1bd8, 0x2cc0, 0xb320,
568 0x3020, 0xb5e0, 0x1c60, 0x2b80, 0xb2c0,
569 0x3020, 0xb5e0, 0x1cf8, 0x2a20, 0xb260,
570 0x3020, 0xb5e0, 0x1d80, 0x28e0, 0xb200,
571 0x3020, 0xb5c0, 0x1e08, 0x3f40, 0xb1c0,
572 0x3020, 0xb580, 0x1e78, 0x3ce0, 0xb160,
573 0x3040, 0xb520, 0x1ed8, 0x3aa0, 0xb120,
574 0x3040, 0xb4a0, 0x1f30, 0x3880, 0xb0e0,
575 0x3040, 0xb400, 0x1f78, 0x3680, 0xb0a0,
576 0x3020, 0xb340, 0x1fb8, 0x34a0, 0xb060,
577 0x3020, 0xb240, 0x1fe0, 0x32e0, 0xb040,
578 0x3020, 0xb140, 0x1ff8, 0x3160, 0xb020,
579 0xb000, 0x3000, 0x0800, 0x3000, 0xb000};
580 static const u16 uv_static_hcoeffs
[N_HORIZ_UV_TAPS
* N_PHASES
] = {
581 0x3000, 0x1800, 0x1800, 0xb000, 0x18d0, 0x2e60,
582 0xb000, 0x1990, 0x2ce0, 0xb020, 0x1a68, 0x2b40,
583 0xb040, 0x1b20, 0x29e0, 0xb060, 0x1bd8, 0x2880,
584 0xb080, 0x1c88, 0x3e60, 0xb0a0, 0x1d28, 0x3c00,
585 0xb0c0, 0x1db8, 0x39e0, 0xb0e0, 0x1e40, 0x37e0,
586 0xb100, 0x1eb8, 0x3620, 0xb100, 0x1f18, 0x34a0,
587 0xb100, 0x1f68, 0x3360, 0xb0e0, 0x1fa8, 0x3240,
588 0xb0c0, 0x1fe0, 0x3140, 0xb060, 0x1ff0, 0x30a0,
589 0x3000, 0x0800, 0x3000};
/*
 * Copy the static horizontal filter coefficient tables into the overlay
 * register block: y_static_hcoeffs goes to regs->Y_HCOEFS and
 * uv_static_hcoeffs goes to regs->UV_HCOEFS. Each copy is sized by its
 * source table.
 */
591 static void update_polyphase_filter(struct overlay_registers
*regs
)
593 memcpy(regs
->Y_HCOEFS
, y_static_hcoeffs
, sizeof(y_static_hcoeffs
));
594 memcpy(regs
->UV_HCOEFS
, uv_static_hcoeffs
, sizeof(uv_static_hcoeffs
));
597 static bool update_scaling_factors(struct intel_overlay
*overlay
,
598 struct overlay_registers
*regs
,
599 struct put_image_params
*params
)
601 /* fixed point with a 12 bit shift */
602 u32 xscale
, yscale
, xscale_UV
, yscale_UV
;
604 #define FRACT_MASK 0xfff
605 bool scale_changed
= false;
606 int uv_hscale
= uv_hsubsampling(params
->format
);
607 int uv_vscale
= uv_vsubsampling(params
->format
);
609 if (params
->dst_w
> 1)
610 xscale
= ((params
->src_scan_w
- 1) << FP_SHIFT
)
613 xscale
= 1 << FP_SHIFT
;
615 if (params
->dst_h
> 1)
616 yscale
= ((params
->src_scan_h
- 1) << FP_SHIFT
)
619 yscale
= 1 << FP_SHIFT
;
621 /*if (params->format & I915_OVERLAY_YUV_PLANAR) {*/
622 xscale_UV
= xscale
/uv_hscale
;
623 yscale_UV
= yscale
/uv_vscale
;
624 /* make the Y scale to UV scale ratio an exact multiply */
625 xscale
= xscale_UV
* uv_hscale
;
626 yscale
= yscale_UV
* uv_vscale
;
632 if (xscale
!= overlay
->old_xscale
|| yscale
!= overlay
->old_yscale
)
633 scale_changed
= true;
634 overlay
->old_xscale
= xscale
;
635 overlay
->old_yscale
= yscale
;
637 regs
->YRGBSCALE
= ((yscale
& FRACT_MASK
) << 20)
638 | ((xscale
>> FP_SHIFT
) << 16)
639 | ((xscale
& FRACT_MASK
) << 3);
640 regs
->UVSCALE
= ((yscale_UV
& FRACT_MASK
) << 20)
641 | ((xscale_UV
>> FP_SHIFT
) << 16)
642 | ((xscale_UV
& FRACT_MASK
) << 3);
643 regs
->UVSCALEV
= ((yscale
>> FP_SHIFT
) << 16)
644 | ((yscale_UV
>> FP_SHIFT
) << 0);
647 update_polyphase_filter(regs
);
649 return scale_changed
;
652 static void update_colorkey(struct intel_overlay
*overlay
,
653 struct overlay_registers
*regs
)
655 u32 key
= overlay
->color_key
;
656 switch (overlay
->crtc
->base
.fb
->bits_per_pixel
) {
659 regs
->DCLRKM
= CLK_RGB8I_MASK
| DST_KEY_ENABLE
;
661 if (overlay
->crtc
->base
.fb
->depth
== 15) {
662 regs
->DCLRKV
= RGB15_TO_COLORKEY(key
);
663 regs
->DCLRKM
= CLK_RGB15_MASK
| DST_KEY_ENABLE
;
665 regs
->DCLRKV
= RGB16_TO_COLORKEY(key
);
666 regs
->DCLRKM
= CLK_RGB16_MASK
| DST_KEY_ENABLE
;
671 regs
->DCLRKM
= CLK_RGB24_MASK
| DST_KEY_ENABLE
;
675 static u32
overlay_cmd_reg(struct put_image_params
*params
)
677 u32 cmd
= OCMD_ENABLE
| OCMD_BUF_TYPE_FRAME
| OCMD_BUFFER0
;
679 if (params
->format
& I915_OVERLAY_YUV_PLANAR
) {
680 switch (params
->format
& I915_OVERLAY_DEPTH_MASK
) {
681 case I915_OVERLAY_YUV422
:
682 cmd
|= OCMD_YUV_422_PLANAR
;
684 case I915_OVERLAY_YUV420
:
685 cmd
|= OCMD_YUV_420_PLANAR
;
687 case I915_OVERLAY_YUV411
:
688 case I915_OVERLAY_YUV410
:
689 cmd
|= OCMD_YUV_410_PLANAR
;
692 } else { /* YUV packed */
693 switch (params
->format
& I915_OVERLAY_DEPTH_MASK
) {
694 case I915_OVERLAY_YUV422
:
695 cmd
|= OCMD_YUV_422_PACKED
;
697 case I915_OVERLAY_YUV411
:
698 cmd
|= OCMD_YUV_411_PACKED
;
702 switch (params
->format
& I915_OVERLAY_SWAP_MASK
) {
703 case I915_OVERLAY_NO_SWAP
:
705 case I915_OVERLAY_UV_SWAP
:
708 case I915_OVERLAY_Y_SWAP
:
711 case I915_OVERLAY_Y_AND_UV_SWAP
:
712 cmd
|= OCMD_Y_AND_UV_SWAP
;
720 int intel_overlay_do_put_image(struct intel_overlay
*overlay
,
721 struct drm_gem_object
*new_bo
,
722 struct put_image_params
*params
)
725 struct overlay_registers
*regs
;
726 bool scale_changed
= false;
727 struct drm_i915_gem_object
*bo_priv
= new_bo
->driver_private
;
728 struct drm_device
*dev
= overlay
->dev
;
730 BUG_ON(!mutex_is_locked(&dev
->struct_mutex
));
731 BUG_ON(!mutex_is_locked(&dev
->mode_config
.mutex
));
734 ret
= intel_overlay_release_old_vid(overlay
);
738 ret
= i915_gem_object_pin(new_bo
, PAGE_SIZE
);
742 ret
= i915_gem_object_set_to_gtt_domain(new_bo
, 0);
746 if (!overlay
->active
) {
747 regs
= intel_overlay_map_regs_atomic(overlay
);
752 regs
->OCONFIG
= OCONF_CC_OUT_8BIT
;
753 if (IS_I965GM(overlay
->dev
))
754 regs
->OCONFIG
|= OCONF_CSC_MODE_BT709
;
755 regs
->OCONFIG
|= overlay
->crtc
->pipe
== 0 ?
756 OCONF_PIPE_A
: OCONF_PIPE_B
;
757 intel_overlay_unmap_regs_atomic(overlay
);
759 ret
= intel_overlay_on(overlay
);
764 regs
= intel_overlay_map_regs_atomic(overlay
);
770 regs
->DWINPOS
= (params
->dst_y
<< 16) | params
->dst_x
;
771 regs
->DWINSZ
= (params
->dst_h
<< 16) | params
->dst_w
;
773 if (params
->format
& I915_OVERLAY_YUV_PACKED
)
774 tmp_width
= packed_width_bytes(params
->format
, params
->src_w
);
776 tmp_width
= params
->src_w
;
778 regs
->SWIDTH
= params
->src_w
;
779 regs
->SWIDTHSW
= calc_swidthsw(overlay
->dev
,
780 params
->offset_Y
, tmp_width
);
781 regs
->SHEIGHT
= params
->src_h
;
782 regs
->OBUF_0Y
= bo_priv
->gtt_offset
+ params
-> offset_Y
;
783 regs
->OSTRIDE
= params
->stride_Y
;
785 if (params
->format
& I915_OVERLAY_YUV_PLANAR
) {
786 int uv_hscale
= uv_hsubsampling(params
->format
);
787 int uv_vscale
= uv_vsubsampling(params
->format
);
789 regs
->SWIDTH
|= (params
->src_w
/uv_hscale
) << 16;
790 tmp_U
= calc_swidthsw(overlay
->dev
, params
->offset_U
,
791 params
->src_w
/uv_hscale
);
792 tmp_V
= calc_swidthsw(overlay
->dev
, params
->offset_V
,
793 params
->src_w
/uv_hscale
);
794 regs
->SWIDTHSW
|= max_t(u32
, tmp_U
, tmp_V
) << 16;
795 regs
->SHEIGHT
|= (params
->src_h
/uv_vscale
) << 16;
796 regs
->OBUF_0U
= bo_priv
->gtt_offset
+ params
->offset_U
;
797 regs
->OBUF_0V
= bo_priv
->gtt_offset
+ params
->offset_V
;
798 regs
->OSTRIDE
|= params
->stride_UV
<< 16;
801 scale_changed
= update_scaling_factors(overlay
, regs
, params
);
803 update_colorkey(overlay
, regs
);
805 regs
->OCMD
= overlay_cmd_reg(params
);
807 intel_overlay_unmap_regs_atomic(overlay
);
809 intel_overlay_continue(overlay
, scale_changed
);
811 overlay
->old_vid_bo
= overlay
->vid_bo
;
812 overlay
->vid_bo
= new_bo
->driver_private
;
817 i915_gem_object_unpin(new_bo
);
821 int intel_overlay_switch_off(struct intel_overlay
*overlay
)
824 struct overlay_registers
*regs
;
825 struct drm_device
*dev
= overlay
->dev
;
827 BUG_ON(!mutex_is_locked(&dev
->struct_mutex
));
828 BUG_ON(!mutex_is_locked(&dev
->mode_config
.mutex
));
830 if (overlay
->hw_wedged
) {
831 ret
= intel_overlay_recover_from_interrupt(overlay
, 1);
836 if (!overlay
->active
)
839 ret
= intel_overlay_release_old_vid(overlay
);
843 regs
= intel_overlay_map_regs_atomic(overlay
);
845 intel_overlay_unmap_regs_atomic(overlay
);
847 ret
= intel_overlay_off(overlay
);
851 intel_overlay_off_tail(overlay
);
856 static int check_overlay_possible_on_crtc(struct intel_overlay
*overlay
,
857 struct intel_crtc
*crtc
)
859 drm_i915_private_t
*dev_priv
= overlay
->dev
->dev_private
;
861 int pipeconf_reg
= (crtc
->pipe
== 0) ? PIPEACONF
: PIPEBCONF
;
863 if (!crtc
->base
.enabled
|| crtc
->dpms_mode
!= DRM_MODE_DPMS_ON
)
866 pipeconf
= I915_READ(pipeconf_reg
);
868 /* can't use the overlay with double wide pipe */
869 if (!IS_I965G(overlay
->dev
) && pipeconf
& PIPEACONF_DOUBLE_WIDE
)
875 static void update_pfit_vscale_ratio(struct intel_overlay
*overlay
)
877 struct drm_device
*dev
= overlay
->dev
;
878 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
880 u32 pfit_control
= I915_READ(PFIT_CONTROL
);
882 /* XXX: This is not the same logic as in the xorg driver, but more in
883 * line with the intel documentation for the i965 */
884 if (!IS_I965G(dev
) && (pfit_control
& VERT_AUTO_SCALE
)) {
885 ratio
= I915_READ(PFIT_AUTO_RATIOS
) >> PFIT_VERT_SCALE_SHIFT
;
886 } else { /* on i965 use the PGM reg to read out the autoscaler values */
887 ratio
= I915_READ(PFIT_PGM_RATIOS
);
889 ratio
>>= PFIT_VERT_SCALE_SHIFT_965
;
891 ratio
>>= PFIT_VERT_SCALE_SHIFT
;
894 overlay
->pfit_vscale_ratio
= ratio
;
897 static int check_overlay_dst(struct intel_overlay
*overlay
,
898 struct drm_intel_overlay_put_image
*rec
)
900 struct drm_display_mode
*mode
= &overlay
->crtc
->base
.mode
;
902 if ((rec
->dst_x
< mode
->crtc_hdisplay
)
903 && (rec
->dst_x
+ rec
->dst_width
904 <= mode
->crtc_hdisplay
)
905 && (rec
->dst_y
< mode
->crtc_vdisplay
)
906 && (rec
->dst_y
+ rec
->dst_height
907 <= mode
->crtc_vdisplay
))
913 static int check_overlay_scaling(struct put_image_params
*rec
)
917 /* downscaling limit is 8.0 */
918 tmp
= ((rec
->src_scan_h
<< 16) / rec
->dst_h
) >> 16;
921 tmp
= ((rec
->src_scan_w
<< 16) / rec
->dst_w
) >> 16;
928 static int check_overlay_src(struct drm_device
*dev
,
929 struct drm_intel_overlay_put_image
*rec
,
930 struct drm_gem_object
*new_bo
)
934 int uv_hscale
= uv_hsubsampling(rec
->flags
);
935 int uv_vscale
= uv_vsubsampling(rec
->flags
);
938 /* check src dimensions */
939 if (IS_845G(dev
) || IS_I830(dev
)) {
940 if (rec
->src_height
> IMAGE_MAX_HEIGHT_LEGACY
941 || rec
->src_width
> IMAGE_MAX_WIDTH_LEGACY
)
944 if (rec
->src_height
> IMAGE_MAX_HEIGHT
945 || rec
->src_width
> IMAGE_MAX_WIDTH
)
948 /* better safe than sorry, use 4 as the maximal subsampling ratio */
949 if (rec
->src_height
< N_VERT_Y_TAPS
*4
950 || rec
->src_width
< N_HORIZ_Y_TAPS
*4)
953 /* check alignment constraints */
954 switch (rec
->flags
& I915_OVERLAY_TYPE_MASK
) {
955 case I915_OVERLAY_RGB
:
956 /* not implemented */
958 case I915_OVERLAY_YUV_PACKED
:
959 depth
= packed_depth_bytes(rec
->flags
);
964 /* ignore UV planes */
968 /* check pixel alignment */
969 if (rec
->offset_Y
% depth
)
972 case I915_OVERLAY_YUV_PLANAR
:
973 if (uv_vscale
< 0 || uv_hscale
< 0)
975 /* no offset restrictions for planar formats */
981 if (rec
->src_width
% uv_hscale
)
984 /* stride checking */
987 if (rec
->stride_Y
& stride_mask
|| rec
->stride_UV
& stride_mask
)
989 if (IS_I965G(dev
) && rec
->stride_Y
< 512)
992 tmp
= (rec
->flags
& I915_OVERLAY_TYPE_MASK
) == I915_OVERLAY_YUV_PLANAR
?
994 if (rec
->stride_Y
> tmp
*1024 || rec
->stride_UV
> 2*1024)
997 /* check buffer dimensions */
998 switch (rec
->flags
& I915_OVERLAY_TYPE_MASK
) {
999 case I915_OVERLAY_RGB
:
1000 case I915_OVERLAY_YUV_PACKED
:
1001 /* always 4 Y values per depth pixels */
1002 if (packed_width_bytes(rec
->flags
, rec
->src_width
)
1006 tmp
= rec
->stride_Y
*rec
->src_height
;
1007 if (rec
->offset_Y
+ tmp
> new_bo
->size
)
1010 case I915_OVERLAY_YUV_PLANAR
:
1011 if (rec
->src_width
> rec
->stride_Y
)
1013 if (rec
->src_width
/uv_hscale
> rec
->stride_UV
)
1016 tmp
= rec
->stride_Y
*rec
->src_height
;
1017 if (rec
->offset_Y
+ tmp
> new_bo
->size
)
1019 tmp
= rec
->stride_UV
*rec
->src_height
;
1021 if (rec
->offset_U
+ tmp
> new_bo
->size
1022 || rec
->offset_V
+ tmp
> new_bo
->size
)
1030 int intel_overlay_put_image(struct drm_device
*dev
, void *data
,
1031 struct drm_file
*file_priv
)
1033 struct drm_intel_overlay_put_image
*put_image_rec
= data
;
1034 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1035 struct intel_overlay
*overlay
;
1036 struct drm_mode_object
*drmmode_obj
;
1037 struct intel_crtc
*crtc
;
1038 struct drm_gem_object
*new_bo
;
1039 struct put_image_params
*params
;
1043 DRM_ERROR("called with no initialization\n");
1047 overlay
= dev_priv
->overlay
;
1049 DRM_DEBUG("userspace bug: no overlay\n");
1053 if (!(put_image_rec
->flags
& I915_OVERLAY_ENABLE
)) {
1054 mutex_lock(&dev
->mode_config
.mutex
);
1055 mutex_lock(&dev
->struct_mutex
);
1057 ret
= intel_overlay_switch_off(overlay
);
1059 mutex_unlock(&dev
->struct_mutex
);
1060 mutex_unlock(&dev
->mode_config
.mutex
);
1065 params
= kmalloc(sizeof(struct put_image_params
), GFP_KERNEL
);
1069 drmmode_obj
= drm_mode_object_find(dev
, put_image_rec
->crtc_id
,
1070 DRM_MODE_OBJECT_CRTC
);
1073 crtc
= to_intel_crtc(obj_to_crtc(drmmode_obj
));
1075 new_bo
= drm_gem_object_lookup(dev
, file_priv
,
1076 put_image_rec
->bo_handle
);
1080 mutex_lock(&dev
->mode_config
.mutex
);
1081 mutex_lock(&dev
->struct_mutex
);
1083 if (overlay
->hw_wedged
) {
1084 ret
= intel_overlay_recover_from_interrupt(overlay
, 1);
1089 if (overlay
->crtc
!= crtc
) {
1090 struct drm_display_mode
*mode
= &crtc
->base
.mode
;
1091 ret
= intel_overlay_switch_off(overlay
);
1095 ret
= check_overlay_possible_on_crtc(overlay
, crtc
);
1099 overlay
->crtc
= crtc
;
1100 crtc
->overlay
= overlay
;
1102 if (intel_panel_fitter_pipe(dev
) == crtc
->pipe
1103 /* and line too wide, i.e. one-line-mode */
1104 && mode
->hdisplay
> 1024) {
1105 overlay
->pfit_active
= 1;
1106 update_pfit_vscale_ratio(overlay
);
1108 overlay
->pfit_active
= 0;
1111 ret
= check_overlay_dst(overlay
, put_image_rec
);
1115 if (overlay
->pfit_active
) {
1116 params
->dst_y
= ((((u32
)put_image_rec
->dst_y
) << 12) /
1117 overlay
->pfit_vscale_ratio
);
1118 /* shifting right rounds downwards, so add 1 */
1119 params
->dst_h
= ((((u32
)put_image_rec
->dst_height
) << 12) /
1120 overlay
->pfit_vscale_ratio
) + 1;
1122 params
->dst_y
= put_image_rec
->dst_y
;
1123 params
->dst_h
= put_image_rec
->dst_height
;
1125 params
->dst_x
= put_image_rec
->dst_x
;
1126 params
->dst_w
= put_image_rec
->dst_width
;
1128 params
->src_w
= put_image_rec
->src_width
;
1129 params
->src_h
= put_image_rec
->src_height
;
1130 params
->src_scan_w
= put_image_rec
->src_scan_width
;
1131 params
->src_scan_h
= put_image_rec
->src_scan_height
;
1132 if (params
->src_scan_h
> params
->src_h
1133 || params
->src_scan_w
> params
->src_w
) {
1138 ret
= check_overlay_src(dev
, put_image_rec
, new_bo
);
1141 params
->format
= put_image_rec
->flags
& ~I915_OVERLAY_FLAGS_MASK
;
1142 params
->stride_Y
= put_image_rec
->stride_Y
;
1143 params
->stride_UV
= put_image_rec
->stride_UV
;
1144 params
->offset_Y
= put_image_rec
->offset_Y
;
1145 params
->offset_U
= put_image_rec
->offset_U
;
1146 params
->offset_V
= put_image_rec
->offset_V
;
1148 /* Check scaling after src size to prevent a divide-by-zero. */
1149 ret
= check_overlay_scaling(params
);
1153 ret
= intel_overlay_do_put_image(overlay
, new_bo
, params
);
1157 mutex_unlock(&dev
->struct_mutex
);
1158 mutex_unlock(&dev
->mode_config
.mutex
);
1165 mutex_unlock(&dev
->struct_mutex
);
1166 mutex_unlock(&dev
->mode_config
.mutex
);
1167 drm_gem_object_unreference_unlocked(new_bo
);
/*
 * Write the overlay's cached colour attributes into the register block:
 * OCLRC0 receives the contrast value shifted left by 18 bits OR'ed with the
 * low 8 bits of the brightness value; OCLRC1 receives the saturation value.
 */
1173 static void update_reg_attrs(struct intel_overlay
*overlay
,
1174 struct overlay_registers
*regs
)
1176 regs
->OCLRC0
= (overlay
->contrast
<< 18) | (overlay
->brightness
& 0xff);
1177 regs
->OCLRC1
= overlay
->saturation
;
1180 static bool check_gamma_bounds(u32 gamma1
, u32 gamma2
)
1184 if (gamma1
& 0xff000000 || gamma2
& 0xff000000)
1187 for (i
= 0; i
< 3; i
++) {
1188 if (((gamma1
>> i
* 8) & 0xff) >= ((gamma2
>> i
*8) & 0xff))
1195 static bool check_gamma5_errata(u32 gamma5
)
1199 for (i
= 0; i
< 3; i
++) {
1200 if (((gamma5
>> i
*8) & 0xff) == 0x80)
1207 static int check_gamma(struct drm_intel_overlay_attrs
*attrs
)
1209 if (!check_gamma_bounds(0, attrs
->gamma0
)
1210 || !check_gamma_bounds(attrs
->gamma0
, attrs
->gamma1
)
1211 || !check_gamma_bounds(attrs
->gamma1
, attrs
->gamma2
)
1212 || !check_gamma_bounds(attrs
->gamma2
, attrs
->gamma3
)
1213 || !check_gamma_bounds(attrs
->gamma3
, attrs
->gamma4
)
1214 || !check_gamma_bounds(attrs
->gamma4
, attrs
->gamma5
)
1215 || !check_gamma_bounds(attrs
->gamma5
, 0x00ffffff))
1217 if (!check_gamma5_errata(attrs
->gamma5
))
1222 int intel_overlay_attrs(struct drm_device
*dev
, void *data
,
1223 struct drm_file
*file_priv
)
1225 struct drm_intel_overlay_attrs
*attrs
= data
;
1226 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1227 struct intel_overlay
*overlay
;
1228 struct overlay_registers
*regs
;
1232 DRM_ERROR("called with no initialization\n");
1236 overlay
= dev_priv
->overlay
;
1238 DRM_DEBUG("userspace bug: no overlay\n");
1242 mutex_lock(&dev
->mode_config
.mutex
);
1243 mutex_lock(&dev
->struct_mutex
);
1245 if (!(attrs
->flags
& I915_OVERLAY_UPDATE_ATTRS
)) {
1246 attrs
->color_key
= overlay
->color_key
;
1247 attrs
->brightness
= overlay
->brightness
;
1248 attrs
->contrast
= overlay
->contrast
;
1249 attrs
->saturation
= overlay
->saturation
;
1252 attrs
->gamma0
= I915_READ(OGAMC0
);
1253 attrs
->gamma1
= I915_READ(OGAMC1
);
1254 attrs
->gamma2
= I915_READ(OGAMC2
);
1255 attrs
->gamma3
= I915_READ(OGAMC3
);
1256 attrs
->gamma4
= I915_READ(OGAMC4
);
1257 attrs
->gamma5
= I915_READ(OGAMC5
);
1261 overlay
->color_key
= attrs
->color_key
;
1262 if (attrs
->brightness
>= -128 && attrs
->brightness
<= 127) {
1263 overlay
->brightness
= attrs
->brightness
;
1268 if (attrs
->contrast
<= 255) {
1269 overlay
->contrast
= attrs
->contrast
;
1274 if (attrs
->saturation
<= 1023) {
1275 overlay
->saturation
= attrs
->saturation
;
1281 regs
= intel_overlay_map_regs_atomic(overlay
);
1287 update_reg_attrs(overlay
, regs
);
1289 intel_overlay_unmap_regs_atomic(overlay
);
1291 if (attrs
->flags
& I915_OVERLAY_UPDATE_GAMMA
) {
1292 if (!IS_I9XX(dev
)) {
1297 if (overlay
->active
) {
1302 ret
= check_gamma(attrs
);
1306 I915_WRITE(OGAMC0
, attrs
->gamma0
);
1307 I915_WRITE(OGAMC1
, attrs
->gamma1
);
1308 I915_WRITE(OGAMC2
, attrs
->gamma2
);
1309 I915_WRITE(OGAMC3
, attrs
->gamma3
);
1310 I915_WRITE(OGAMC4
, attrs
->gamma4
);
1311 I915_WRITE(OGAMC5
, attrs
->gamma5
);
1317 mutex_unlock(&dev
->struct_mutex
);
1318 mutex_unlock(&dev
->mode_config
.mutex
);
1323 void intel_setup_overlay(struct drm_device
*dev
)
1325 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1326 struct intel_overlay
*overlay
;
1327 struct drm_gem_object
*reg_bo
;
1328 struct overlay_registers
*regs
;
1331 if (!OVERLAY_EXISTS(dev
))
1334 overlay
= kzalloc(sizeof(struct intel_overlay
), GFP_KERNEL
);
1339 reg_bo
= drm_gem_object_alloc(dev
, PAGE_SIZE
);
1342 overlay
->reg_bo
= reg_bo
->driver_private
;
1344 if (OVERLAY_NONPHYSICAL(dev
)) {
1345 ret
= i915_gem_object_pin(reg_bo
, PAGE_SIZE
);
1347 DRM_ERROR("failed to pin overlay register bo\n");
1350 overlay
->flip_addr
= overlay
->reg_bo
->gtt_offset
;
1352 ret
= i915_gem_attach_phys_object(dev
, reg_bo
,
1353 I915_GEM_PHYS_OVERLAY_REGS
);
1355 DRM_ERROR("failed to attach phys overlay regs\n");
1358 overlay
->flip_addr
= overlay
->reg_bo
->phys_obj
->handle
->busaddr
;
1361 /* init all values */
1362 overlay
->color_key
= 0x0101fe;
1363 overlay
->brightness
= -19;
1364 overlay
->contrast
= 75;
1365 overlay
->saturation
= 146;
1367 regs
= intel_overlay_map_regs_atomic(overlay
);
1371 memset(regs
, 0, sizeof(struct overlay_registers
));
1372 update_polyphase_filter(regs
);
1374 update_reg_attrs(overlay
, regs
);
1376 intel_overlay_unmap_regs_atomic(overlay
);
1378 dev_priv
->overlay
= overlay
;
1379 DRM_INFO("initialized overlay support\n");
1383 drm_gem_object_unreference(reg_bo
);
1389 void intel_cleanup_overlay(struct drm_device
*dev
)
1391 drm_i915_private_t
*dev_priv
= dev
->dev_private
;
1393 if (dev_priv
->overlay
) {
1394 /* The bo's should be free'd by the generic code already.
1395 * Furthermore modesetting teardown happens beforehand so the
1396 * hardware should be off already */
1397 BUG_ON(dev_priv
->overlay
->active
);
1399 kfree(dev_priv
->overlay
);