4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Daniel Vetter <daniel@ffwll.ch>
26 * Derived from Xorg ddx, xf86-video-intel, src/i830_video.c
33 #include "intel_drv.h"
35 /* Limits for overlay size. According to intel doc, the real limits are:
36 * Y width: 4095, UV width (planar): 2047, Y height: 2047,
37 * UV width (planar): * 1023. But the xorg thinks 2048 for height and width. Use
38 * the mininum of both. */
39 #define IMAGE_MAX_WIDTH 2048
40 #define IMAGE_MAX_HEIGHT 2046 /* 2 * 1023 */
41 /* on 830 and 845 these large limits result in the card hanging */
42 #define IMAGE_MAX_WIDTH_LEGACY 1024
43 #define IMAGE_MAX_HEIGHT_LEGACY 1088
45 /* overlay register definitions */
47 #define OCMD_TILED_SURFACE (0x1<<19)
48 #define OCMD_MIRROR_MASK (0x3<<17)
49 #define OCMD_MIRROR_MODE (0x3<<17)
50 #define OCMD_MIRROR_HORIZONTAL (0x1<<17)
51 #define OCMD_MIRROR_VERTICAL (0x2<<17)
52 #define OCMD_MIRROR_BOTH (0x3<<17)
53 #define OCMD_BYTEORDER_MASK (0x3<<14) /* zero for YUYV or FOURCC YUY2 */
54 #define OCMD_UV_SWAP (0x1<<14) /* YVYU */
55 #define OCMD_Y_SWAP (0x2<<14) /* UYVY or FOURCC UYVY */
56 #define OCMD_Y_AND_UV_SWAP (0x3<<14) /* VYUY */
57 #define OCMD_SOURCE_FORMAT_MASK (0xf<<10)
58 #define OCMD_RGB_888 (0x1<<10) /* not in i965 Intel docs */
59 #define OCMD_RGB_555 (0x2<<10) /* not in i965 Intel docs */
60 #define OCMD_RGB_565 (0x3<<10) /* not in i965 Intel docs */
61 #define OCMD_YUV_422_PACKED (0x8<<10)
62 #define OCMD_YUV_411_PACKED (0x9<<10) /* not in i965 Intel docs */
63 #define OCMD_YUV_420_PLANAR (0xc<<10)
64 #define OCMD_YUV_422_PLANAR (0xd<<10)
65 #define OCMD_YUV_410_PLANAR (0xe<<10) /* also 411 */
66 #define OCMD_TVSYNCFLIP_PARITY (0x1<<9)
67 #define OCMD_TVSYNCFLIP_ENABLE (0x1<<7)
68 #define OCMD_BUF_TYPE_MASK (0x1<<5)
69 #define OCMD_BUF_TYPE_FRAME (0x0<<5)
70 #define OCMD_BUF_TYPE_FIELD (0x1<<5)
71 #define OCMD_TEST_MODE (0x1<<4)
72 #define OCMD_BUFFER_SELECT (0x3<<2)
73 #define OCMD_BUFFER0 (0x0<<2)
74 #define OCMD_BUFFER1 (0x1<<2)
75 #define OCMD_FIELD_SELECT (0x1<<2)
76 #define OCMD_FIELD0 (0x0<<1)
77 #define OCMD_FIELD1 (0x1<<1)
78 #define OCMD_ENABLE (0x1<<0)
80 /* OCONFIG register */
81 #define OCONF_PIPE_MASK (0x1<<18)
82 #define OCONF_PIPE_A (0x0<<18)
83 #define OCONF_PIPE_B (0x1<<18)
84 #define OCONF_GAMMA2_ENABLE (0x1<<16)
85 #define OCONF_CSC_MODE_BT601 (0x0<<5)
86 #define OCONF_CSC_MODE_BT709 (0x1<<5)
87 #define OCONF_CSC_BYPASS (0x1<<4)
88 #define OCONF_CC_OUT_8BIT (0x1<<3)
89 #define OCONF_TEST_MODE (0x1<<2)
90 #define OCONF_THREE_LINE_BUFFER (0x1<<0)
91 #define OCONF_TWO_LINE_BUFFER (0x0<<0)
93 /* DCLRKM (dst-key) register */
94 #define DST_KEY_ENABLE (0x1<<31)
95 #define CLK_RGB24_MASK 0x0
96 #define CLK_RGB16_MASK 0x070307
97 #define CLK_RGB15_MASK 0x070707
98 #define CLK_RGB8I_MASK 0xffffff
100 #define RGB16_TO_COLORKEY(c) \
101 (((c & 0xF800) << 8) | ((c & 0x07E0) << 5) | ((c & 0x001F) << 3))
102 #define RGB15_TO_COLORKEY(c) \
103 (((c & 0x7c00) << 9) | ((c & 0x03E0) << 6) | ((c & 0x001F) << 3))
105 /* overlay flip addr flag */
106 #define OFC_UPDATE 0x1
108 /* polyphase filter coefficients */
109 #define N_HORIZ_Y_TAPS 5
110 #define N_VERT_Y_TAPS 3
111 #define N_HORIZ_UV_TAPS 3
112 #define N_VERT_UV_TAPS 3
116 /* memory bufferd overlay registers */
117 struct overlay_registers {
145 u32 RESERVED1; /* 0x6C */
158 u32 FASTHSCALE; /* 0xA0 */
159 u32 UVSCALEV; /* 0xA4 */
160 u32 RESERVEDC[(0x200 - 0xA8) / 4]; /* 0xA8 - 0x1FC */
161 u16 Y_VCOEFS[N_VERT_Y_TAPS * N_PHASES]; /* 0x200 */
162 u16 RESERVEDD[0x100 / 2 - N_VERT_Y_TAPS * N_PHASES];
163 u16 Y_HCOEFS[N_HORIZ_Y_TAPS * N_PHASES]; /* 0x300 */
164 u16 RESERVEDE[0x200 / 2 - N_HORIZ_Y_TAPS * N_PHASES];
165 u16 UV_VCOEFS[N_VERT_UV_TAPS * N_PHASES]; /* 0x500 */
166 u16 RESERVEDF[0x100 / 2 - N_VERT_UV_TAPS * N_PHASES];
167 u16 UV_HCOEFS[N_HORIZ_UV_TAPS * N_PHASES]; /* 0x600 */
168 u16 RESERVEDG[0x100 / 2 - N_HORIZ_UV_TAPS * N_PHASES];
171 struct intel_overlay {
172 struct drm_device *dev;
173 struct intel_crtc *crtc;
174 struct drm_i915_gem_object *vid_bo;
175 struct drm_i915_gem_object *old_vid_bo;
178 u32 pfit_vscale_ratio; /* shifted-point number, (1<<12) == 1.0 */
180 u32 brightness, contrast, saturation;
181 u32 old_xscale, old_yscale;
182 /* register access */
184 struct drm_i915_gem_object *reg_bo;
186 uint32_t last_flip_req;
187 void (*flip_tail)(struct intel_overlay *);
190 static struct overlay_registers __iomem *
191 intel_overlay_map_regs(struct intel_overlay *overlay)
193 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
194 struct overlay_registers __iomem *regs;
196 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
197 regs = (struct overlay_registers __iomem *)overlay->reg_bo->phys_obj->handle->vaddr;
199 regs = io_mapping_map_wc(dev_priv->mm.gtt_mapping,
200 overlay->reg_bo->gtt_offset);
205 static void intel_overlay_unmap_regs(struct intel_overlay *overlay,
206 struct overlay_registers __iomem *regs)
208 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
209 io_mapping_unmap(regs);
212 static int intel_overlay_do_wait_request(struct intel_overlay *overlay,
213 struct drm_i915_gem_request *request,
214 void (*tail)(struct intel_overlay *))
216 struct drm_device *dev = overlay->dev;
217 drm_i915_private_t *dev_priv = dev->dev_private;
218 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
221 BUG_ON(overlay->last_flip_req);
222 ret = i915_add_request(ring, NULL, request);
227 overlay->last_flip_req = request->seqno;
228 overlay->flip_tail = tail;
229 ret = i915_wait_seqno(ring, overlay->last_flip_req);
232 i915_gem_retire_requests(dev);
234 overlay->last_flip_req = 0;
238 /* overlay needs to be disable in OCMD reg */
239 static int intel_overlay_on(struct intel_overlay *overlay)
241 struct drm_device *dev = overlay->dev;
242 struct drm_i915_private *dev_priv = dev->dev_private;
243 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
244 struct drm_i915_gem_request *request;
247 BUG_ON(overlay->active);
250 WARN_ON(IS_I830(dev) && !(dev_priv->quirks & QUIRK_PIPEA_FORCE));
252 request = kzalloc(sizeof(*request), GFP_KERNEL);
253 if (request == NULL) {
258 ret = intel_ring_begin(ring, 4);
264 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_ON);
265 intel_ring_emit(ring, overlay->flip_addr | OFC_UPDATE);
266 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
267 intel_ring_emit(ring, MI_NOOP);
268 intel_ring_advance(ring);
270 ret = intel_overlay_do_wait_request(overlay, request, NULL);
275 /* overlay needs to be enabled in OCMD reg */
276 static int intel_overlay_continue(struct intel_overlay *overlay,
277 bool load_polyphase_filter)
279 struct drm_device *dev = overlay->dev;
280 drm_i915_private_t *dev_priv = dev->dev_private;
281 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
282 struct drm_i915_gem_request *request;
283 u32 flip_addr = overlay->flip_addr;
287 BUG_ON(!overlay->active);
289 request = kzalloc(sizeof(*request), GFP_KERNEL);
293 if (load_polyphase_filter)
294 flip_addr |= OFC_UPDATE;
296 /* check for underruns */
297 tmp = I915_READ(DOVSTA);
299 DRM_DEBUG("overlay underrun, DOVSTA: %x\n", tmp);
301 ret = intel_ring_begin(ring, 2);
306 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
307 intel_ring_emit(ring, flip_addr);
308 intel_ring_advance(ring);
310 ret = i915_add_request(ring, NULL, request);
316 overlay->last_flip_req = request->seqno;
320 static void intel_overlay_release_old_vid_tail(struct intel_overlay *overlay)
322 struct drm_i915_gem_object *obj = overlay->old_vid_bo;
324 i915_gem_object_unpin(obj);
325 drm_gem_object_unreference(&obj->base);
327 overlay->old_vid_bo = NULL;
330 static void intel_overlay_off_tail(struct intel_overlay *overlay)
332 struct drm_i915_gem_object *obj = overlay->vid_bo;
334 /* never have the overlay hw on without showing a frame */
335 BUG_ON(!overlay->vid_bo);
337 i915_gem_object_unpin(obj);
338 drm_gem_object_unreference(&obj->base);
339 overlay->vid_bo = NULL;
341 overlay->crtc->overlay = NULL;
342 overlay->crtc = NULL;
346 /* overlay needs to be disabled in OCMD reg */
347 static int intel_overlay_off(struct intel_overlay *overlay)
349 struct drm_device *dev = overlay->dev;
350 struct drm_i915_private *dev_priv = dev->dev_private;
351 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
352 u32 flip_addr = overlay->flip_addr;
353 struct drm_i915_gem_request *request;
356 BUG_ON(!overlay->active);
358 request = kzalloc(sizeof(*request), GFP_KERNEL);
362 /* According to intel docs the overlay hw may hang (when switching
363 * off) without loading the filter coeffs. It is however unclear whether
364 * this applies to the disabling of the overlay or to the switching off
365 * of the hw. Do it in both cases */
366 flip_addr |= OFC_UPDATE;
368 ret = intel_ring_begin(ring, 6);
373 /* wait for overlay to go idle */
374 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
375 intel_ring_emit(ring, flip_addr);
376 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
377 /* turn overlay off */
378 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_OFF);
379 intel_ring_emit(ring, flip_addr);
380 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
381 intel_ring_advance(ring);
383 return intel_overlay_do_wait_request(overlay, request,
384 intel_overlay_off_tail);
387 /* recover from an interruption due to a signal
388 * We have to be careful not to repeat work forever an make forward progess. */
389 static int intel_overlay_recover_from_interrupt(struct intel_overlay *overlay)
391 struct drm_device *dev = overlay->dev;
392 drm_i915_private_t *dev_priv = dev->dev_private;
393 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
396 if (overlay->last_flip_req == 0)
399 ret = i915_wait_seqno(ring, overlay->last_flip_req);
402 i915_gem_retire_requests(dev);
404 if (overlay->flip_tail)
405 overlay->flip_tail(overlay);
407 overlay->last_flip_req = 0;
411 /* Wait for pending overlay flip and release old frame.
412 * Needs to be called before the overlay register are changed
413 * via intel_overlay_(un)map_regs
415 static int intel_overlay_release_old_vid(struct intel_overlay *overlay)
417 struct drm_device *dev = overlay->dev;
418 drm_i915_private_t *dev_priv = dev->dev_private;
419 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
422 /* Only wait if there is actually an old frame to release to
423 * guarantee forward progress.
425 if (!overlay->old_vid_bo)
428 if (I915_READ(ISR) & I915_OVERLAY_PLANE_FLIP_PENDING_INTERRUPT) {
429 struct drm_i915_gem_request *request;
431 /* synchronous slowpath */
432 request = kzalloc(sizeof(*request), GFP_KERNEL);
436 ret = intel_ring_begin(ring, 2);
442 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
443 intel_ring_emit(ring, MI_NOOP);
444 intel_ring_advance(ring);
446 ret = intel_overlay_do_wait_request(overlay, request,
447 intel_overlay_release_old_vid_tail);
452 intel_overlay_release_old_vid_tail(overlay);
456 struct put_image_params {
473 static int packed_depth_bytes(u32 format)
475 switch (format & I915_OVERLAY_DEPTH_MASK) {
476 case I915_OVERLAY_YUV422:
478 case I915_OVERLAY_YUV411:
479 /* return 6; not implemented */
485 static int packed_width_bytes(u32 format, short width)
487 switch (format & I915_OVERLAY_DEPTH_MASK) {
488 case I915_OVERLAY_YUV422:
495 static int uv_hsubsampling(u32 format)
497 switch (format & I915_OVERLAY_DEPTH_MASK) {
498 case I915_OVERLAY_YUV422:
499 case I915_OVERLAY_YUV420:
501 case I915_OVERLAY_YUV411:
502 case I915_OVERLAY_YUV410:
509 static int uv_vsubsampling(u32 format)
511 switch (format & I915_OVERLAY_DEPTH_MASK) {
512 case I915_OVERLAY_YUV420:
513 case I915_OVERLAY_YUV410:
515 case I915_OVERLAY_YUV422:
516 case I915_OVERLAY_YUV411:
523 static u32 calc_swidthsw(struct drm_device *dev, u32 offset, u32 width)
525 u32 mask, shift, ret;
533 ret = ((offset + width + mask) >> shift) - (offset >> shift);
540 static const u16 y_static_hcoeffs[N_HORIZ_Y_TAPS * N_PHASES] = {
541 0x3000, 0xb4a0, 0x1930, 0x1920, 0xb4a0,
542 0x3000, 0xb500, 0x19d0, 0x1880, 0xb440,
543 0x3000, 0xb540, 0x1a88, 0x2f80, 0xb3e0,
544 0x3000, 0xb580, 0x1b30, 0x2e20, 0xb380,
545 0x3000, 0xb5c0, 0x1bd8, 0x2cc0, 0xb320,
546 0x3020, 0xb5e0, 0x1c60, 0x2b80, 0xb2c0,
547 0x3020, 0xb5e0, 0x1cf8, 0x2a20, 0xb260,
548 0x3020, 0xb5e0, 0x1d80, 0x28e0, 0xb200,
549 0x3020, 0xb5c0, 0x1e08, 0x3f40, 0xb1c0,
550 0x3020, 0xb580, 0x1e78, 0x3ce0, 0xb160,
551 0x3040, 0xb520, 0x1ed8, 0x3aa0, 0xb120,
552 0x3040, 0xb4a0, 0x1f30, 0x3880, 0xb0e0,
553 0x3040, 0xb400, 0x1f78, 0x3680, 0xb0a0,
554 0x3020, 0xb340, 0x1fb8, 0x34a0, 0xb060,
555 0x3020, 0xb240, 0x1fe0, 0x32e0, 0xb040,
556 0x3020, 0xb140, 0x1ff8, 0x3160, 0xb020,
557 0xb000, 0x3000, 0x0800, 0x3000, 0xb000
560 static const u16 uv_static_hcoeffs[N_HORIZ_UV_TAPS * N_PHASES] = {
561 0x3000, 0x1800, 0x1800, 0xb000, 0x18d0, 0x2e60,
562 0xb000, 0x1990, 0x2ce0, 0xb020, 0x1a68, 0x2b40,
563 0xb040, 0x1b20, 0x29e0, 0xb060, 0x1bd8, 0x2880,
564 0xb080, 0x1c88, 0x3e60, 0xb0a0, 0x1d28, 0x3c00,
565 0xb0c0, 0x1db8, 0x39e0, 0xb0e0, 0x1e40, 0x37e0,
566 0xb100, 0x1eb8, 0x3620, 0xb100, 0x1f18, 0x34a0,
567 0xb100, 0x1f68, 0x3360, 0xb0e0, 0x1fa8, 0x3240,
568 0xb0c0, 0x1fe0, 0x3140, 0xb060, 0x1ff0, 0x30a0,
569 0x3000, 0x0800, 0x3000
572 static void update_polyphase_filter(struct overlay_registers __iomem *regs)
574 memcpy_toio(regs->Y_HCOEFS, y_static_hcoeffs, sizeof(y_static_hcoeffs));
575 memcpy_toio(regs->UV_HCOEFS, uv_static_hcoeffs,
576 sizeof(uv_static_hcoeffs));
579 static bool update_scaling_factors(struct intel_overlay *overlay,
580 struct overlay_registers __iomem *regs,
581 struct put_image_params *params)
583 /* fixed point with a 12 bit shift */
584 u32 xscale, yscale, xscale_UV, yscale_UV;
586 #define FRACT_MASK 0xfff
587 bool scale_changed = false;
588 int uv_hscale = uv_hsubsampling(params->format);
589 int uv_vscale = uv_vsubsampling(params->format);
591 if (params->dst_w > 1)
592 xscale = ((params->src_scan_w - 1) << FP_SHIFT)
595 xscale = 1 << FP_SHIFT;
597 if (params->dst_h > 1)
598 yscale = ((params->src_scan_h - 1) << FP_SHIFT)
601 yscale = 1 << FP_SHIFT;
603 /*if (params->format & I915_OVERLAY_YUV_PLANAR) {*/
604 xscale_UV = xscale/uv_hscale;
605 yscale_UV = yscale/uv_vscale;
606 /* make the Y scale to UV scale ratio an exact multiply */
607 xscale = xscale_UV * uv_hscale;
608 yscale = yscale_UV * uv_vscale;
614 if (xscale != overlay->old_xscale || yscale != overlay->old_yscale)
615 scale_changed = true;
616 overlay->old_xscale = xscale;
617 overlay->old_yscale = yscale;
619 iowrite32(((yscale & FRACT_MASK) << 20) |
620 ((xscale >> FP_SHIFT) << 16) |
621 ((xscale & FRACT_MASK) << 3),
624 iowrite32(((yscale_UV & FRACT_MASK) << 20) |
625 ((xscale_UV >> FP_SHIFT) << 16) |
626 ((xscale_UV & FRACT_MASK) << 3),
629 iowrite32((((yscale >> FP_SHIFT) << 16) |
630 ((yscale_UV >> FP_SHIFT) << 0)),
634 update_polyphase_filter(regs);
636 return scale_changed;
639 static void update_colorkey(struct intel_overlay *overlay,
640 struct overlay_registers __iomem *regs)
642 u32 key = overlay->color_key;
644 switch (overlay->crtc->base.fb->bits_per_pixel) {
646 iowrite32(0, ®s->DCLRKV);
647 iowrite32(CLK_RGB8I_MASK | DST_KEY_ENABLE, ®s->DCLRKM);
651 if (overlay->crtc->base.fb->depth == 15) {
652 iowrite32(RGB15_TO_COLORKEY(key), ®s->DCLRKV);
653 iowrite32(CLK_RGB15_MASK | DST_KEY_ENABLE,
656 iowrite32(RGB16_TO_COLORKEY(key), ®s->DCLRKV);
657 iowrite32(CLK_RGB16_MASK | DST_KEY_ENABLE,
664 iowrite32(key, ®s->DCLRKV);
665 iowrite32(CLK_RGB24_MASK | DST_KEY_ENABLE, ®s->DCLRKM);
670 static u32 overlay_cmd_reg(struct put_image_params *params)
672 u32 cmd = OCMD_ENABLE | OCMD_BUF_TYPE_FRAME | OCMD_BUFFER0;
674 if (params->format & I915_OVERLAY_YUV_PLANAR) {
675 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
676 case I915_OVERLAY_YUV422:
677 cmd |= OCMD_YUV_422_PLANAR;
679 case I915_OVERLAY_YUV420:
680 cmd |= OCMD_YUV_420_PLANAR;
682 case I915_OVERLAY_YUV411:
683 case I915_OVERLAY_YUV410:
684 cmd |= OCMD_YUV_410_PLANAR;
687 } else { /* YUV packed */
688 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
689 case I915_OVERLAY_YUV422:
690 cmd |= OCMD_YUV_422_PACKED;
692 case I915_OVERLAY_YUV411:
693 cmd |= OCMD_YUV_411_PACKED;
697 switch (params->format & I915_OVERLAY_SWAP_MASK) {
698 case I915_OVERLAY_NO_SWAP:
700 case I915_OVERLAY_UV_SWAP:
703 case I915_OVERLAY_Y_SWAP:
706 case I915_OVERLAY_Y_AND_UV_SWAP:
707 cmd |= OCMD_Y_AND_UV_SWAP;
715 static int intel_overlay_do_put_image(struct intel_overlay *overlay,
716 struct drm_i915_gem_object *new_bo,
717 struct put_image_params *params)
720 struct overlay_registers __iomem *regs;
721 bool scale_changed = false;
722 struct drm_device *dev = overlay->dev;
723 u32 swidth, swidthsw, sheight, ostride;
725 BUG_ON(!mutex_is_locked(&dev->struct_mutex));
726 BUG_ON(!mutex_is_locked(&dev->mode_config.mutex));
729 ret = intel_overlay_release_old_vid(overlay);
733 ret = i915_gem_object_pin_to_display_plane(new_bo, 0, NULL);
737 ret = i915_gem_object_put_fence(new_bo);
741 if (!overlay->active) {
743 regs = intel_overlay_map_regs(overlay);
748 oconfig = OCONF_CC_OUT_8BIT;
749 if (IS_GEN4(overlay->dev))
750 oconfig |= OCONF_CSC_MODE_BT709;
751 oconfig |= overlay->crtc->pipe == 0 ?
752 OCONF_PIPE_A : OCONF_PIPE_B;
753 iowrite32(oconfig, ®s->OCONFIG);
754 intel_overlay_unmap_regs(overlay, regs);
756 ret = intel_overlay_on(overlay);
761 regs = intel_overlay_map_regs(overlay);
767 iowrite32((params->dst_y << 16) | params->dst_x, ®s->DWINPOS);
768 iowrite32((params->dst_h << 16) | params->dst_w, ®s->DWINSZ);
770 if (params->format & I915_OVERLAY_YUV_PACKED)
771 tmp_width = packed_width_bytes(params->format, params->src_w);
773 tmp_width = params->src_w;
775 swidth = params->src_w;
776 swidthsw = calc_swidthsw(overlay->dev, params->offset_Y, tmp_width);
777 sheight = params->src_h;
778 iowrite32(new_bo->gtt_offset + params->offset_Y, ®s->OBUF_0Y);
779 ostride = params->stride_Y;
781 if (params->format & I915_OVERLAY_YUV_PLANAR) {
782 int uv_hscale = uv_hsubsampling(params->format);
783 int uv_vscale = uv_vsubsampling(params->format);
785 swidth |= (params->src_w/uv_hscale) << 16;
786 tmp_U = calc_swidthsw(overlay->dev, params->offset_U,
787 params->src_w/uv_hscale);
788 tmp_V = calc_swidthsw(overlay->dev, params->offset_V,
789 params->src_w/uv_hscale);
790 swidthsw |= max_t(u32, tmp_U, tmp_V) << 16;
791 sheight |= (params->src_h/uv_vscale) << 16;
792 iowrite32(new_bo->gtt_offset + params->offset_U, ®s->OBUF_0U);
793 iowrite32(new_bo->gtt_offset + params->offset_V, ®s->OBUF_0V);
794 ostride |= params->stride_UV << 16;
797 iowrite32(swidth, ®s->SWIDTH);
798 iowrite32(swidthsw, ®s->SWIDTHSW);
799 iowrite32(sheight, ®s->SHEIGHT);
800 iowrite32(ostride, ®s->OSTRIDE);
802 scale_changed = update_scaling_factors(overlay, regs, params);
804 update_colorkey(overlay, regs);
806 iowrite32(overlay_cmd_reg(params), ®s->OCMD);
808 intel_overlay_unmap_regs(overlay, regs);
810 ret = intel_overlay_continue(overlay, scale_changed);
814 overlay->old_vid_bo = overlay->vid_bo;
815 overlay->vid_bo = new_bo;
820 i915_gem_object_unpin(new_bo);
824 int intel_overlay_switch_off(struct intel_overlay *overlay)
826 struct overlay_registers __iomem *regs;
827 struct drm_device *dev = overlay->dev;
830 BUG_ON(!mutex_is_locked(&dev->struct_mutex));
831 BUG_ON(!mutex_is_locked(&dev->mode_config.mutex));
833 ret = intel_overlay_recover_from_interrupt(overlay);
837 if (!overlay->active)
840 ret = intel_overlay_release_old_vid(overlay);
844 regs = intel_overlay_map_regs(overlay);
845 iowrite32(0, ®s->OCMD);
846 intel_overlay_unmap_regs(overlay, regs);
848 ret = intel_overlay_off(overlay);
852 intel_overlay_off_tail(overlay);
856 static int check_overlay_possible_on_crtc(struct intel_overlay *overlay,
857 struct intel_crtc *crtc)
859 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
864 /* can't use the overlay with double wide pipe */
865 if (INTEL_INFO(overlay->dev)->gen < 4 &&
866 (I915_READ(PIPECONF(crtc->pipe)) & (PIPECONF_DOUBLE_WIDE | PIPECONF_ENABLE)) != PIPECONF_ENABLE)
872 static void update_pfit_vscale_ratio(struct intel_overlay *overlay)
874 struct drm_device *dev = overlay->dev;
875 drm_i915_private_t *dev_priv = dev->dev_private;
876 u32 pfit_control = I915_READ(PFIT_CONTROL);
879 /* XXX: This is not the same logic as in the xorg driver, but more in
880 * line with the intel documentation for the i965
882 if (INTEL_INFO(dev)->gen >= 4) {
883 /* on i965 use the PGM reg to read out the autoscaler values */
884 ratio = I915_READ(PFIT_PGM_RATIOS) >> PFIT_VERT_SCALE_SHIFT_965;
886 if (pfit_control & VERT_AUTO_SCALE)
887 ratio = I915_READ(PFIT_AUTO_RATIOS);
889 ratio = I915_READ(PFIT_PGM_RATIOS);
890 ratio >>= PFIT_VERT_SCALE_SHIFT;
893 overlay->pfit_vscale_ratio = ratio;
896 static int check_overlay_dst(struct intel_overlay *overlay,
897 struct drm_intel_overlay_put_image *rec)
899 struct drm_display_mode *mode = &overlay->crtc->base.mode;
901 if (rec->dst_x < mode->hdisplay &&
902 rec->dst_x + rec->dst_width <= mode->hdisplay &&
903 rec->dst_y < mode->vdisplay &&
904 rec->dst_y + rec->dst_height <= mode->vdisplay)
910 static int check_overlay_scaling(struct put_image_params *rec)
914 /* downscaling limit is 8.0 */
915 tmp = ((rec->src_scan_h << 16) / rec->dst_h) >> 16;
918 tmp = ((rec->src_scan_w << 16) / rec->dst_w) >> 16;
925 static int check_overlay_src(struct drm_device *dev,
926 struct drm_intel_overlay_put_image *rec,
927 struct drm_i915_gem_object *new_bo)
929 int uv_hscale = uv_hsubsampling(rec->flags);
930 int uv_vscale = uv_vsubsampling(rec->flags);
935 /* check src dimensions */
936 if (IS_845G(dev) || IS_I830(dev)) {
937 if (rec->src_height > IMAGE_MAX_HEIGHT_LEGACY ||
938 rec->src_width > IMAGE_MAX_WIDTH_LEGACY)
941 if (rec->src_height > IMAGE_MAX_HEIGHT ||
942 rec->src_width > IMAGE_MAX_WIDTH)
946 /* better safe than sorry, use 4 as the maximal subsampling ratio */
947 if (rec->src_height < N_VERT_Y_TAPS*4 ||
948 rec->src_width < N_HORIZ_Y_TAPS*4)
951 /* check alignment constraints */
952 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
953 case I915_OVERLAY_RGB:
954 /* not implemented */
957 case I915_OVERLAY_YUV_PACKED:
961 depth = packed_depth_bytes(rec->flags);
965 /* ignore UV planes */
969 /* check pixel alignment */
970 if (rec->offset_Y % depth)
974 case I915_OVERLAY_YUV_PLANAR:
975 if (uv_vscale < 0 || uv_hscale < 0)
977 /* no offset restrictions for planar formats */
984 if (rec->src_width % uv_hscale)
987 /* stride checking */
988 if (IS_I830(dev) || IS_845G(dev))
993 if (rec->stride_Y & stride_mask || rec->stride_UV & stride_mask)
995 if (IS_GEN4(dev) && rec->stride_Y < 512)
998 tmp = (rec->flags & I915_OVERLAY_TYPE_MASK) == I915_OVERLAY_YUV_PLANAR ?
1000 if (rec->stride_Y > tmp || rec->stride_UV > 2*1024)
1003 /* check buffer dimensions */
1004 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
1005 case I915_OVERLAY_RGB:
1006 case I915_OVERLAY_YUV_PACKED:
1007 /* always 4 Y values per depth pixels */
1008 if (packed_width_bytes(rec->flags, rec->src_width) > rec->stride_Y)
1011 tmp = rec->stride_Y*rec->src_height;
1012 if (rec->offset_Y + tmp > new_bo->base.size)
1016 case I915_OVERLAY_YUV_PLANAR:
1017 if (rec->src_width > rec->stride_Y)
1019 if (rec->src_width/uv_hscale > rec->stride_UV)
1022 tmp = rec->stride_Y * rec->src_height;
1023 if (rec->offset_Y + tmp > new_bo->base.size)
1026 tmp = rec->stride_UV * (rec->src_height / uv_vscale);
1027 if (rec->offset_U + tmp > new_bo->base.size ||
1028 rec->offset_V + tmp > new_bo->base.size)
1037 * Return the pipe currently connected to the panel fitter,
1038 * or -1 if the panel fitter is not present or not in use
1040 static int intel_panel_fitter_pipe(struct drm_device *dev)
1042 struct drm_i915_private *dev_priv = dev->dev_private;
1045 /* i830 doesn't have a panel fitter */
1049 pfit_control = I915_READ(PFIT_CONTROL);
1051 /* See if the panel fitter is in use */
1052 if ((pfit_control & PFIT_ENABLE) == 0)
1055 /* 965 can place panel fitter on either pipe */
1057 return (pfit_control >> 29) & 0x3;
1059 /* older chips can only use pipe 1 */
1063 int intel_overlay_put_image(struct drm_device *dev, void *data,
1064 struct drm_file *file_priv)
1066 struct drm_intel_overlay_put_image *put_image_rec = data;
1067 drm_i915_private_t *dev_priv = dev->dev_private;
1068 struct intel_overlay *overlay;
1069 struct drm_mode_object *drmmode_obj;
1070 struct intel_crtc *crtc;
1071 struct drm_i915_gem_object *new_bo;
1072 struct put_image_params *params;
1075 /* No need to check for DRIVER_MODESET - we don't set it up then. */
1076 overlay = dev_priv->overlay;
1078 DRM_DEBUG("userspace bug: no overlay\n");
1082 if (!(put_image_rec->flags & I915_OVERLAY_ENABLE)) {
1083 mutex_lock(&dev->mode_config.mutex);
1084 mutex_lock(&dev->struct_mutex);
1086 ret = intel_overlay_switch_off(overlay);
1088 mutex_unlock(&dev->struct_mutex);
1089 mutex_unlock(&dev->mode_config.mutex);
1094 params = kmalloc(sizeof(struct put_image_params), GFP_KERNEL);
1098 drmmode_obj = drm_mode_object_find(dev, put_image_rec->crtc_id,
1099 DRM_MODE_OBJECT_CRTC);
1104 crtc = to_intel_crtc(obj_to_crtc(drmmode_obj));
1106 new_bo = to_intel_bo(drm_gem_object_lookup(dev, file_priv,
1107 put_image_rec->bo_handle));
1108 if (&new_bo->base == NULL) {
1113 mutex_lock(&dev->mode_config.mutex);
1114 mutex_lock(&dev->struct_mutex);
1116 if (new_bo->tiling_mode) {
1117 DRM_ERROR("buffer used for overlay image can not be tiled\n");
1122 ret = intel_overlay_recover_from_interrupt(overlay);
1126 if (overlay->crtc != crtc) {
1127 struct drm_display_mode *mode = &crtc->base.mode;
1128 ret = intel_overlay_switch_off(overlay);
1132 ret = check_overlay_possible_on_crtc(overlay, crtc);
1136 overlay->crtc = crtc;
1137 crtc->overlay = overlay;
1139 /* line too wide, i.e. one-line-mode */
1140 if (mode->hdisplay > 1024 &&
1141 intel_panel_fitter_pipe(dev) == crtc->pipe) {
1142 overlay->pfit_active = 1;
1143 update_pfit_vscale_ratio(overlay);
1145 overlay->pfit_active = 0;
1148 ret = check_overlay_dst(overlay, put_image_rec);
1152 if (overlay->pfit_active) {
1153 params->dst_y = ((((u32)put_image_rec->dst_y) << 12) /
1154 overlay->pfit_vscale_ratio);
1155 /* shifting right rounds downwards, so add 1 */
1156 params->dst_h = ((((u32)put_image_rec->dst_height) << 12) /
1157 overlay->pfit_vscale_ratio) + 1;
1159 params->dst_y = put_image_rec->dst_y;
1160 params->dst_h = put_image_rec->dst_height;
1162 params->dst_x = put_image_rec->dst_x;
1163 params->dst_w = put_image_rec->dst_width;
1165 params->src_w = put_image_rec->src_width;
1166 params->src_h = put_image_rec->src_height;
1167 params->src_scan_w = put_image_rec->src_scan_width;
1168 params->src_scan_h = put_image_rec->src_scan_height;
1169 if (params->src_scan_h > params->src_h ||
1170 params->src_scan_w > params->src_w) {
1175 ret = check_overlay_src(dev, put_image_rec, new_bo);
1178 params->format = put_image_rec->flags & ~I915_OVERLAY_FLAGS_MASK;
1179 params->stride_Y = put_image_rec->stride_Y;
1180 params->stride_UV = put_image_rec->stride_UV;
1181 params->offset_Y = put_image_rec->offset_Y;
1182 params->offset_U = put_image_rec->offset_U;
1183 params->offset_V = put_image_rec->offset_V;
1185 /* Check scaling after src size to prevent a divide-by-zero. */
1186 ret = check_overlay_scaling(params);
1190 ret = intel_overlay_do_put_image(overlay, new_bo, params);
1194 mutex_unlock(&dev->struct_mutex);
1195 mutex_unlock(&dev->mode_config.mutex);
1202 mutex_unlock(&dev->struct_mutex);
1203 mutex_unlock(&dev->mode_config.mutex);
1204 drm_gem_object_unreference_unlocked(&new_bo->base);
1211 static void update_reg_attrs(struct intel_overlay *overlay,
1212 struct overlay_registers __iomem *regs)
1214 iowrite32((overlay->contrast << 18) | (overlay->brightness & 0xff),
1216 iowrite32(overlay->saturation, ®s->OCLRC1);
1219 static bool check_gamma_bounds(u32 gamma1, u32 gamma2)
1223 if (gamma1 & 0xff000000 || gamma2 & 0xff000000)
1226 for (i = 0; i < 3; i++) {
1227 if (((gamma1 >> i*8) & 0xff) >= ((gamma2 >> i*8) & 0xff))
1234 static bool check_gamma5_errata(u32 gamma5)
1238 for (i = 0; i < 3; i++) {
1239 if (((gamma5 >> i*8) & 0xff) == 0x80)
1246 static int check_gamma(struct drm_intel_overlay_attrs *attrs)
1248 if (!check_gamma_bounds(0, attrs->gamma0) ||
1249 !check_gamma_bounds(attrs->gamma0, attrs->gamma1) ||
1250 !check_gamma_bounds(attrs->gamma1, attrs->gamma2) ||
1251 !check_gamma_bounds(attrs->gamma2, attrs->gamma3) ||
1252 !check_gamma_bounds(attrs->gamma3, attrs->gamma4) ||
1253 !check_gamma_bounds(attrs->gamma4, attrs->gamma5) ||
1254 !check_gamma_bounds(attrs->gamma5, 0x00ffffff))
1257 if (!check_gamma5_errata(attrs->gamma5))
1263 int intel_overlay_attrs(struct drm_device *dev, void *data,
1264 struct drm_file *file_priv)
1266 struct drm_intel_overlay_attrs *attrs = data;
1267 drm_i915_private_t *dev_priv = dev->dev_private;
1268 struct intel_overlay *overlay;
1269 struct overlay_registers __iomem *regs;
1272 /* No need to check for DRIVER_MODESET - we don't set it up then. */
1273 overlay = dev_priv->overlay;
1275 DRM_DEBUG("userspace bug: no overlay\n");
1279 mutex_lock(&dev->mode_config.mutex);
1280 mutex_lock(&dev->struct_mutex);
1283 if (!(attrs->flags & I915_OVERLAY_UPDATE_ATTRS)) {
1284 attrs->color_key = overlay->color_key;
1285 attrs->brightness = overlay->brightness;
1286 attrs->contrast = overlay->contrast;
1287 attrs->saturation = overlay->saturation;
1289 if (!IS_GEN2(dev)) {
1290 attrs->gamma0 = I915_READ(OGAMC0);
1291 attrs->gamma1 = I915_READ(OGAMC1);
1292 attrs->gamma2 = I915_READ(OGAMC2);
1293 attrs->gamma3 = I915_READ(OGAMC3);
1294 attrs->gamma4 = I915_READ(OGAMC4);
1295 attrs->gamma5 = I915_READ(OGAMC5);
1298 if (attrs->brightness < -128 || attrs->brightness > 127)
1300 if (attrs->contrast > 255)
1302 if (attrs->saturation > 1023)
1305 overlay->color_key = attrs->color_key;
1306 overlay->brightness = attrs->brightness;
1307 overlay->contrast = attrs->contrast;
1308 overlay->saturation = attrs->saturation;
1310 regs = intel_overlay_map_regs(overlay);
1316 update_reg_attrs(overlay, regs);
1318 intel_overlay_unmap_regs(overlay, regs);
1320 if (attrs->flags & I915_OVERLAY_UPDATE_GAMMA) {
1324 if (overlay->active) {
1329 ret = check_gamma(attrs);
1333 I915_WRITE(OGAMC0, attrs->gamma0);
1334 I915_WRITE(OGAMC1, attrs->gamma1);
1335 I915_WRITE(OGAMC2, attrs->gamma2);
1336 I915_WRITE(OGAMC3, attrs->gamma3);
1337 I915_WRITE(OGAMC4, attrs->gamma4);
1338 I915_WRITE(OGAMC5, attrs->gamma5);
1344 mutex_unlock(&dev->struct_mutex);
1345 mutex_unlock(&dev->mode_config.mutex);
1350 void intel_setup_overlay(struct drm_device *dev)
1352 drm_i915_private_t *dev_priv = dev->dev_private;
1353 struct intel_overlay *overlay;
1354 struct drm_i915_gem_object *reg_bo;
1355 struct overlay_registers __iomem *regs;
1358 if (!HAS_OVERLAY(dev))
1361 overlay = kzalloc(sizeof(struct intel_overlay), GFP_KERNEL);
1365 mutex_lock(&dev->struct_mutex);
1366 if (WARN_ON(dev_priv->overlay))
1371 reg_bo = i915_gem_alloc_object(dev, PAGE_SIZE);
1374 overlay->reg_bo = reg_bo;
1376 if (OVERLAY_NEEDS_PHYSICAL(dev)) {
1377 ret = i915_gem_attach_phys_object(dev, reg_bo,
1378 I915_GEM_PHYS_OVERLAY_REGS,
1381 DRM_ERROR("failed to attach phys overlay regs\n");
1384 overlay->flip_addr = reg_bo->phys_obj->handle->busaddr;
1386 ret = i915_gem_object_pin(reg_bo, PAGE_SIZE, true, false);
1388 DRM_ERROR("failed to pin overlay register bo\n");
1391 overlay->flip_addr = reg_bo->gtt_offset;
1393 ret = i915_gem_object_set_to_gtt_domain(reg_bo, true);
1395 DRM_ERROR("failed to move overlay register bo into the GTT\n");
1400 /* init all values */
1401 overlay->color_key = 0x0101fe;
1402 overlay->brightness = -19;
1403 overlay->contrast = 75;
1404 overlay->saturation = 146;
1406 regs = intel_overlay_map_regs(overlay);
1410 memset_io(regs, 0, sizeof(struct overlay_registers));
1411 update_polyphase_filter(regs);
1412 update_reg_attrs(overlay, regs);
1414 intel_overlay_unmap_regs(overlay, regs);
1416 dev_priv->overlay = overlay;
1417 mutex_unlock(&dev->struct_mutex);
1418 DRM_INFO("initialized overlay support\n");
1422 if (!OVERLAY_NEEDS_PHYSICAL(dev))
1423 i915_gem_object_unpin(reg_bo);
1425 drm_gem_object_unreference(®_bo->base);
1427 mutex_unlock(&dev->struct_mutex);
1432 void intel_cleanup_overlay(struct drm_device *dev)
1434 drm_i915_private_t *dev_priv = dev->dev_private;
1436 if (!dev_priv->overlay)
1439 /* The bo's should be free'd by the generic code already.
1440 * Furthermore modesetting teardown happens beforehand so the
1441 * hardware should be off already */
1442 BUG_ON(dev_priv->overlay->active);
1444 drm_gem_object_unreference_unlocked(&dev_priv->overlay->reg_bo->base);
1445 kfree(dev_priv->overlay);
1448 #ifdef CONFIG_DEBUG_FS
1449 #include <linux/seq_file.h>
1451 struct intel_overlay_error_state {
1452 struct overlay_registers regs;
1458 static struct overlay_registers __iomem *
1459 intel_overlay_map_regs_atomic(struct intel_overlay *overlay)
1461 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
1462 struct overlay_registers __iomem *regs;
1464 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1465 /* Cast to make sparse happy, but it's wc memory anyway, so
1466 * equivalent to the wc io mapping on X86. */
1467 regs = (struct overlay_registers __iomem *)
1468 overlay->reg_bo->phys_obj->handle->vaddr;
1470 regs = io_mapping_map_atomic_wc(dev_priv->mm.gtt_mapping,
1471 overlay->reg_bo->gtt_offset);
1476 static void intel_overlay_unmap_regs_atomic(struct intel_overlay *overlay,
1477 struct overlay_registers __iomem *regs)
1479 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1480 io_mapping_unmap_atomic(regs);
1484 struct intel_overlay_error_state *
1485 intel_overlay_capture_error_state(struct drm_device *dev)
1487 drm_i915_private_t *dev_priv = dev->dev_private;
1488 struct intel_overlay *overlay = dev_priv->overlay;
1489 struct intel_overlay_error_state *error;
1490 struct overlay_registers __iomem *regs;
1492 if (!overlay || !overlay->active)
1495 error = kmalloc(sizeof(*error), GFP_ATOMIC);
1499 error->dovsta = I915_READ(DOVSTA);
1500 error->isr = I915_READ(ISR);
1501 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1502 error->base = (__force long)overlay->reg_bo->phys_obj->handle->vaddr;
1504 error->base = overlay->reg_bo->gtt_offset;
1506 regs = intel_overlay_map_regs_atomic(overlay);
1510 memcpy_fromio(&error->regs, regs, sizeof(struct overlay_registers));
1511 intel_overlay_unmap_regs_atomic(overlay, regs);
1521 intel_overlay_print_error_state(struct seq_file *m, struct intel_overlay_error_state *error)
1523 seq_printf(m, "Overlay, status: 0x%08x, interrupt: 0x%08x\n",
1524 error->dovsta, error->isr);
1525 seq_printf(m, " Register file at 0x%08lx:\n",
1528 #define P(x) seq_printf(m, " " #x ": 0x%08x\n", error->regs.x)