4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Daniel Vetter <daniel@ffwll.ch>
26 * Derived from Xorg ddx, xf86-video-intel, src/i830_video.c
28 #include <sys/cdefs.h>
29 __FBSDID("$FreeBSD$");
31 #include <dev/drm2/drmP.h>
32 #include <dev/drm2/i915/i915_drm.h>
33 #include <dev/drm2/i915/i915_drv.h>
34 #include <dev/drm2/i915/i915_reg.h>
35 #include <dev/drm2/i915/intel_drv.h>
37 /* Limits for overlay size. According to intel doc, the real limits are:
38 * Y width: 4095, UV width (planar): 2047, Y height: 2047,
39 * UV width (planar): * 1023. But the xorg thinks 2048 for height and width. Use
40 * the mininum of both. */
41 #define IMAGE_MAX_WIDTH 2048
42 #define IMAGE_MAX_HEIGHT 2046 /* 2 * 1023 */
43 /* on 830 and 845 these large limits result in the card hanging */
44 #define IMAGE_MAX_WIDTH_LEGACY 1024
45 #define IMAGE_MAX_HEIGHT_LEGACY 1088
47 /* overlay register definitions */
49 #define OCMD_TILED_SURFACE (0x1<<19)
50 #define OCMD_MIRROR_MASK (0x3<<17)
51 #define OCMD_MIRROR_MODE (0x3<<17)
52 #define OCMD_MIRROR_HORIZONTAL (0x1<<17)
53 #define OCMD_MIRROR_VERTICAL (0x2<<17)
54 #define OCMD_MIRROR_BOTH (0x3<<17)
55 #define OCMD_BYTEORDER_MASK (0x3<<14) /* zero for YUYV or FOURCC YUY2 */
56 #define OCMD_UV_SWAP (0x1<<14) /* YVYU */
57 #define OCMD_Y_SWAP (0x2<<14) /* UYVY or FOURCC UYVY */
58 #define OCMD_Y_AND_UV_SWAP (0x3<<14) /* VYUY */
59 #define OCMD_SOURCE_FORMAT_MASK (0xf<<10)
60 #define OCMD_RGB_888 (0x1<<10) /* not in i965 Intel docs */
61 #define OCMD_RGB_555 (0x2<<10) /* not in i965 Intel docs */
62 #define OCMD_RGB_565 (0x3<<10) /* not in i965 Intel docs */
63 #define OCMD_YUV_422_PACKED (0x8<<10)
64 #define OCMD_YUV_411_PACKED (0x9<<10) /* not in i965 Intel docs */
65 #define OCMD_YUV_420_PLANAR (0xc<<10)
66 #define OCMD_YUV_422_PLANAR (0xd<<10)
67 #define OCMD_YUV_410_PLANAR (0xe<<10) /* also 411 */
68 #define OCMD_TVSYNCFLIP_PARITY (0x1<<9)
69 #define OCMD_TVSYNCFLIP_ENABLE (0x1<<7)
70 #define OCMD_BUF_TYPE_MASK (0x1<<5)
71 #define OCMD_BUF_TYPE_FRAME (0x0<<5)
72 #define OCMD_BUF_TYPE_FIELD (0x1<<5)
73 #define OCMD_TEST_MODE (0x1<<4)
74 #define OCMD_BUFFER_SELECT (0x3<<2)
75 #define OCMD_BUFFER0 (0x0<<2)
76 #define OCMD_BUFFER1 (0x1<<2)
77 #define OCMD_FIELD_SELECT (0x1<<2)
78 #define OCMD_FIELD0 (0x0<<1)
79 #define OCMD_FIELD1 (0x1<<1)
80 #define OCMD_ENABLE (0x1<<0)
82 /* OCONFIG register */
83 #define OCONF_PIPE_MASK (0x1<<18)
84 #define OCONF_PIPE_A (0x0<<18)
85 #define OCONF_PIPE_B (0x1<<18)
86 #define OCONF_GAMMA2_ENABLE (0x1<<16)
87 #define OCONF_CSC_MODE_BT601 (0x0<<5)
88 #define OCONF_CSC_MODE_BT709 (0x1<<5)
89 #define OCONF_CSC_BYPASS (0x1<<4)
90 #define OCONF_CC_OUT_8BIT (0x1<<3)
91 #define OCONF_TEST_MODE (0x1<<2)
92 #define OCONF_THREE_LINE_BUFFER (0x1<<0)
93 #define OCONF_TWO_LINE_BUFFER (0x0<<0)
95 /* DCLRKM (dst-key) register */
96 #define DST_KEY_ENABLE (0x1<<31)
97 #define CLK_RGB24_MASK 0x0
98 #define CLK_RGB16_MASK 0x070307
99 #define CLK_RGB15_MASK 0x070707
100 #define CLK_RGB8I_MASK 0xffffff
102 #define RGB16_TO_COLORKEY(c) \
103 (((c & 0xF800) << 8) | ((c & 0x07E0) << 5) | ((c & 0x001F) << 3))
104 #define RGB15_TO_COLORKEY(c) \
105 (((c & 0x7c00) << 9) | ((c & 0x03E0) << 6) | ((c & 0x001F) << 3))
107 /* overlay flip addr flag */
108 #define OFC_UPDATE 0x1
110 /* polyphase filter coefficients */
111 #define N_HORIZ_Y_TAPS 5
112 #define N_VERT_Y_TAPS 3
113 #define N_HORIZ_UV_TAPS 3
114 #define N_VERT_UV_TAPS 3
118 /* memory bufferd overlay registers */
119 struct overlay_registers {
147 u32 RESERVED1; /* 0x6C */
160 u32 FASTHSCALE; /* 0xA0 */
161 u32 UVSCALEV; /* 0xA4 */
162 u32 RESERVEDC[(0x200 - 0xA8) / 4]; /* 0xA8 - 0x1FC */
163 u16 Y_VCOEFS[N_VERT_Y_TAPS * N_PHASES]; /* 0x200 */
164 u16 RESERVEDD[0x100 / 2 - N_VERT_Y_TAPS * N_PHASES];
165 u16 Y_HCOEFS[N_HORIZ_Y_TAPS * N_PHASES]; /* 0x300 */
166 u16 RESERVEDE[0x200 / 2 - N_HORIZ_Y_TAPS * N_PHASES];
167 u16 UV_VCOEFS[N_VERT_UV_TAPS * N_PHASES]; /* 0x500 */
168 u16 RESERVEDF[0x100 / 2 - N_VERT_UV_TAPS * N_PHASES];
169 u16 UV_HCOEFS[N_HORIZ_UV_TAPS * N_PHASES]; /* 0x600 */
170 u16 RESERVEDG[0x100 / 2 - N_HORIZ_UV_TAPS * N_PHASES];
173 struct intel_overlay {
174 struct drm_device *dev;
175 struct intel_crtc *crtc;
176 struct drm_i915_gem_object *vid_bo;
177 struct drm_i915_gem_object *old_vid_bo;
180 u32 pfit_vscale_ratio; /* shifted-point number, (1<<12) == 1.0 */
182 u32 brightness, contrast, saturation;
183 u32 old_xscale, old_yscale;
184 /* register access */
186 struct drm_i915_gem_object *reg_bo;
188 uint32_t last_flip_req;
189 void (*flip_tail)(struct intel_overlay *);
192 static struct overlay_registers __iomem *
193 intel_overlay_map_regs(struct intel_overlay *overlay)
195 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
196 struct overlay_registers __iomem *regs;
198 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
199 regs = (struct overlay_registers __iomem *)overlay->reg_bo->phys_obj->handle->vaddr;
201 regs = pmap_mapdev_attr(dev_priv->mm.gtt_base_addr +
202 overlay->reg_bo->gtt_offset, PAGE_SIZE,
203 PAT_WRITE_COMBINING);
208 static void intel_overlay_unmap_regs(struct intel_overlay *overlay,
209 struct overlay_registers __iomem *regs)
211 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
212 pmap_unmapdev((vm_offset_t)regs, PAGE_SIZE);
215 static int intel_overlay_do_wait_request(struct intel_overlay *overlay,
216 void (*tail)(struct intel_overlay *))
218 struct drm_device *dev = overlay->dev;
219 drm_i915_private_t *dev_priv = dev->dev_private;
220 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
223 BUG_ON(overlay->last_flip_req);
224 ret = i915_add_request(ring, NULL, &overlay->last_flip_req);
228 overlay->flip_tail = tail;
229 ret = i915_wait_seqno(ring, overlay->last_flip_req);
232 i915_gem_retire_requests(dev);
234 overlay->last_flip_req = 0;
238 /* overlay needs to be disable in OCMD reg */
239 static int intel_overlay_on(struct intel_overlay *overlay)
241 struct drm_device *dev = overlay->dev;
242 struct drm_i915_private *dev_priv = dev->dev_private;
243 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
246 BUG_ON(overlay->active);
249 WARN_ON(IS_I830(dev) && !(dev_priv->quirks & QUIRK_PIPEA_FORCE));
251 ret = intel_ring_begin(ring, 4);
255 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_ON);
256 intel_ring_emit(ring, overlay->flip_addr | OFC_UPDATE);
257 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
258 intel_ring_emit(ring, MI_NOOP);
259 intel_ring_advance(ring);
261 return intel_overlay_do_wait_request(overlay, NULL);
264 /* overlay needs to be enabled in OCMD reg */
265 static int intel_overlay_continue(struct intel_overlay *overlay,
266 bool load_polyphase_filter)
268 struct drm_device *dev = overlay->dev;
269 drm_i915_private_t *dev_priv = dev->dev_private;
270 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
271 u32 flip_addr = overlay->flip_addr;
275 BUG_ON(!overlay->active);
277 if (load_polyphase_filter)
278 flip_addr |= OFC_UPDATE;
280 /* check for underruns */
281 tmp = I915_READ(DOVSTA);
283 DRM_DEBUG("overlay underrun, DOVSTA: %x\n", tmp);
285 ret = intel_ring_begin(ring, 2);
289 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
290 intel_ring_emit(ring, flip_addr);
291 intel_ring_advance(ring);
293 return i915_add_request(ring, NULL, &overlay->last_flip_req);
296 static void intel_overlay_release_old_vid_tail(struct intel_overlay *overlay)
298 struct drm_i915_gem_object *obj = overlay->old_vid_bo;
300 i915_gem_object_unpin(obj);
301 drm_gem_object_unreference(&obj->base);
303 overlay->old_vid_bo = NULL;
306 static void intel_overlay_off_tail(struct intel_overlay *overlay)
308 struct drm_i915_gem_object *obj = overlay->vid_bo;
310 /* never have the overlay hw on without showing a frame */
311 BUG_ON(!overlay->vid_bo);
313 i915_gem_object_unpin(obj);
314 drm_gem_object_unreference(&obj->base);
315 overlay->vid_bo = NULL;
317 overlay->crtc->overlay = NULL;
318 overlay->crtc = NULL;
322 /* overlay needs to be disabled in OCMD reg */
323 static int intel_overlay_off(struct intel_overlay *overlay)
325 struct drm_device *dev = overlay->dev;
326 struct drm_i915_private *dev_priv = dev->dev_private;
327 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
328 u32 flip_addr = overlay->flip_addr;
331 BUG_ON(!overlay->active);
333 /* According to intel docs the overlay hw may hang (when switching
334 * off) without loading the filter coeffs. It is however unclear whether
335 * this applies to the disabling of the overlay or to the switching off
336 * of the hw. Do it in both cases */
337 flip_addr |= OFC_UPDATE;
339 ret = intel_ring_begin(ring, 6);
343 /* wait for overlay to go idle */
344 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
345 intel_ring_emit(ring, flip_addr);
346 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
347 /* turn overlay off */
349 /* Workaround: Don't disable the overlay fully, since otherwise
350 * it dies on the next OVERLAY_ON cmd. */
351 intel_ring_emit(ring, MI_NOOP);
352 intel_ring_emit(ring, MI_NOOP);
353 intel_ring_emit(ring, MI_NOOP);
355 intel_ring_emit(ring, MI_OVERLAY_FLIP | MI_OVERLAY_OFF);
356 intel_ring_emit(ring, flip_addr);
357 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
359 intel_ring_advance(ring);
361 return intel_overlay_do_wait_request(overlay, intel_overlay_off_tail);
364 /* recover from an interruption due to a signal
365 * We have to be careful not to repeat work forever an make forward progess. */
366 static int intel_overlay_recover_from_interrupt(struct intel_overlay *overlay)
368 struct drm_device *dev = overlay->dev;
369 drm_i915_private_t *dev_priv = dev->dev_private;
370 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
373 if (overlay->last_flip_req == 0)
376 ret = i915_wait_seqno(ring, overlay->last_flip_req);
379 i915_gem_retire_requests(dev);
381 if (overlay->flip_tail)
382 overlay->flip_tail(overlay);
384 overlay->last_flip_req = 0;
388 /* Wait for pending overlay flip and release old frame.
389 * Needs to be called before the overlay register are changed
390 * via intel_overlay_(un)map_regs
392 static int intel_overlay_release_old_vid(struct intel_overlay *overlay)
394 struct drm_device *dev = overlay->dev;
395 drm_i915_private_t *dev_priv = dev->dev_private;
396 struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
399 /* Only wait if there is actually an old frame to release to
400 * guarantee forward progress.
402 if (!overlay->old_vid_bo)
405 if (I915_READ(ISR) & I915_OVERLAY_PLANE_FLIP_PENDING_INTERRUPT) {
406 /* synchronous slowpath */
407 ret = intel_ring_begin(ring, 2);
411 intel_ring_emit(ring, MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
412 intel_ring_emit(ring, MI_NOOP);
413 intel_ring_advance(ring);
415 ret = intel_overlay_do_wait_request(overlay,
416 intel_overlay_release_old_vid_tail);
421 intel_overlay_release_old_vid_tail(overlay);
425 struct put_image_params {
442 static int packed_depth_bytes(u32 format)
444 switch (format & I915_OVERLAY_DEPTH_MASK) {
445 case I915_OVERLAY_YUV422:
447 case I915_OVERLAY_YUV411:
448 /* return 6; not implemented */
454 static int packed_width_bytes(u32 format, short width)
456 switch (format & I915_OVERLAY_DEPTH_MASK) {
457 case I915_OVERLAY_YUV422:
464 static int uv_hsubsampling(u32 format)
466 switch (format & I915_OVERLAY_DEPTH_MASK) {
467 case I915_OVERLAY_YUV422:
468 case I915_OVERLAY_YUV420:
470 case I915_OVERLAY_YUV411:
471 case I915_OVERLAY_YUV410:
478 static int uv_vsubsampling(u32 format)
480 switch (format & I915_OVERLAY_DEPTH_MASK) {
481 case I915_OVERLAY_YUV420:
482 case I915_OVERLAY_YUV410:
484 case I915_OVERLAY_YUV422:
485 case I915_OVERLAY_YUV411:
492 static u32 calc_swidthsw(struct drm_device *dev, u32 offset, u32 width)
494 u32 mask, shift, ret;
502 ret = ((offset + width + mask) >> shift) - (offset >> shift);
509 static const u16 y_static_hcoeffs[N_HORIZ_Y_TAPS * N_PHASES] = {
510 0x3000, 0xb4a0, 0x1930, 0x1920, 0xb4a0,
511 0x3000, 0xb500, 0x19d0, 0x1880, 0xb440,
512 0x3000, 0xb540, 0x1a88, 0x2f80, 0xb3e0,
513 0x3000, 0xb580, 0x1b30, 0x2e20, 0xb380,
514 0x3000, 0xb5c0, 0x1bd8, 0x2cc0, 0xb320,
515 0x3020, 0xb5e0, 0x1c60, 0x2b80, 0xb2c0,
516 0x3020, 0xb5e0, 0x1cf8, 0x2a20, 0xb260,
517 0x3020, 0xb5e0, 0x1d80, 0x28e0, 0xb200,
518 0x3020, 0xb5c0, 0x1e08, 0x3f40, 0xb1c0,
519 0x3020, 0xb580, 0x1e78, 0x3ce0, 0xb160,
520 0x3040, 0xb520, 0x1ed8, 0x3aa0, 0xb120,
521 0x3040, 0xb4a0, 0x1f30, 0x3880, 0xb0e0,
522 0x3040, 0xb400, 0x1f78, 0x3680, 0xb0a0,
523 0x3020, 0xb340, 0x1fb8, 0x34a0, 0xb060,
524 0x3020, 0xb240, 0x1fe0, 0x32e0, 0xb040,
525 0x3020, 0xb140, 0x1ff8, 0x3160, 0xb020,
526 0xb000, 0x3000, 0x0800, 0x3000, 0xb000
529 static const u16 uv_static_hcoeffs[N_HORIZ_UV_TAPS * N_PHASES] = {
530 0x3000, 0x1800, 0x1800, 0xb000, 0x18d0, 0x2e60,
531 0xb000, 0x1990, 0x2ce0, 0xb020, 0x1a68, 0x2b40,
532 0xb040, 0x1b20, 0x29e0, 0xb060, 0x1bd8, 0x2880,
533 0xb080, 0x1c88, 0x3e60, 0xb0a0, 0x1d28, 0x3c00,
534 0xb0c0, 0x1db8, 0x39e0, 0xb0e0, 0x1e40, 0x37e0,
535 0xb100, 0x1eb8, 0x3620, 0xb100, 0x1f18, 0x34a0,
536 0xb100, 0x1f68, 0x3360, 0xb0e0, 0x1fa8, 0x3240,
537 0xb0c0, 0x1fe0, 0x3140, 0xb060, 0x1ff0, 0x30a0,
538 0x3000, 0x0800, 0x3000
541 static void update_polyphase_filter(struct overlay_registers __iomem *regs)
543 memcpy_toio(regs->Y_HCOEFS, y_static_hcoeffs, sizeof(y_static_hcoeffs));
544 memcpy_toio(regs->UV_HCOEFS, uv_static_hcoeffs,
545 sizeof(uv_static_hcoeffs));
548 static bool update_scaling_factors(struct intel_overlay *overlay,
549 struct overlay_registers __iomem *regs,
550 struct put_image_params *params)
552 /* fixed point with a 12 bit shift */
553 u32 xscale, yscale, xscale_UV, yscale_UV;
555 #define FRACT_MASK 0xfff
556 bool scale_changed = false;
557 int uv_hscale = uv_hsubsampling(params->format);
558 int uv_vscale = uv_vsubsampling(params->format);
560 if (params->dst_w > 1)
561 xscale = ((params->src_scan_w - 1) << FP_SHIFT)
564 xscale = 1 << FP_SHIFT;
566 if (params->dst_h > 1)
567 yscale = ((params->src_scan_h - 1) << FP_SHIFT)
570 yscale = 1 << FP_SHIFT;
572 /*if (params->format & I915_OVERLAY_YUV_PLANAR) {*/
573 xscale_UV = xscale/uv_hscale;
574 yscale_UV = yscale/uv_vscale;
575 /* make the Y scale to UV scale ratio an exact multiply */
576 xscale = xscale_UV * uv_hscale;
577 yscale = yscale_UV * uv_vscale;
583 if (xscale != overlay->old_xscale || yscale != overlay->old_yscale)
584 scale_changed = true;
585 overlay->old_xscale = xscale;
586 overlay->old_yscale = yscale;
588 iowrite32(((yscale & FRACT_MASK) << 20) |
589 ((xscale >> FP_SHIFT) << 16) |
590 ((xscale & FRACT_MASK) << 3),
593 iowrite32(((yscale_UV & FRACT_MASK) << 20) |
594 ((xscale_UV >> FP_SHIFT) << 16) |
595 ((xscale_UV & FRACT_MASK) << 3),
598 iowrite32((((yscale >> FP_SHIFT) << 16) |
599 ((yscale_UV >> FP_SHIFT) << 0)),
603 update_polyphase_filter(regs);
605 return scale_changed;
608 static void update_colorkey(struct intel_overlay *overlay,
609 struct overlay_registers __iomem *regs)
611 u32 key = overlay->color_key;
613 switch (overlay->crtc->base.fb->bits_per_pixel) {
615 iowrite32(0, ®s->DCLRKV);
616 iowrite32(CLK_RGB8I_MASK | DST_KEY_ENABLE, ®s->DCLRKM);
620 if (overlay->crtc->base.fb->depth == 15) {
621 iowrite32(RGB15_TO_COLORKEY(key), ®s->DCLRKV);
622 iowrite32(CLK_RGB15_MASK | DST_KEY_ENABLE,
625 iowrite32(RGB16_TO_COLORKEY(key), ®s->DCLRKV);
626 iowrite32(CLK_RGB16_MASK | DST_KEY_ENABLE,
633 iowrite32(key, ®s->DCLRKV);
634 iowrite32(CLK_RGB24_MASK | DST_KEY_ENABLE, ®s->DCLRKM);
639 static u32 overlay_cmd_reg(struct put_image_params *params)
641 u32 cmd = OCMD_ENABLE | OCMD_BUF_TYPE_FRAME | OCMD_BUFFER0;
643 if (params->format & I915_OVERLAY_YUV_PLANAR) {
644 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
645 case I915_OVERLAY_YUV422:
646 cmd |= OCMD_YUV_422_PLANAR;
648 case I915_OVERLAY_YUV420:
649 cmd |= OCMD_YUV_420_PLANAR;
651 case I915_OVERLAY_YUV411:
652 case I915_OVERLAY_YUV410:
653 cmd |= OCMD_YUV_410_PLANAR;
656 } else { /* YUV packed */
657 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
658 case I915_OVERLAY_YUV422:
659 cmd |= OCMD_YUV_422_PACKED;
661 case I915_OVERLAY_YUV411:
662 cmd |= OCMD_YUV_411_PACKED;
666 switch (params->format & I915_OVERLAY_SWAP_MASK) {
667 case I915_OVERLAY_NO_SWAP:
669 case I915_OVERLAY_UV_SWAP:
672 case I915_OVERLAY_Y_SWAP:
675 case I915_OVERLAY_Y_AND_UV_SWAP:
676 cmd |= OCMD_Y_AND_UV_SWAP;
684 static int intel_overlay_do_put_image(struct intel_overlay *overlay,
685 struct drm_i915_gem_object *new_bo,
686 struct put_image_params *params)
689 struct overlay_registers __iomem *regs;
690 bool scale_changed = false;
692 struct drm_device *dev = overlay->dev;
694 u32 swidth, swidthsw, sheight, ostride;
696 DRM_LOCK_ASSERT(dev);
697 sx_assert(&dev->mode_config.mutex, SA_XLOCKED);
700 ret = intel_overlay_release_old_vid(overlay);
704 ret = i915_gem_object_pin_to_display_plane(new_bo, 0, NULL);
708 ret = i915_gem_object_put_fence(new_bo);
712 if (!overlay->active) {
714 regs = intel_overlay_map_regs(overlay);
719 oconfig = OCONF_CC_OUT_8BIT;
720 if (IS_GEN4(overlay->dev))
721 oconfig |= OCONF_CSC_MODE_BT709;
722 oconfig |= overlay->crtc->pipe == 0 ?
723 OCONF_PIPE_A : OCONF_PIPE_B;
724 iowrite32(oconfig, ®s->OCONFIG);
725 intel_overlay_unmap_regs(overlay, regs);
727 ret = intel_overlay_on(overlay);
732 regs = intel_overlay_map_regs(overlay);
738 iowrite32((params->dst_y << 16) | params->dst_x, ®s->DWINPOS);
739 iowrite32((params->dst_h << 16) | params->dst_w, ®s->DWINSZ);
741 if (params->format & I915_OVERLAY_YUV_PACKED)
742 tmp_width = packed_width_bytes(params->format, params->src_w);
744 tmp_width = params->src_w;
746 swidth = params->src_w;
747 swidthsw = calc_swidthsw(overlay->dev, params->offset_Y, tmp_width);
748 sheight = params->src_h;
749 iowrite32(new_bo->gtt_offset + params->offset_Y, ®s->OBUF_0Y);
750 ostride = params->stride_Y;
752 if (params->format & I915_OVERLAY_YUV_PLANAR) {
753 int uv_hscale = uv_hsubsampling(params->format);
754 int uv_vscale = uv_vsubsampling(params->format);
756 swidth |= (params->src_w/uv_hscale) << 16;
757 tmp_U = calc_swidthsw(overlay->dev, params->offset_U,
758 params->src_w/uv_hscale);
759 tmp_V = calc_swidthsw(overlay->dev, params->offset_V,
760 params->src_w/uv_hscale);
761 swidthsw |= max_t(u32, tmp_U, tmp_V) << 16;
762 sheight |= (params->src_h/uv_vscale) << 16;
763 iowrite32(new_bo->gtt_offset + params->offset_U, ®s->OBUF_0U);
764 iowrite32(new_bo->gtt_offset + params->offset_V, ®s->OBUF_0V);
765 ostride |= params->stride_UV << 16;
768 iowrite32(swidth, ®s->SWIDTH);
769 iowrite32(swidthsw, ®s->SWIDTHSW);
770 iowrite32(sheight, ®s->SHEIGHT);
771 iowrite32(ostride, ®s->OSTRIDE);
773 scale_changed = update_scaling_factors(overlay, regs, params);
775 update_colorkey(overlay, regs);
777 iowrite32(overlay_cmd_reg(params), ®s->OCMD);
779 intel_overlay_unmap_regs(overlay, regs);
781 ret = intel_overlay_continue(overlay, scale_changed);
785 overlay->old_vid_bo = overlay->vid_bo;
786 overlay->vid_bo = new_bo;
791 i915_gem_object_unpin(new_bo);
795 int intel_overlay_switch_off(struct intel_overlay *overlay)
797 struct overlay_registers __iomem *regs;
799 struct drm_device *dev = overlay->dev;
803 DRM_LOCK_ASSERT(dev);
804 sx_assert(&dev->mode_config.mutex, SA_XLOCKED);
806 ret = intel_overlay_recover_from_interrupt(overlay);
810 if (!overlay->active)
813 ret = intel_overlay_release_old_vid(overlay);
817 regs = intel_overlay_map_regs(overlay);
818 iowrite32(0, ®s->OCMD);
819 intel_overlay_unmap_regs(overlay, regs);
821 ret = intel_overlay_off(overlay);
825 intel_overlay_off_tail(overlay);
829 static int check_overlay_possible_on_crtc(struct intel_overlay *overlay,
830 struct intel_crtc *crtc)
832 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
837 /* can't use the overlay with double wide pipe */
838 if (INTEL_INFO(overlay->dev)->gen < 4 &&
839 (I915_READ(PIPECONF(crtc->pipe)) & (PIPECONF_DOUBLE_WIDE | PIPECONF_ENABLE)) != PIPECONF_ENABLE)
845 static void update_pfit_vscale_ratio(struct intel_overlay *overlay)
847 struct drm_device *dev = overlay->dev;
848 drm_i915_private_t *dev_priv = dev->dev_private;
849 u32 pfit_control = I915_READ(PFIT_CONTROL);
852 /* XXX: This is not the same logic as in the xorg driver, but more in
853 * line with the intel documentation for the i965
855 if (INTEL_INFO(dev)->gen >= 4) {
856 /* on i965 use the PGM reg to read out the autoscaler values */
857 ratio = I915_READ(PFIT_PGM_RATIOS) >> PFIT_VERT_SCALE_SHIFT_965;
859 if (pfit_control & VERT_AUTO_SCALE)
860 ratio = I915_READ(PFIT_AUTO_RATIOS);
862 ratio = I915_READ(PFIT_PGM_RATIOS);
863 ratio >>= PFIT_VERT_SCALE_SHIFT;
866 overlay->pfit_vscale_ratio = ratio;
869 static int check_overlay_dst(struct intel_overlay *overlay,
870 struct drm_intel_overlay_put_image *rec)
872 struct drm_display_mode *mode = &overlay->crtc->base.mode;
874 if (rec->dst_x < mode->hdisplay &&
875 rec->dst_x + rec->dst_width <= mode->hdisplay &&
876 rec->dst_y < mode->vdisplay &&
877 rec->dst_y + rec->dst_height <= mode->vdisplay)
883 static int check_overlay_scaling(struct put_image_params *rec)
887 /* downscaling limit is 8.0 */
888 tmp = ((rec->src_scan_h << 16) / rec->dst_h) >> 16;
891 tmp = ((rec->src_scan_w << 16) / rec->dst_w) >> 16;
898 static int check_overlay_src(struct drm_device *dev,
899 struct drm_intel_overlay_put_image *rec,
900 struct drm_i915_gem_object *new_bo)
902 int uv_hscale = uv_hsubsampling(rec->flags);
903 int uv_vscale = uv_vsubsampling(rec->flags);
908 /* check src dimensions */
909 if (IS_845G(dev) || IS_I830(dev)) {
910 if (rec->src_height > IMAGE_MAX_HEIGHT_LEGACY ||
911 rec->src_width > IMAGE_MAX_WIDTH_LEGACY)
914 if (rec->src_height > IMAGE_MAX_HEIGHT ||
915 rec->src_width > IMAGE_MAX_WIDTH)
919 /* better safe than sorry, use 4 as the maximal subsampling ratio */
920 if (rec->src_height < N_VERT_Y_TAPS*4 ||
921 rec->src_width < N_HORIZ_Y_TAPS*4)
924 /* check alignment constraints */
925 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
926 case I915_OVERLAY_RGB:
927 /* not implemented */
930 case I915_OVERLAY_YUV_PACKED:
934 depth = packed_depth_bytes(rec->flags);
938 /* ignore UV planes */
942 /* check pixel alignment */
943 if (rec->offset_Y % depth)
947 case I915_OVERLAY_YUV_PLANAR:
948 if (uv_vscale < 0 || uv_hscale < 0)
950 /* no offset restrictions for planar formats */
957 if (rec->src_width % uv_hscale)
960 /* stride checking */
961 if (IS_I830(dev) || IS_845G(dev))
966 if (rec->stride_Y & stride_mask || rec->stride_UV & stride_mask)
968 if (IS_GEN4(dev) && rec->stride_Y < 512)
971 tmp = (rec->flags & I915_OVERLAY_TYPE_MASK) == I915_OVERLAY_YUV_PLANAR ?
973 if (rec->stride_Y > tmp || rec->stride_UV > 2*1024)
976 /* check buffer dimensions */
977 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
978 case I915_OVERLAY_RGB:
979 case I915_OVERLAY_YUV_PACKED:
980 /* always 4 Y values per depth pixels */
981 if (packed_width_bytes(rec->flags, rec->src_width) > rec->stride_Y)
984 tmp = rec->stride_Y*rec->src_height;
985 if (rec->offset_Y + tmp > new_bo->base.size)
989 case I915_OVERLAY_YUV_PLANAR:
990 if (rec->src_width > rec->stride_Y)
992 if (rec->src_width/uv_hscale > rec->stride_UV)
995 tmp = rec->stride_Y * rec->src_height;
996 if (rec->offset_Y + tmp > new_bo->base.size)
999 tmp = rec->stride_UV * (rec->src_height / uv_vscale);
1000 if (rec->offset_U + tmp > new_bo->base.size ||
1001 rec->offset_V + tmp > new_bo->base.size)
1010 * Return the pipe currently connected to the panel fitter,
1011 * or -1 if the panel fitter is not present or not in use
1013 static int intel_panel_fitter_pipe(struct drm_device *dev)
1015 struct drm_i915_private *dev_priv = dev->dev_private;
1018 /* i830 doesn't have a panel fitter */
1022 pfit_control = I915_READ(PFIT_CONTROL);
1024 /* See if the panel fitter is in use */
1025 if ((pfit_control & PFIT_ENABLE) == 0)
1028 /* 965 can place panel fitter on either pipe */
1030 return (pfit_control >> 29) & 0x3;
1032 /* older chips can only use pipe 1 */
1036 int intel_overlay_put_image(struct drm_device *dev, void *data,
1037 struct drm_file *file_priv)
1039 struct drm_intel_overlay_put_image *put_image_rec = data;
1040 drm_i915_private_t *dev_priv = dev->dev_private;
1041 struct intel_overlay *overlay;
1042 struct drm_mode_object *drmmode_obj;
1043 struct intel_crtc *crtc;
1044 struct drm_i915_gem_object *new_bo;
1045 struct put_image_params *params;
1048 /* No need to check for DRIVER_MODESET - we don't set it up then. */
1049 overlay = dev_priv->overlay;
1051 DRM_DEBUG("userspace bug: no overlay\n");
1055 if (!(put_image_rec->flags & I915_OVERLAY_ENABLE)) {
1056 sx_xlock(&dev->mode_config.mutex);
1059 ret = intel_overlay_switch_off(overlay);
1062 sx_xunlock(&dev->mode_config.mutex);
1067 params = malloc(sizeof(struct put_image_params), DRM_I915_GEM, M_WAITOK);
1071 drmmode_obj = drm_mode_object_find(dev, put_image_rec->crtc_id,
1072 DRM_MODE_OBJECT_CRTC);
1077 crtc = to_intel_crtc(obj_to_crtc(drmmode_obj));
1079 new_bo = to_intel_bo(drm_gem_object_lookup(dev, file_priv,
1080 put_image_rec->bo_handle));
1081 if (&new_bo->base == NULL) {
1086 sx_xlock(&dev->mode_config.mutex);
1089 if (new_bo->tiling_mode) {
1090 DRM_ERROR("buffer used for overlay image can not be tiled\n");
1095 ret = intel_overlay_recover_from_interrupt(overlay);
1099 if (overlay->crtc != crtc) {
1100 struct drm_display_mode *mode = &crtc->base.mode;
1101 ret = intel_overlay_switch_off(overlay);
1105 ret = check_overlay_possible_on_crtc(overlay, crtc);
1109 overlay->crtc = crtc;
1110 crtc->overlay = overlay;
1112 /* line too wide, i.e. one-line-mode */
1113 if (mode->hdisplay > 1024 &&
1114 intel_panel_fitter_pipe(dev) == crtc->pipe) {
1115 overlay->pfit_active = 1;
1116 update_pfit_vscale_ratio(overlay);
1118 overlay->pfit_active = 0;
1121 ret = check_overlay_dst(overlay, put_image_rec);
1125 if (overlay->pfit_active) {
1126 params->dst_y = ((((u32)put_image_rec->dst_y) << 12) /
1127 overlay->pfit_vscale_ratio);
1128 /* shifting right rounds downwards, so add 1 */
1129 params->dst_h = ((((u32)put_image_rec->dst_height) << 12) /
1130 overlay->pfit_vscale_ratio) + 1;
1132 params->dst_y = put_image_rec->dst_y;
1133 params->dst_h = put_image_rec->dst_height;
1135 params->dst_x = put_image_rec->dst_x;
1136 params->dst_w = put_image_rec->dst_width;
1138 params->src_w = put_image_rec->src_width;
1139 params->src_h = put_image_rec->src_height;
1140 params->src_scan_w = put_image_rec->src_scan_width;
1141 params->src_scan_h = put_image_rec->src_scan_height;
1142 if (params->src_scan_h > params->src_h ||
1143 params->src_scan_w > params->src_w) {
1148 ret = check_overlay_src(dev, put_image_rec, new_bo);
1151 params->format = put_image_rec->flags & ~I915_OVERLAY_FLAGS_MASK;
1152 params->stride_Y = put_image_rec->stride_Y;
1153 params->stride_UV = put_image_rec->stride_UV;
1154 params->offset_Y = put_image_rec->offset_Y;
1155 params->offset_U = put_image_rec->offset_U;
1156 params->offset_V = put_image_rec->offset_V;
1158 /* Check scaling after src size to prevent a divide-by-zero. */
1159 ret = check_overlay_scaling(params);
1163 ret = intel_overlay_do_put_image(overlay, new_bo, params);
1168 sx_xunlock(&dev->mode_config.mutex);
1170 free(params, DRM_I915_GEM);
1176 sx_xunlock(&dev->mode_config.mutex);
1177 drm_gem_object_unreference_unlocked(&new_bo->base);
1179 free(params, DRM_I915_GEM);
1184 static void update_reg_attrs(struct intel_overlay *overlay,
1185 struct overlay_registers __iomem *regs)
1187 iowrite32((overlay->contrast << 18) | (overlay->brightness & 0xff),
1189 iowrite32(overlay->saturation, ®s->OCLRC1);
1192 static bool check_gamma_bounds(u32 gamma1, u32 gamma2)
1196 if (gamma1 & 0xff000000 || gamma2 & 0xff000000)
1199 for (i = 0; i < 3; i++) {
1200 if (((gamma1 >> i*8) & 0xff) >= ((gamma2 >> i*8) & 0xff))
1207 static bool check_gamma5_errata(u32 gamma5)
1211 for (i = 0; i < 3; i++) {
1212 if (((gamma5 >> i*8) & 0xff) == 0x80)
1219 static int check_gamma(struct drm_intel_overlay_attrs *attrs)
1221 if (!check_gamma_bounds(0, attrs->gamma0) ||
1222 !check_gamma_bounds(attrs->gamma0, attrs->gamma1) ||
1223 !check_gamma_bounds(attrs->gamma1, attrs->gamma2) ||
1224 !check_gamma_bounds(attrs->gamma2, attrs->gamma3) ||
1225 !check_gamma_bounds(attrs->gamma3, attrs->gamma4) ||
1226 !check_gamma_bounds(attrs->gamma4, attrs->gamma5) ||
1227 !check_gamma_bounds(attrs->gamma5, 0x00ffffff))
1230 if (!check_gamma5_errata(attrs->gamma5))
1236 int intel_overlay_attrs(struct drm_device *dev, void *data,
1237 struct drm_file *file_priv)
1239 struct drm_intel_overlay_attrs *attrs = data;
1240 drm_i915_private_t *dev_priv = dev->dev_private;
1241 struct intel_overlay *overlay;
1242 struct overlay_registers __iomem *regs;
1245 /* No need to check for DRIVER_MODESET - we don't set it up then. */
1246 overlay = dev_priv->overlay;
1248 DRM_DEBUG("userspace bug: no overlay\n");
1252 sx_xlock(&dev->mode_config.mutex);
1256 if (!(attrs->flags & I915_OVERLAY_UPDATE_ATTRS)) {
1257 attrs->color_key = overlay->color_key;
1258 attrs->brightness = overlay->brightness;
1259 attrs->contrast = overlay->contrast;
1260 attrs->saturation = overlay->saturation;
1262 if (!IS_GEN2(dev)) {
1263 attrs->gamma0 = I915_READ(OGAMC0);
1264 attrs->gamma1 = I915_READ(OGAMC1);
1265 attrs->gamma2 = I915_READ(OGAMC2);
1266 attrs->gamma3 = I915_READ(OGAMC3);
1267 attrs->gamma4 = I915_READ(OGAMC4);
1268 attrs->gamma5 = I915_READ(OGAMC5);
1271 if (attrs->brightness < -128 || attrs->brightness > 127)
1273 if (attrs->contrast > 255)
1275 if (attrs->saturation > 1023)
1278 overlay->color_key = attrs->color_key;
1279 overlay->brightness = attrs->brightness;
1280 overlay->contrast = attrs->contrast;
1281 overlay->saturation = attrs->saturation;
1283 regs = intel_overlay_map_regs(overlay);
1289 update_reg_attrs(overlay, regs);
1291 intel_overlay_unmap_regs(overlay, regs);
1293 if (attrs->flags & I915_OVERLAY_UPDATE_GAMMA) {
1297 if (overlay->active) {
1302 ret = check_gamma(attrs);
1306 I915_WRITE(OGAMC0, attrs->gamma0);
1307 I915_WRITE(OGAMC1, attrs->gamma1);
1308 I915_WRITE(OGAMC2, attrs->gamma2);
1309 I915_WRITE(OGAMC3, attrs->gamma3);
1310 I915_WRITE(OGAMC4, attrs->gamma4);
1311 I915_WRITE(OGAMC5, attrs->gamma5);
1318 sx_xunlock(&dev->mode_config.mutex);
1323 void intel_setup_overlay(struct drm_device *dev)
1325 drm_i915_private_t *dev_priv = dev->dev_private;
1326 struct intel_overlay *overlay;
1327 struct drm_i915_gem_object *reg_bo;
1328 struct overlay_registers __iomem *regs;
1331 if (!HAS_OVERLAY(dev))
1334 overlay = malloc(sizeof(struct intel_overlay), DRM_I915_GEM, M_WAITOK | M_ZERO);
1339 if (WARN_ON(dev_priv->overlay))
1344 reg_bo = i915_gem_alloc_object(dev, PAGE_SIZE);
1347 overlay->reg_bo = reg_bo;
1349 if (OVERLAY_NEEDS_PHYSICAL(dev)) {
1350 ret = i915_gem_attach_phys_object(dev, reg_bo,
1351 I915_GEM_PHYS_OVERLAY_REGS,
1354 DRM_ERROR("failed to attach phys overlay regs\n");
1357 overlay->flip_addr = reg_bo->phys_obj->handle->busaddr;
1359 ret = i915_gem_object_pin(reg_bo, PAGE_SIZE, true, false);
1361 DRM_ERROR("failed to pin overlay register bo\n");
1364 overlay->flip_addr = reg_bo->gtt_offset;
1366 ret = i915_gem_object_set_to_gtt_domain(reg_bo, true);
1368 DRM_ERROR("failed to move overlay register bo into the GTT\n");
1373 /* init all values */
1374 overlay->color_key = 0x0101fe;
1375 overlay->brightness = -19;
1376 overlay->contrast = 75;
1377 overlay->saturation = 146;
1379 regs = intel_overlay_map_regs(overlay);
1383 memset_io(regs, 0, sizeof(struct overlay_registers));
1384 update_polyphase_filter(regs);
1385 update_reg_attrs(overlay, regs);
1387 intel_overlay_unmap_regs(overlay, regs);
1389 dev_priv->overlay = overlay;
1391 DRM_INFO("initialized overlay support\n");
1395 if (!OVERLAY_NEEDS_PHYSICAL(dev))
1396 i915_gem_object_unpin(reg_bo);
1398 drm_gem_object_unreference(®_bo->base);
1401 free(overlay, DRM_I915_GEM);
1405 void intel_cleanup_overlay(struct drm_device *dev)
1407 drm_i915_private_t *dev_priv = dev->dev_private;
1409 if (!dev_priv->overlay)
1412 /* The bo's should be free'd by the generic code already.
1413 * Furthermore modesetting teardown happens beforehand so the
1414 * hardware should be off already */
1415 BUG_ON(dev_priv->overlay->active);
1417 drm_gem_object_unreference_unlocked(&dev_priv->overlay->reg_bo->base);
1418 free(dev_priv->overlay, DRM_I915_GEM);
1421 //#ifdef CONFIG_DEBUG_FS
1422 #define seq_printf(m, fmt, ...) sbuf_printf((m), (fmt), ##__VA_ARGS__)
1424 struct intel_overlay_error_state {
1425 struct overlay_registers regs;
1432 * NOTE Linux<->FreeBSD: We use the normal intel_overlay_map_regs() and
1433 * intel_overlay_unmap_regs() defined at the top of this file.
1436 struct intel_overlay_error_state *
1437 intel_overlay_capture_error_state(struct drm_device *dev)
1439 drm_i915_private_t *dev_priv = dev->dev_private;
1440 struct intel_overlay *overlay = dev_priv->overlay;
1441 struct intel_overlay_error_state *error;
1442 struct overlay_registers __iomem *regs;
1444 if (!overlay || !overlay->active)
1447 error = malloc(sizeof(*error), DRM_I915_GEM, M_NOWAIT);
1451 error->dovsta = I915_READ(DOVSTA);
1452 error->isr = I915_READ(ISR);
1453 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1454 error->base = (__force long)overlay->reg_bo->phys_obj->handle->vaddr;
1456 error->base = overlay->reg_bo->gtt_offset;
1458 regs = intel_overlay_map_regs(overlay);
1462 memcpy_fromio(&error->regs, regs, sizeof(struct overlay_registers));
1463 intel_overlay_unmap_regs(overlay, regs);
1468 free(error, DRM_I915_GEM);
1473 intel_overlay_print_error_state(struct sbuf *m, struct intel_overlay_error_state *error)
1475 seq_printf(m, "Overlay, status: 0x%08x, interrupt: 0x%08x\n",
1476 error->dovsta, error->isr);
1477 seq_printf(m, " Register file at 0x%08lx:\n",
1480 #define P(x) seq_printf(m, " " #x ": 0x%08x\n", error->regs.x)