]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - drivers/gpu/drm/i915/intel_overlay.c
drm/i915: Prevent stalling for a GTT read back from a read-only GPU target
[mirror_ubuntu-jammy-kernel.git] / drivers / gpu / drm / i915 / intel_overlay.c
CommitLineData
02e792fb
DV
1/*
2 * Copyright © 2009
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 * SOFTWARE.
22 *
23 * Authors:
24 * Daniel Vetter <daniel@ffwll.ch>
25 *
26 * Derived from Xorg ddx, xf86-video-intel, src/i830_video.c
27 */
e167976e
AM
28
29#include <linux/seq_file.h>
02e792fb
DV
30#include "drmP.h"
31#include "drm.h"
32#include "i915_drm.h"
33#include "i915_drv.h"
34#include "i915_reg.h"
35#include "intel_drv.h"
36
37/* Limits for overlay size. According to intel doc, the real limits are:
38 * Y width: 4095, UV width (planar): 2047, Y height: 2047,
39 * UV width (planar): * 1023. But the xorg thinks 2048 for height and width. Use
40 * the mininum of both. */
41#define IMAGE_MAX_WIDTH 2048
42#define IMAGE_MAX_HEIGHT 2046 /* 2 * 1023 */
43/* on 830 and 845 these large limits result in the card hanging */
44#define IMAGE_MAX_WIDTH_LEGACY 1024
45#define IMAGE_MAX_HEIGHT_LEGACY 1088
46
47/* overlay register definitions */
48/* OCMD register */
49#define OCMD_TILED_SURFACE (0x1<<19)
50#define OCMD_MIRROR_MASK (0x3<<17)
51#define OCMD_MIRROR_MODE (0x3<<17)
52#define OCMD_MIRROR_HORIZONTAL (0x1<<17)
53#define OCMD_MIRROR_VERTICAL (0x2<<17)
54#define OCMD_MIRROR_BOTH (0x3<<17)
55#define OCMD_BYTEORDER_MASK (0x3<<14) /* zero for YUYV or FOURCC YUY2 */
56#define OCMD_UV_SWAP (0x1<<14) /* YVYU */
57#define OCMD_Y_SWAP (0x2<<14) /* UYVY or FOURCC UYVY */
58#define OCMD_Y_AND_UV_SWAP (0x3<<14) /* VYUY */
59#define OCMD_SOURCE_FORMAT_MASK (0xf<<10)
60#define OCMD_RGB_888 (0x1<<10) /* not in i965 Intel docs */
61#define OCMD_RGB_555 (0x2<<10) /* not in i965 Intel docs */
62#define OCMD_RGB_565 (0x3<<10) /* not in i965 Intel docs */
63#define OCMD_YUV_422_PACKED (0x8<<10)
64#define OCMD_YUV_411_PACKED (0x9<<10) /* not in i965 Intel docs */
65#define OCMD_YUV_420_PLANAR (0xc<<10)
66#define OCMD_YUV_422_PLANAR (0xd<<10)
67#define OCMD_YUV_410_PLANAR (0xe<<10) /* also 411 */
68#define OCMD_TVSYNCFLIP_PARITY (0x1<<9)
69#define OCMD_TVSYNCFLIP_ENABLE (0x1<<7)
d7961364 70#define OCMD_BUF_TYPE_MASK (0x1<<5)
02e792fb
DV
71#define OCMD_BUF_TYPE_FRAME (0x0<<5)
72#define OCMD_BUF_TYPE_FIELD (0x1<<5)
73#define OCMD_TEST_MODE (0x1<<4)
74#define OCMD_BUFFER_SELECT (0x3<<2)
75#define OCMD_BUFFER0 (0x0<<2)
76#define OCMD_BUFFER1 (0x1<<2)
77#define OCMD_FIELD_SELECT (0x1<<2)
78#define OCMD_FIELD0 (0x0<<1)
79#define OCMD_FIELD1 (0x1<<1)
80#define OCMD_ENABLE (0x1<<0)
81
82/* OCONFIG register */
83#define OCONF_PIPE_MASK (0x1<<18)
84#define OCONF_PIPE_A (0x0<<18)
85#define OCONF_PIPE_B (0x1<<18)
86#define OCONF_GAMMA2_ENABLE (0x1<<16)
87#define OCONF_CSC_MODE_BT601 (0x0<<5)
88#define OCONF_CSC_MODE_BT709 (0x1<<5)
89#define OCONF_CSC_BYPASS (0x1<<4)
90#define OCONF_CC_OUT_8BIT (0x1<<3)
91#define OCONF_TEST_MODE (0x1<<2)
92#define OCONF_THREE_LINE_BUFFER (0x1<<0)
93#define OCONF_TWO_LINE_BUFFER (0x0<<0)
94
95/* DCLRKM (dst-key) register */
96#define DST_KEY_ENABLE (0x1<<31)
97#define CLK_RGB24_MASK 0x0
98#define CLK_RGB16_MASK 0x070307
99#define CLK_RGB15_MASK 0x070707
100#define CLK_RGB8I_MASK 0xffffff
101
102#define RGB16_TO_COLORKEY(c) \
103 (((c & 0xF800) << 8) | ((c & 0x07E0) << 5) | ((c & 0x001F) << 3))
104#define RGB15_TO_COLORKEY(c) \
105 (((c & 0x7c00) << 9) | ((c & 0x03E0) << 6) | ((c & 0x001F) << 3))
106
107/* overlay flip addr flag */
108#define OFC_UPDATE 0x1
109
110/* polyphase filter coefficients */
111#define N_HORIZ_Y_TAPS 5
112#define N_VERT_Y_TAPS 3
113#define N_HORIZ_UV_TAPS 3
114#define N_VERT_UV_TAPS 3
115#define N_PHASES 17
116#define MAX_TAPS 5
117
118/* memory bufferd overlay registers */
119struct overlay_registers {
120 u32 OBUF_0Y;
121 u32 OBUF_1Y;
122 u32 OBUF_0U;
123 u32 OBUF_0V;
124 u32 OBUF_1U;
125 u32 OBUF_1V;
126 u32 OSTRIDE;
127 u32 YRGB_VPH;
128 u32 UV_VPH;
129 u32 HORZ_PH;
130 u32 INIT_PHS;
131 u32 DWINPOS;
132 u32 DWINSZ;
133 u32 SWIDTH;
134 u32 SWIDTHSW;
135 u32 SHEIGHT;
136 u32 YRGBSCALE;
137 u32 UVSCALE;
138 u32 OCLRC0;
139 u32 OCLRC1;
140 u32 DCLRKV;
141 u32 DCLRKM;
142 u32 SCLRKVH;
143 u32 SCLRKVL;
144 u32 SCLRKEN;
145 u32 OCONFIG;
146 u32 OCMD;
147 u32 RESERVED1; /* 0x6C */
148 u32 OSTART_0Y;
149 u32 OSTART_1Y;
150 u32 OSTART_0U;
151 u32 OSTART_0V;
152 u32 OSTART_1U;
153 u32 OSTART_1V;
154 u32 OTILEOFF_0Y;
155 u32 OTILEOFF_1Y;
156 u32 OTILEOFF_0U;
157 u32 OTILEOFF_0V;
158 u32 OTILEOFF_1U;
159 u32 OTILEOFF_1V;
160 u32 FASTHSCALE; /* 0xA0 */
161 u32 UVSCALEV; /* 0xA4 */
162 u32 RESERVEDC[(0x200 - 0xA8) / 4]; /* 0xA8 - 0x1FC */
163 u16 Y_VCOEFS[N_VERT_Y_TAPS * N_PHASES]; /* 0x200 */
164 u16 RESERVEDD[0x100 / 2 - N_VERT_Y_TAPS * N_PHASES];
165 u16 Y_HCOEFS[N_HORIZ_Y_TAPS * N_PHASES]; /* 0x300 */
166 u16 RESERVEDE[0x200 / 2 - N_HORIZ_Y_TAPS * N_PHASES];
167 u16 UV_VCOEFS[N_VERT_UV_TAPS * N_PHASES]; /* 0x500 */
168 u16 RESERVEDF[0x100 / 2 - N_VERT_UV_TAPS * N_PHASES];
169 u16 UV_HCOEFS[N_HORIZ_UV_TAPS * N_PHASES]; /* 0x600 */
170 u16 RESERVEDG[0x100 / 2 - N_HORIZ_UV_TAPS * N_PHASES];
171};
172
23f09ce3
CW
173struct intel_overlay {
174 struct drm_device *dev;
175 struct intel_crtc *crtc;
176 struct drm_i915_gem_object *vid_bo;
177 struct drm_i915_gem_object *old_vid_bo;
178 int active;
179 int pfit_active;
180 u32 pfit_vscale_ratio; /* shifted-point number, (1<<12) == 1.0 */
181 u32 color_key;
182 u32 brightness, contrast, saturation;
183 u32 old_xscale, old_yscale;
184 /* register access */
185 u32 flip_addr;
186 struct drm_i915_gem_object *reg_bo;
187 /* flip handling */
188 uint32_t last_flip_req;
b303cf95 189 void (*flip_tail)(struct intel_overlay *);
23f09ce3 190};
02e792fb 191
8d74f656
CW
192static struct overlay_registers *
193intel_overlay_map_regs(struct intel_overlay *overlay)
02e792fb
DV
194{
195 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
196 struct overlay_registers *regs;
197
9bb2ff73 198 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
8d74f656 199 regs = overlay->reg_bo->phys_obj->handle->vaddr;
9bb2ff73 200 else
8d74f656
CW
201 regs = io_mapping_map_wc(dev_priv->mm.gtt_mapping,
202 overlay->reg_bo->gtt_offset);
02e792fb 203
9bb2ff73 204 return regs;
8d74f656 205}
02e792fb 206
9bb2ff73
CW
207static void intel_overlay_unmap_regs(struct intel_overlay *overlay,
208 struct overlay_registers *regs)
8d74f656
CW
209{
210 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
9bb2ff73 211 io_mapping_unmap(regs);
02e792fb
DV
212}
213
b6c028e0 214static int intel_overlay_do_wait_request(struct intel_overlay *overlay,
8dc5d147 215 struct drm_i915_gem_request *request,
b6c028e0 216 bool interruptible,
b303cf95 217 void (*tail)(struct intel_overlay *))
02e792fb
DV
218{
219 struct drm_device *dev = overlay->dev;
852835f3 220 drm_i915_private_t *dev_priv = dev->dev_private;
b6c028e0 221 int ret;
02e792fb 222
b303cf95 223 BUG_ON(overlay->last_flip_req);
3cce469c
CW
224 ret = i915_add_request(dev, NULL, request, &dev_priv->render_ring);
225 if (ret) {
226 kfree(request);
227 return ret;
228 }
229 overlay->last_flip_req = request->seqno;
b303cf95 230 overlay->flip_tail = tail;
852835f3 231 ret = i915_do_wait_request(dev,
722506f0
CW
232 overlay->last_flip_req, true,
233 &dev_priv->render_ring);
b6c028e0 234 if (ret)
03f77ea5 235 return ret;
02e792fb 236
03f77ea5 237 overlay->last_flip_req = 0;
02e792fb 238 return 0;
02e792fb
DV
239}
240
106dadac
CW
241/* Workaround for i830 bug where pipe a must be enable to change control regs */
242static int
243i830_activate_pipe_a(struct drm_device *dev)
02e792fb 244{
106dadac
CW
245 drm_i915_private_t *dev_priv = dev->dev_private;
246 struct intel_crtc *crtc;
247 struct drm_crtc_helper_funcs *crtc_funcs;
248 struct drm_display_mode vesa_640x480 = {
249 DRM_MODE("640x480", DRM_MODE_TYPE_DRIVER, 25175, 640, 656,
250 752, 800, 0, 480, 489, 492, 525, 0,
251 DRM_MODE_FLAG_NHSYNC | DRM_MODE_FLAG_NVSYNC)
252 }, *mode;
253
254 crtc = to_intel_crtc(dev_priv->pipe_to_crtc_mapping[0]);
255 if (crtc->dpms_mode == DRM_MODE_DPMS_ON)
256 return 0;
02e792fb 257
106dadac 258 /* most i8xx have pipe a forced on, so don't trust dpms mode */
5eddb70b 259 if (I915_READ(PIPEACONF) & PIPECONF_ENABLE)
106dadac 260 return 0;
02e792fb 261
106dadac
CW
262 crtc_funcs = crtc->base.helper_private;
263 if (crtc_funcs->dpms == NULL)
264 return 0;
265
266 DRM_DEBUG_DRIVER("Enabling pipe A in order to enable overlay\n");
267
268 mode = drm_mode_duplicate(dev, &vesa_640x480);
269 drm_mode_set_crtcinfo(mode, CRTC_INTERLACE_HALVE_V);
270 if(!drm_crtc_helper_set_mode(&crtc->base, mode,
271 crtc->base.x, crtc->base.y,
272 crtc->base.fb))
273 return 0;
274
275 crtc_funcs->dpms(&crtc->base, DRM_MODE_DPMS_ON);
276 return 1;
277}
278
279static void
280i830_deactivate_pipe_a(struct drm_device *dev)
281{
282 drm_i915_private_t *dev_priv = dev->dev_private;
283 struct drm_crtc *crtc = dev_priv->pipe_to_crtc_mapping[0];
284 struct drm_crtc_helper_funcs *crtc_funcs = crtc->helper_private;
285
286 crtc_funcs->dpms(crtc, DRM_MODE_DPMS_OFF);
02e792fb
DV
287}
288
289/* overlay needs to be disable in OCMD reg */
290static int intel_overlay_on(struct intel_overlay *overlay)
291{
292 struct drm_device *dev = overlay->dev;
e1f99ce6 293 struct drm_i915_private *dev_priv = dev->dev_private;
8dc5d147 294 struct drm_i915_gem_request *request;
106dadac 295 int pipe_a_quirk = 0;
02e792fb 296 int ret;
02e792fb
DV
297
298 BUG_ON(overlay->active);
03f77ea5 299 overlay->active = 1;
b6c028e0 300
106dadac
CW
301 if (IS_I830(dev)) {
302 pipe_a_quirk = i830_activate_pipe_a(dev);
303 if (pipe_a_quirk < 0)
304 return pipe_a_quirk;
305 }
306
8dc5d147 307 request = kzalloc(sizeof(*request), GFP_KERNEL);
106dadac
CW
308 if (request == NULL) {
309 ret = -ENOMEM;
310 goto out;
311 }
03f77ea5 312
e1f99ce6
CW
313 ret = BEGIN_LP_RING(4);
314 if (ret) {
315 kfree(request);
316 goto out;
317 }
318
02e792fb
DV
319 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_ON);
320 OUT_RING(overlay->flip_addr | OFC_UPDATE);
321 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
322 OUT_RING(MI_NOOP);
323 ADVANCE_LP_RING();
324
b303cf95 325 ret = intel_overlay_do_wait_request(overlay, request, true, NULL);
106dadac
CW
326out:
327 if (pipe_a_quirk)
328 i830_deactivate_pipe_a(dev);
02e792fb 329
106dadac 330 return ret;
02e792fb
DV
331}
332
333/* overlay needs to be enabled in OCMD reg */
8dc5d147
CW
334static int intel_overlay_continue(struct intel_overlay *overlay,
335 bool load_polyphase_filter)
02e792fb
DV
336{
337 struct drm_device *dev = overlay->dev;
338 drm_i915_private_t *dev_priv = dev->dev_private;
8dc5d147 339 struct drm_i915_gem_request *request;
02e792fb
DV
340 u32 flip_addr = overlay->flip_addr;
341 u32 tmp;
e1f99ce6 342 int ret;
02e792fb
DV
343
344 BUG_ON(!overlay->active);
345
8dc5d147
CW
346 request = kzalloc(sizeof(*request), GFP_KERNEL);
347 if (request == NULL)
348 return -ENOMEM;
349
02e792fb
DV
350 if (load_polyphase_filter)
351 flip_addr |= OFC_UPDATE;
352
353 /* check for underruns */
354 tmp = I915_READ(DOVSTA);
355 if (tmp & (1 << 17))
356 DRM_DEBUG("overlay underrun, DOVSTA: %x\n", tmp);
357
e1f99ce6
CW
358 ret = BEGIN_LP_RING(2);
359 if (ret) {
360 kfree(request);
361 return ret;
362 }
02e792fb
DV
363 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
364 OUT_RING(flip_addr);
5a5a0c64
DV
365 ADVANCE_LP_RING();
366
3cce469c
CW
367 ret = i915_add_request(dev, NULL, request, &dev_priv->render_ring);
368 if (ret) {
369 kfree(request);
370 return ret;
371 }
372
373 overlay->last_flip_req = request->seqno;
8dc5d147 374 return 0;
5a5a0c64
DV
375}
376
b303cf95 377static void intel_overlay_release_old_vid_tail(struct intel_overlay *overlay)
5a5a0c64 378{
05394f39 379 struct drm_i915_gem_object *obj = overlay->old_vid_bo;
5a5a0c64 380
b303cf95 381 i915_gem_object_unpin(obj);
05394f39 382 drm_gem_object_unreference(&obj->base);
5a5a0c64 383
b303cf95
CW
384 overlay->old_vid_bo = NULL;
385}
03f77ea5 386
b303cf95
CW
387static void intel_overlay_off_tail(struct intel_overlay *overlay)
388{
05394f39 389 struct drm_i915_gem_object *obj = overlay->vid_bo;
02e792fb 390
b303cf95
CW
391 /* never have the overlay hw on without showing a frame */
392 BUG_ON(!overlay->vid_bo);
02e792fb 393
b303cf95 394 i915_gem_object_unpin(obj);
05394f39 395 drm_gem_object_unreference(&obj->base);
b303cf95 396 overlay->vid_bo = NULL;
03f77ea5 397
b303cf95
CW
398 overlay->crtc->overlay = NULL;
399 overlay->crtc = NULL;
400 overlay->active = 0;
02e792fb
DV
401}
402
403/* overlay needs to be disabled in OCMD reg */
5dcdbcb0
CW
404static int intel_overlay_off(struct intel_overlay *overlay,
405 bool interruptible)
02e792fb 406{
02e792fb 407 struct drm_device *dev = overlay->dev;
e1f99ce6 408 struct drm_i915_private *dev_priv = dev->dev_private;
8dc5d147
CW
409 u32 flip_addr = overlay->flip_addr;
410 struct drm_i915_gem_request *request;
e1f99ce6 411 int ret;
02e792fb
DV
412
413 BUG_ON(!overlay->active);
414
8dc5d147
CW
415 request = kzalloc(sizeof(*request), GFP_KERNEL);
416 if (request == NULL)
417 return -ENOMEM;
418
02e792fb
DV
419 /* According to intel docs the overlay hw may hang (when switching
420 * off) without loading the filter coeffs. It is however unclear whether
421 * this applies to the disabling of the overlay or to the switching off
422 * of the hw. Do it in both cases */
423 flip_addr |= OFC_UPDATE;
424
e1f99ce6
CW
425 ret = BEGIN_LP_RING(6);
426 if (ret) {
427 kfree(request);
428 return ret;
429 }
02e792fb 430 /* wait for overlay to go idle */
02e792fb
DV
431 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_CONTINUE);
432 OUT_RING(flip_addr);
722506f0 433 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
02e792fb 434 /* turn overlay off */
722506f0 435 OUT_RING(MI_OVERLAY_FLIP | MI_OVERLAY_OFF);
02e792fb 436 OUT_RING(flip_addr);
722506f0 437 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
02e792fb
DV
438 ADVANCE_LP_RING();
439
5dcdbcb0 440 return intel_overlay_do_wait_request(overlay, request, interruptible,
b303cf95 441 intel_overlay_off_tail);
12ca45fe
DV
442}
443
03f77ea5
DV
444/* recover from an interruption due to a signal
445 * We have to be careful not to repeat work forever an make forward progess. */
5dcdbcb0
CW
446static int intel_overlay_recover_from_interrupt(struct intel_overlay *overlay,
447 bool interruptible)
03f77ea5
DV
448{
449 struct drm_device *dev = overlay->dev;
852835f3 450 drm_i915_private_t *dev_priv = dev->dev_private;
03f77ea5 451 int ret;
03f77ea5 452
b303cf95
CW
453 if (overlay->last_flip_req == 0)
454 return 0;
03f77ea5 455
852835f3 456 ret = i915_do_wait_request(dev, overlay->last_flip_req,
722506f0 457 interruptible, &dev_priv->render_ring);
b6c028e0 458 if (ret)
03f77ea5
DV
459 return ret;
460
b303cf95
CW
461 if (overlay->flip_tail)
462 overlay->flip_tail(overlay);
03f77ea5 463
03f77ea5
DV
464 overlay->last_flip_req = 0;
465 return 0;
466}
467
5a5a0c64
DV
468/* Wait for pending overlay flip and release old frame.
469 * Needs to be called before the overlay register are changed
8d74f656
CW
470 * via intel_overlay_(un)map_regs
471 */
02e792fb
DV
472static int intel_overlay_release_old_vid(struct intel_overlay *overlay)
473{
5cd68c98
CW
474 struct drm_device *dev = overlay->dev;
475 drm_i915_private_t *dev_priv = dev->dev_private;
02e792fb 476 int ret;
02e792fb 477
5cd68c98
CW
478 /* Only wait if there is actually an old frame to release to
479 * guarantee forward progress.
480 */
03f77ea5
DV
481 if (!overlay->old_vid_bo)
482 return 0;
483
5cd68c98 484 if (I915_READ(ISR) & I915_OVERLAY_PLANE_FLIP_PENDING_INTERRUPT) {
8dc5d147 485 struct drm_i915_gem_request *request;
02e792fb 486
5cd68c98 487 /* synchronous slowpath */
8dc5d147
CW
488 request = kzalloc(sizeof(*request), GFP_KERNEL);
489 if (request == NULL)
490 return -ENOMEM;
02e792fb 491
e1f99ce6
CW
492 ret = BEGIN_LP_RING(2);
493 if (ret) {
494 kfree(request);
495 return ret;
496 }
497
5cd68c98
CW
498 OUT_RING(MI_WAIT_FOR_EVENT | MI_WAIT_FOR_OVERLAY_FLIP);
499 OUT_RING(MI_NOOP);
500 ADVANCE_LP_RING();
501
8dc5d147 502 ret = intel_overlay_do_wait_request(overlay, request, true,
b303cf95 503 intel_overlay_release_old_vid_tail);
5cd68c98
CW
504 if (ret)
505 return ret;
506 }
02e792fb 507
5cd68c98 508 intel_overlay_release_old_vid_tail(overlay);
02e792fb
DV
509 return 0;
510}
511
512struct put_image_params {
513 int format;
514 short dst_x;
515 short dst_y;
516 short dst_w;
517 short dst_h;
518 short src_w;
519 short src_scan_h;
520 short src_scan_w;
521 short src_h;
522 short stride_Y;
523 short stride_UV;
524 int offset_Y;
525 int offset_U;
526 int offset_V;
527};
528
529static int packed_depth_bytes(u32 format)
530{
531 switch (format & I915_OVERLAY_DEPTH_MASK) {
722506f0
CW
532 case I915_OVERLAY_YUV422:
533 return 4;
534 case I915_OVERLAY_YUV411:
535 /* return 6; not implemented */
536 default:
537 return -EINVAL;
02e792fb
DV
538 }
539}
540
541static int packed_width_bytes(u32 format, short width)
542{
543 switch (format & I915_OVERLAY_DEPTH_MASK) {
722506f0
CW
544 case I915_OVERLAY_YUV422:
545 return width << 1;
546 default:
547 return -EINVAL;
02e792fb
DV
548 }
549}
550
551static int uv_hsubsampling(u32 format)
552{
553 switch (format & I915_OVERLAY_DEPTH_MASK) {
722506f0
CW
554 case I915_OVERLAY_YUV422:
555 case I915_OVERLAY_YUV420:
556 return 2;
557 case I915_OVERLAY_YUV411:
558 case I915_OVERLAY_YUV410:
559 return 4;
560 default:
561 return -EINVAL;
02e792fb
DV
562 }
563}
564
565static int uv_vsubsampling(u32 format)
566{
567 switch (format & I915_OVERLAY_DEPTH_MASK) {
722506f0
CW
568 case I915_OVERLAY_YUV420:
569 case I915_OVERLAY_YUV410:
570 return 2;
571 case I915_OVERLAY_YUV422:
572 case I915_OVERLAY_YUV411:
573 return 1;
574 default:
575 return -EINVAL;
02e792fb
DV
576 }
577}
578
579static u32 calc_swidthsw(struct drm_device *dev, u32 offset, u32 width)
580{
581 u32 mask, shift, ret;
a6c45cf0 582 if (IS_GEN2(dev)) {
02e792fb
DV
583 mask = 0x1f;
584 shift = 5;
a6c45cf0
CW
585 } else {
586 mask = 0x3f;
587 shift = 6;
02e792fb
DV
588 }
589 ret = ((offset + width + mask) >> shift) - (offset >> shift);
a6c45cf0 590 if (!IS_GEN2(dev))
02e792fb
DV
591 ret <<= 1;
592 ret -=1;
593 return ret << 2;
594}
595
596static const u16 y_static_hcoeffs[N_HORIZ_Y_TAPS * N_PHASES] = {
597 0x3000, 0xb4a0, 0x1930, 0x1920, 0xb4a0,
598 0x3000, 0xb500, 0x19d0, 0x1880, 0xb440,
599 0x3000, 0xb540, 0x1a88, 0x2f80, 0xb3e0,
600 0x3000, 0xb580, 0x1b30, 0x2e20, 0xb380,
601 0x3000, 0xb5c0, 0x1bd8, 0x2cc0, 0xb320,
602 0x3020, 0xb5e0, 0x1c60, 0x2b80, 0xb2c0,
603 0x3020, 0xb5e0, 0x1cf8, 0x2a20, 0xb260,
604 0x3020, 0xb5e0, 0x1d80, 0x28e0, 0xb200,
605 0x3020, 0xb5c0, 0x1e08, 0x3f40, 0xb1c0,
606 0x3020, 0xb580, 0x1e78, 0x3ce0, 0xb160,
607 0x3040, 0xb520, 0x1ed8, 0x3aa0, 0xb120,
608 0x3040, 0xb4a0, 0x1f30, 0x3880, 0xb0e0,
609 0x3040, 0xb400, 0x1f78, 0x3680, 0xb0a0,
610 0x3020, 0xb340, 0x1fb8, 0x34a0, 0xb060,
611 0x3020, 0xb240, 0x1fe0, 0x32e0, 0xb040,
612 0x3020, 0xb140, 0x1ff8, 0x3160, 0xb020,
722506f0
CW
613 0xb000, 0x3000, 0x0800, 0x3000, 0xb000
614};
615
02e792fb
DV
616static const u16 uv_static_hcoeffs[N_HORIZ_UV_TAPS * N_PHASES] = {
617 0x3000, 0x1800, 0x1800, 0xb000, 0x18d0, 0x2e60,
618 0xb000, 0x1990, 0x2ce0, 0xb020, 0x1a68, 0x2b40,
619 0xb040, 0x1b20, 0x29e0, 0xb060, 0x1bd8, 0x2880,
620 0xb080, 0x1c88, 0x3e60, 0xb0a0, 0x1d28, 0x3c00,
621 0xb0c0, 0x1db8, 0x39e0, 0xb0e0, 0x1e40, 0x37e0,
622 0xb100, 0x1eb8, 0x3620, 0xb100, 0x1f18, 0x34a0,
623 0xb100, 0x1f68, 0x3360, 0xb0e0, 0x1fa8, 0x3240,
624 0xb0c0, 0x1fe0, 0x3140, 0xb060, 0x1ff0, 0x30a0,
722506f0
CW
625 0x3000, 0x0800, 0x3000
626};
02e792fb
DV
627
628static void update_polyphase_filter(struct overlay_registers *regs)
629{
630 memcpy(regs->Y_HCOEFS, y_static_hcoeffs, sizeof(y_static_hcoeffs));
631 memcpy(regs->UV_HCOEFS, uv_static_hcoeffs, sizeof(uv_static_hcoeffs));
632}
633
634static bool update_scaling_factors(struct intel_overlay *overlay,
635 struct overlay_registers *regs,
636 struct put_image_params *params)
637{
638 /* fixed point with a 12 bit shift */
639 u32 xscale, yscale, xscale_UV, yscale_UV;
640#define FP_SHIFT 12
641#define FRACT_MASK 0xfff
642 bool scale_changed = false;
643 int uv_hscale = uv_hsubsampling(params->format);
644 int uv_vscale = uv_vsubsampling(params->format);
645
646 if (params->dst_w > 1)
647 xscale = ((params->src_scan_w - 1) << FP_SHIFT)
648 /(params->dst_w);
649 else
650 xscale = 1 << FP_SHIFT;
651
652 if (params->dst_h > 1)
653 yscale = ((params->src_scan_h - 1) << FP_SHIFT)
654 /(params->dst_h);
655 else
656 yscale = 1 << FP_SHIFT;
657
658 /*if (params->format & I915_OVERLAY_YUV_PLANAR) {*/
722506f0
CW
659 xscale_UV = xscale/uv_hscale;
660 yscale_UV = yscale/uv_vscale;
661 /* make the Y scale to UV scale ratio an exact multiply */
662 xscale = xscale_UV * uv_hscale;
663 yscale = yscale_UV * uv_vscale;
02e792fb 664 /*} else {
722506f0
CW
665 xscale_UV = 0;
666 yscale_UV = 0;
667 }*/
02e792fb
DV
668
669 if (xscale != overlay->old_xscale || yscale != overlay->old_yscale)
670 scale_changed = true;
671 overlay->old_xscale = xscale;
672 overlay->old_yscale = yscale;
673
722506f0
CW
674 regs->YRGBSCALE = (((yscale & FRACT_MASK) << 20) |
675 ((xscale >> FP_SHIFT) << 16) |
676 ((xscale & FRACT_MASK) << 3));
677
678 regs->UVSCALE = (((yscale_UV & FRACT_MASK) << 20) |
679 ((xscale_UV >> FP_SHIFT) << 16) |
680 ((xscale_UV & FRACT_MASK) << 3));
681
682 regs->UVSCALEV = ((((yscale >> FP_SHIFT) << 16) |
683 ((yscale_UV >> FP_SHIFT) << 0)));
02e792fb
DV
684
685 if (scale_changed)
686 update_polyphase_filter(regs);
687
688 return scale_changed;
689}
690
691static void update_colorkey(struct intel_overlay *overlay,
692 struct overlay_registers *regs)
693{
694 u32 key = overlay->color_key;
6ba3ddd9 695
02e792fb 696 switch (overlay->crtc->base.fb->bits_per_pixel) {
722506f0
CW
697 case 8:
698 regs->DCLRKV = 0;
699 regs->DCLRKM = CLK_RGB8I_MASK | DST_KEY_ENABLE;
6ba3ddd9
CW
700 break;
701
722506f0
CW
702 case 16:
703 if (overlay->crtc->base.fb->depth == 15) {
704 regs->DCLRKV = RGB15_TO_COLORKEY(key);
705 regs->DCLRKM = CLK_RGB15_MASK | DST_KEY_ENABLE;
706 } else {
707 regs->DCLRKV = RGB16_TO_COLORKEY(key);
708 regs->DCLRKM = CLK_RGB16_MASK | DST_KEY_ENABLE;
709 }
6ba3ddd9
CW
710 break;
711
722506f0
CW
712 case 24:
713 case 32:
714 regs->DCLRKV = key;
715 regs->DCLRKM = CLK_RGB24_MASK | DST_KEY_ENABLE;
6ba3ddd9 716 break;
02e792fb
DV
717 }
718}
719
720static u32 overlay_cmd_reg(struct put_image_params *params)
721{
722 u32 cmd = OCMD_ENABLE | OCMD_BUF_TYPE_FRAME | OCMD_BUFFER0;
723
724 if (params->format & I915_OVERLAY_YUV_PLANAR) {
725 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
722506f0
CW
726 case I915_OVERLAY_YUV422:
727 cmd |= OCMD_YUV_422_PLANAR;
728 break;
729 case I915_OVERLAY_YUV420:
730 cmd |= OCMD_YUV_420_PLANAR;
731 break;
732 case I915_OVERLAY_YUV411:
733 case I915_OVERLAY_YUV410:
734 cmd |= OCMD_YUV_410_PLANAR;
735 break;
02e792fb
DV
736 }
737 } else { /* YUV packed */
738 switch (params->format & I915_OVERLAY_DEPTH_MASK) {
722506f0
CW
739 case I915_OVERLAY_YUV422:
740 cmd |= OCMD_YUV_422_PACKED;
741 break;
742 case I915_OVERLAY_YUV411:
743 cmd |= OCMD_YUV_411_PACKED;
744 break;
02e792fb
DV
745 }
746
747 switch (params->format & I915_OVERLAY_SWAP_MASK) {
722506f0
CW
748 case I915_OVERLAY_NO_SWAP:
749 break;
750 case I915_OVERLAY_UV_SWAP:
751 cmd |= OCMD_UV_SWAP;
752 break;
753 case I915_OVERLAY_Y_SWAP:
754 cmd |= OCMD_Y_SWAP;
755 break;
756 case I915_OVERLAY_Y_AND_UV_SWAP:
757 cmd |= OCMD_Y_AND_UV_SWAP;
758 break;
02e792fb
DV
759 }
760 }
761
762 return cmd;
763}
764
5fe82c5e 765static int intel_overlay_do_put_image(struct intel_overlay *overlay,
05394f39 766 struct drm_i915_gem_object *new_bo,
5fe82c5e 767 struct put_image_params *params)
02e792fb
DV
768{
769 int ret, tmp_width;
770 struct overlay_registers *regs;
771 bool scale_changed = false;
02e792fb
DV
772 struct drm_device *dev = overlay->dev;
773
774 BUG_ON(!mutex_is_locked(&dev->struct_mutex));
775 BUG_ON(!mutex_is_locked(&dev->mode_config.mutex));
776 BUG_ON(!overlay);
777
02e792fb
DV
778 ret = intel_overlay_release_old_vid(overlay);
779 if (ret != 0)
780 return ret;
781
75e9e915 782 ret = i915_gem_object_pin(new_bo, PAGE_SIZE, true);
02e792fb
DV
783 if (ret != 0)
784 return ret;
785
786 ret = i915_gem_object_set_to_gtt_domain(new_bo, 0);
787 if (ret != 0)
788 goto out_unpin;
789
790 if (!overlay->active) {
8d74f656 791 regs = intel_overlay_map_regs(overlay);
02e792fb
DV
792 if (!regs) {
793 ret = -ENOMEM;
794 goto out_unpin;
795 }
796 regs->OCONFIG = OCONF_CC_OUT_8BIT;
a6c45cf0 797 if (IS_GEN4(overlay->dev))
02e792fb
DV
798 regs->OCONFIG |= OCONF_CSC_MODE_BT709;
799 regs->OCONFIG |= overlay->crtc->pipe == 0 ?
800 OCONF_PIPE_A : OCONF_PIPE_B;
9bb2ff73 801 intel_overlay_unmap_regs(overlay, regs);
02e792fb
DV
802
803 ret = intel_overlay_on(overlay);
804 if (ret != 0)
805 goto out_unpin;
806 }
807
8d74f656 808 regs = intel_overlay_map_regs(overlay);
02e792fb
DV
809 if (!regs) {
810 ret = -ENOMEM;
811 goto out_unpin;
812 }
813
814 regs->DWINPOS = (params->dst_y << 16) | params->dst_x;
815 regs->DWINSZ = (params->dst_h << 16) | params->dst_w;
816
817 if (params->format & I915_OVERLAY_YUV_PACKED)
818 tmp_width = packed_width_bytes(params->format, params->src_w);
819 else
820 tmp_width = params->src_w;
821
822 regs->SWIDTH = params->src_w;
823 regs->SWIDTHSW = calc_swidthsw(overlay->dev,
722506f0 824 params->offset_Y, tmp_width);
02e792fb 825 regs->SHEIGHT = params->src_h;
05394f39 826 regs->OBUF_0Y = new_bo->gtt_offset + params-> offset_Y;
02e792fb
DV
827 regs->OSTRIDE = params->stride_Y;
828
829 if (params->format & I915_OVERLAY_YUV_PLANAR) {
830 int uv_hscale = uv_hsubsampling(params->format);
831 int uv_vscale = uv_vsubsampling(params->format);
832 u32 tmp_U, tmp_V;
833 regs->SWIDTH |= (params->src_w/uv_hscale) << 16;
834 tmp_U = calc_swidthsw(overlay->dev, params->offset_U,
722506f0 835 params->src_w/uv_hscale);
02e792fb 836 tmp_V = calc_swidthsw(overlay->dev, params->offset_V,
722506f0 837 params->src_w/uv_hscale);
02e792fb
DV
838 regs->SWIDTHSW |= max_t(u32, tmp_U, tmp_V) << 16;
839 regs->SHEIGHT |= (params->src_h/uv_vscale) << 16;
05394f39
CW
840 regs->OBUF_0U = new_bo->gtt_offset + params->offset_U;
841 regs->OBUF_0V = new_bo->gtt_offset + params->offset_V;
02e792fb
DV
842 regs->OSTRIDE |= params->stride_UV << 16;
843 }
844
845 scale_changed = update_scaling_factors(overlay, regs, params);
846
847 update_colorkey(overlay, regs);
848
849 regs->OCMD = overlay_cmd_reg(params);
850
9bb2ff73 851 intel_overlay_unmap_regs(overlay, regs);
02e792fb 852
8dc5d147
CW
853 ret = intel_overlay_continue(overlay, scale_changed);
854 if (ret)
855 goto out_unpin;
02e792fb
DV
856
857 overlay->old_vid_bo = overlay->vid_bo;
05394f39 858 overlay->vid_bo = new_bo;
02e792fb
DV
859
860 return 0;
861
862out_unpin:
863 i915_gem_object_unpin(new_bo);
864 return ret;
865}
866
5dcdbcb0
CW
867int intel_overlay_switch_off(struct intel_overlay *overlay,
868 bool interruptible)
02e792fb 869{
02e792fb 870 struct overlay_registers *regs;
02e792fb 871 struct drm_device *dev = overlay->dev;
5dcdbcb0 872 int ret;
02e792fb
DV
873
874 BUG_ON(!mutex_is_locked(&dev->struct_mutex));
875 BUG_ON(!mutex_is_locked(&dev->mode_config.mutex));
876
b303cf95
CW
877 ret = intel_overlay_recover_from_interrupt(overlay, interruptible);
878 if (ret != 0)
879 return ret;
9bedb974 880
02e792fb
DV
881 if (!overlay->active)
882 return 0;
883
02e792fb
DV
884 ret = intel_overlay_release_old_vid(overlay);
885 if (ret != 0)
886 return ret;
887
8d74f656 888 regs = intel_overlay_map_regs(overlay);
02e792fb 889 regs->OCMD = 0;
9bb2ff73 890 intel_overlay_unmap_regs(overlay, regs);
02e792fb 891
5dcdbcb0 892 ret = intel_overlay_off(overlay, interruptible);
03f77ea5
DV
893 if (ret != 0)
894 return ret;
895
12ca45fe 896 intel_overlay_off_tail(overlay);
02e792fb
DV
897 return 0;
898}
899
900static int check_overlay_possible_on_crtc(struct intel_overlay *overlay,
901 struct intel_crtc *crtc)
902{
722506f0 903 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
02e792fb 904
f7abfe8b 905 if (!crtc->active)
02e792fb
DV
906 return -EINVAL;
907
02e792fb 908 /* can't use the overlay with double wide pipe */
a6c45cf0 909 if (INTEL_INFO(overlay->dev)->gen < 4 &&
f7abfe8b 910 (I915_READ(PIPECONF(crtc->pipe)) & (PIPECONF_DOUBLE_WIDE | PIPECONF_ENABLE)) != PIPECONF_ENABLE)
02e792fb
DV
911 return -EINVAL;
912
913 return 0;
914}
915
916static void update_pfit_vscale_ratio(struct intel_overlay *overlay)
917{
918 struct drm_device *dev = overlay->dev;
722506f0 919 drm_i915_private_t *dev_priv = dev->dev_private;
02e792fb 920 u32 pfit_control = I915_READ(PFIT_CONTROL);
446d2183 921 u32 ratio;
02e792fb
DV
922
923 /* XXX: This is not the same logic as in the xorg driver, but more in
446d2183
CW
924 * line with the intel documentation for the i965
925 */
a6c45cf0
CW
926 if (INTEL_INFO(dev)->gen >= 4) {
927 /* on i965 use the PGM reg to read out the autoscaler values */
928 ratio = I915_READ(PFIT_PGM_RATIOS) >> PFIT_VERT_SCALE_SHIFT_965;
929 } else {
446d2183
CW
930 if (pfit_control & VERT_AUTO_SCALE)
931 ratio = I915_READ(PFIT_AUTO_RATIOS);
02e792fb 932 else
446d2183
CW
933 ratio = I915_READ(PFIT_PGM_RATIOS);
934 ratio >>= PFIT_VERT_SCALE_SHIFT;
02e792fb
DV
935 }
936
937 overlay->pfit_vscale_ratio = ratio;
938}
939
940static int check_overlay_dst(struct intel_overlay *overlay,
941 struct drm_intel_overlay_put_image *rec)
942{
943 struct drm_display_mode *mode = &overlay->crtc->base.mode;
944
722506f0
CW
945 if (rec->dst_x < mode->crtc_hdisplay &&
946 rec->dst_x + rec->dst_width <= mode->crtc_hdisplay &&
947 rec->dst_y < mode->crtc_vdisplay &&
948 rec->dst_y + rec->dst_height <= mode->crtc_vdisplay)
02e792fb
DV
949 return 0;
950 else
951 return -EINVAL;
952}
953
954static int check_overlay_scaling(struct put_image_params *rec)
955{
956 u32 tmp;
957
958 /* downscaling limit is 8.0 */
959 tmp = ((rec->src_scan_h << 16) / rec->dst_h) >> 16;
960 if (tmp > 7)
961 return -EINVAL;
962 tmp = ((rec->src_scan_w << 16) / rec->dst_w) >> 16;
963 if (tmp > 7)
964 return -EINVAL;
965
966 return 0;
967}
968
969static int check_overlay_src(struct drm_device *dev,
970 struct drm_intel_overlay_put_image *rec,
05394f39 971 struct drm_i915_gem_object *new_bo)
02e792fb 972{
02e792fb
DV
973 int uv_hscale = uv_hsubsampling(rec->flags);
974 int uv_vscale = uv_vsubsampling(rec->flags);
8f28f54a
DC
975 u32 stride_mask;
976 int depth;
977 u32 tmp;
02e792fb
DV
978
979 /* check src dimensions */
980 if (IS_845G(dev) || IS_I830(dev)) {
722506f0 981 if (rec->src_height > IMAGE_MAX_HEIGHT_LEGACY ||
9f7c3f44 982 rec->src_width > IMAGE_MAX_WIDTH_LEGACY)
02e792fb
DV
983 return -EINVAL;
984 } else {
722506f0 985 if (rec->src_height > IMAGE_MAX_HEIGHT ||
9f7c3f44 986 rec->src_width > IMAGE_MAX_WIDTH)
02e792fb
DV
987 return -EINVAL;
988 }
9f7c3f44 989
02e792fb 990 /* better safe than sorry, use 4 as the maximal subsampling ratio */
722506f0 991 if (rec->src_height < N_VERT_Y_TAPS*4 ||
9f7c3f44 992 rec->src_width < N_HORIZ_Y_TAPS*4)
02e792fb
DV
993 return -EINVAL;
994
a1efd14a 995 /* check alignment constraints */
02e792fb 996 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
722506f0
CW
997 case I915_OVERLAY_RGB:
998 /* not implemented */
999 return -EINVAL;
9f7c3f44 1000
722506f0 1001 case I915_OVERLAY_YUV_PACKED:
722506f0 1002 if (uv_vscale != 1)
02e792fb 1003 return -EINVAL;
9f7c3f44
CW
1004
1005 depth = packed_depth_bytes(rec->flags);
722506f0
CW
1006 if (depth < 0)
1007 return depth;
9f7c3f44 1008
722506f0
CW
1009 /* ignore UV planes */
1010 rec->stride_UV = 0;
1011 rec->offset_U = 0;
1012 rec->offset_V = 0;
1013 /* check pixel alignment */
1014 if (rec->offset_Y % depth)
1015 return -EINVAL;
1016 break;
9f7c3f44 1017
722506f0
CW
1018 case I915_OVERLAY_YUV_PLANAR:
1019 if (uv_vscale < 0 || uv_hscale < 0)
02e792fb 1020 return -EINVAL;
722506f0
CW
1021 /* no offset restrictions for planar formats */
1022 break;
9f7c3f44 1023
722506f0
CW
1024 default:
1025 return -EINVAL;
02e792fb
DV
1026 }
1027
1028 if (rec->src_width % uv_hscale)
1029 return -EINVAL;
1030
1031 /* stride checking */
a1efd14a
CW
1032 if (IS_I830(dev) || IS_845G(dev))
1033 stride_mask = 255;
1034 else
1035 stride_mask = 63;
02e792fb
DV
1036
1037 if (rec->stride_Y & stride_mask || rec->stride_UV & stride_mask)
1038 return -EINVAL;
a6c45cf0 1039 if (IS_GEN4(dev) && rec->stride_Y < 512)
02e792fb
DV
1040 return -EINVAL;
1041
1042 tmp = (rec->flags & I915_OVERLAY_TYPE_MASK) == I915_OVERLAY_YUV_PLANAR ?
9f7c3f44
CW
1043 4096 : 8192;
1044 if (rec->stride_Y > tmp || rec->stride_UV > 2*1024)
02e792fb
DV
1045 return -EINVAL;
1046
1047 /* check buffer dimensions */
1048 switch (rec->flags & I915_OVERLAY_TYPE_MASK) {
722506f0
CW
1049 case I915_OVERLAY_RGB:
1050 case I915_OVERLAY_YUV_PACKED:
1051 /* always 4 Y values per depth pixels */
1052 if (packed_width_bytes(rec->flags, rec->src_width) > rec->stride_Y)
1053 return -EINVAL;
1054
1055 tmp = rec->stride_Y*rec->src_height;
05394f39 1056 if (rec->offset_Y + tmp > new_bo->base.size)
722506f0
CW
1057 return -EINVAL;
1058 break;
1059
1060 case I915_OVERLAY_YUV_PLANAR:
1061 if (rec->src_width > rec->stride_Y)
1062 return -EINVAL;
1063 if (rec->src_width/uv_hscale > rec->stride_UV)
1064 return -EINVAL;
1065
9f7c3f44 1066 tmp = rec->stride_Y * rec->src_height;
05394f39 1067 if (rec->offset_Y + tmp > new_bo->base.size)
722506f0 1068 return -EINVAL;
9f7c3f44
CW
1069
1070 tmp = rec->stride_UV * (rec->src_height / uv_vscale);
05394f39
CW
1071 if (rec->offset_U + tmp > new_bo->base.size ||
1072 rec->offset_V + tmp > new_bo->base.size)
722506f0
CW
1073 return -EINVAL;
1074 break;
02e792fb
DV
1075 }
1076
1077 return 0;
1078}
1079
e9e331a8
CW
1080/**
1081 * Return the pipe currently connected to the panel fitter,
1082 * or -1 if the panel fitter is not present or not in use
1083 */
1084static int intel_panel_fitter_pipe(struct drm_device *dev)
1085{
1086 struct drm_i915_private *dev_priv = dev->dev_private;
1087 u32 pfit_control;
1088
1089 /* i830 doesn't have a panel fitter */
1090 if (IS_I830(dev))
1091 return -1;
1092
1093 pfit_control = I915_READ(PFIT_CONTROL);
1094
1095 /* See if the panel fitter is in use */
1096 if ((pfit_control & PFIT_ENABLE) == 0)
1097 return -1;
1098
1099 /* 965 can place panel fitter on either pipe */
a6c45cf0 1100 if (IS_GEN4(dev))
e9e331a8
CW
1101 return (pfit_control >> 29) & 0x3;
1102
1103 /* older chips can only use pipe 1 */
1104 return 1;
1105}
1106
02e792fb
DV
1107int intel_overlay_put_image(struct drm_device *dev, void *data,
1108 struct drm_file *file_priv)
1109{
1110 struct drm_intel_overlay_put_image *put_image_rec = data;
1111 drm_i915_private_t *dev_priv = dev->dev_private;
1112 struct intel_overlay *overlay;
1113 struct drm_mode_object *drmmode_obj;
1114 struct intel_crtc *crtc;
05394f39 1115 struct drm_i915_gem_object *new_bo;
02e792fb
DV
1116 struct put_image_params *params;
1117 int ret;
1118
1119 if (!dev_priv) {
1120 DRM_ERROR("called with no initialization\n");
1121 return -EINVAL;
1122 }
1123
1124 overlay = dev_priv->overlay;
1125 if (!overlay) {
1126 DRM_DEBUG("userspace bug: no overlay\n");
1127 return -ENODEV;
1128 }
1129
1130 if (!(put_image_rec->flags & I915_OVERLAY_ENABLE)) {
1131 mutex_lock(&dev->mode_config.mutex);
1132 mutex_lock(&dev->struct_mutex);
1133
5dcdbcb0 1134 ret = intel_overlay_switch_off(overlay, true);
02e792fb
DV
1135
1136 mutex_unlock(&dev->struct_mutex);
1137 mutex_unlock(&dev->mode_config.mutex);
1138
1139 return ret;
1140 }
1141
1142 params = kmalloc(sizeof(struct put_image_params), GFP_KERNEL);
1143 if (!params)
1144 return -ENOMEM;
1145
1146 drmmode_obj = drm_mode_object_find(dev, put_image_rec->crtc_id,
722506f0 1147 DRM_MODE_OBJECT_CRTC);
915a428e
DC
1148 if (!drmmode_obj) {
1149 ret = -ENOENT;
1150 goto out_free;
1151 }
02e792fb
DV
1152 crtc = to_intel_crtc(obj_to_crtc(drmmode_obj));
1153
05394f39
CW
1154 new_bo = to_intel_bo(drm_gem_object_lookup(dev, file_priv,
1155 put_image_rec->bo_handle));
915a428e
DC
1156 if (!new_bo) {
1157 ret = -ENOENT;
1158 goto out_free;
1159 }
02e792fb
DV
1160
1161 mutex_lock(&dev->mode_config.mutex);
1162 mutex_lock(&dev->struct_mutex);
1163
b303cf95
CW
1164 ret = intel_overlay_recover_from_interrupt(overlay, true);
1165 if (ret != 0)
1166 goto out_unlock;
03f77ea5 1167
02e792fb
DV
1168 if (overlay->crtc != crtc) {
1169 struct drm_display_mode *mode = &crtc->base.mode;
5dcdbcb0 1170 ret = intel_overlay_switch_off(overlay, true);
02e792fb
DV
1171 if (ret != 0)
1172 goto out_unlock;
1173
1174 ret = check_overlay_possible_on_crtc(overlay, crtc);
1175 if (ret != 0)
1176 goto out_unlock;
1177
1178 overlay->crtc = crtc;
1179 crtc->overlay = overlay;
1180
e9e331a8
CW
1181 /* line too wide, i.e. one-line-mode */
1182 if (mode->hdisplay > 1024 &&
1183 intel_panel_fitter_pipe(dev) == crtc->pipe) {
02e792fb
DV
1184 overlay->pfit_active = 1;
1185 update_pfit_vscale_ratio(overlay);
1186 } else
1187 overlay->pfit_active = 0;
1188 }
1189
1190 ret = check_overlay_dst(overlay, put_image_rec);
1191 if (ret != 0)
1192 goto out_unlock;
1193
1194 if (overlay->pfit_active) {
1195 params->dst_y = ((((u32)put_image_rec->dst_y) << 12) /
722506f0 1196 overlay->pfit_vscale_ratio);
02e792fb
DV
1197 /* shifting right rounds downwards, so add 1 */
1198 params->dst_h = ((((u32)put_image_rec->dst_height) << 12) /
722506f0 1199 overlay->pfit_vscale_ratio) + 1;
02e792fb
DV
1200 } else {
1201 params->dst_y = put_image_rec->dst_y;
1202 params->dst_h = put_image_rec->dst_height;
1203 }
1204 params->dst_x = put_image_rec->dst_x;
1205 params->dst_w = put_image_rec->dst_width;
1206
1207 params->src_w = put_image_rec->src_width;
1208 params->src_h = put_image_rec->src_height;
1209 params->src_scan_w = put_image_rec->src_scan_width;
1210 params->src_scan_h = put_image_rec->src_scan_height;
722506f0
CW
1211 if (params->src_scan_h > params->src_h ||
1212 params->src_scan_w > params->src_w) {
02e792fb
DV
1213 ret = -EINVAL;
1214 goto out_unlock;
1215 }
1216
1217 ret = check_overlay_src(dev, put_image_rec, new_bo);
1218 if (ret != 0)
1219 goto out_unlock;
1220 params->format = put_image_rec->flags & ~I915_OVERLAY_FLAGS_MASK;
1221 params->stride_Y = put_image_rec->stride_Y;
1222 params->stride_UV = put_image_rec->stride_UV;
1223 params->offset_Y = put_image_rec->offset_Y;
1224 params->offset_U = put_image_rec->offset_U;
1225 params->offset_V = put_image_rec->offset_V;
1226
1227 /* Check scaling after src size to prevent a divide-by-zero. */
1228 ret = check_overlay_scaling(params);
1229 if (ret != 0)
1230 goto out_unlock;
1231
1232 ret = intel_overlay_do_put_image(overlay, new_bo, params);
1233 if (ret != 0)
1234 goto out_unlock;
1235
1236 mutex_unlock(&dev->struct_mutex);
1237 mutex_unlock(&dev->mode_config.mutex);
1238
1239 kfree(params);
1240
1241 return 0;
1242
1243out_unlock:
1244 mutex_unlock(&dev->struct_mutex);
1245 mutex_unlock(&dev->mode_config.mutex);
05394f39 1246 drm_gem_object_unreference_unlocked(&new_bo->base);
915a428e 1247out_free:
02e792fb
DV
1248 kfree(params);
1249
1250 return ret;
1251}
1252
1253static void update_reg_attrs(struct intel_overlay *overlay,
1254 struct overlay_registers *regs)
1255{
1256 regs->OCLRC0 = (overlay->contrast << 18) | (overlay->brightness & 0xff);
1257 regs->OCLRC1 = overlay->saturation;
1258}
1259
1260static bool check_gamma_bounds(u32 gamma1, u32 gamma2)
1261{
1262 int i;
1263
1264 if (gamma1 & 0xff000000 || gamma2 & 0xff000000)
1265 return false;
1266
1267 for (i = 0; i < 3; i++) {
722506f0 1268 if (((gamma1 >> i*8) & 0xff) >= ((gamma2 >> i*8) & 0xff))
02e792fb
DV
1269 return false;
1270 }
1271
1272 return true;
1273}
1274
1275static bool check_gamma5_errata(u32 gamma5)
1276{
1277 int i;
1278
1279 for (i = 0; i < 3; i++) {
1280 if (((gamma5 >> i*8) & 0xff) == 0x80)
1281 return false;
1282 }
1283
1284 return true;
1285}
1286
1287static int check_gamma(struct drm_intel_overlay_attrs *attrs)
1288{
722506f0
CW
1289 if (!check_gamma_bounds(0, attrs->gamma0) ||
1290 !check_gamma_bounds(attrs->gamma0, attrs->gamma1) ||
1291 !check_gamma_bounds(attrs->gamma1, attrs->gamma2) ||
1292 !check_gamma_bounds(attrs->gamma2, attrs->gamma3) ||
1293 !check_gamma_bounds(attrs->gamma3, attrs->gamma4) ||
1294 !check_gamma_bounds(attrs->gamma4, attrs->gamma5) ||
1295 !check_gamma_bounds(attrs->gamma5, 0x00ffffff))
02e792fb 1296 return -EINVAL;
722506f0 1297
02e792fb
DV
1298 if (!check_gamma5_errata(attrs->gamma5))
1299 return -EINVAL;
722506f0 1300
02e792fb
DV
1301 return 0;
1302}
1303
1304int intel_overlay_attrs(struct drm_device *dev, void *data,
1305 struct drm_file *file_priv)
1306{
1307 struct drm_intel_overlay_attrs *attrs = data;
1308 drm_i915_private_t *dev_priv = dev->dev_private;
1309 struct intel_overlay *overlay;
1310 struct overlay_registers *regs;
1311 int ret;
1312
1313 if (!dev_priv) {
1314 DRM_ERROR("called with no initialization\n");
1315 return -EINVAL;
1316 }
1317
1318 overlay = dev_priv->overlay;
1319 if (!overlay) {
1320 DRM_DEBUG("userspace bug: no overlay\n");
1321 return -ENODEV;
1322 }
1323
1324 mutex_lock(&dev->mode_config.mutex);
1325 mutex_lock(&dev->struct_mutex);
1326
60fc332c 1327 ret = -EINVAL;
02e792fb 1328 if (!(attrs->flags & I915_OVERLAY_UPDATE_ATTRS)) {
60fc332c 1329 attrs->color_key = overlay->color_key;
02e792fb 1330 attrs->brightness = overlay->brightness;
60fc332c 1331 attrs->contrast = overlay->contrast;
02e792fb
DV
1332 attrs->saturation = overlay->saturation;
1333
a6c45cf0 1334 if (!IS_GEN2(dev)) {
02e792fb
DV
1335 attrs->gamma0 = I915_READ(OGAMC0);
1336 attrs->gamma1 = I915_READ(OGAMC1);
1337 attrs->gamma2 = I915_READ(OGAMC2);
1338 attrs->gamma3 = I915_READ(OGAMC3);
1339 attrs->gamma4 = I915_READ(OGAMC4);
1340 attrs->gamma5 = I915_READ(OGAMC5);
1341 }
02e792fb 1342 } else {
60fc332c 1343 if (attrs->brightness < -128 || attrs->brightness > 127)
02e792fb 1344 goto out_unlock;
60fc332c 1345 if (attrs->contrast > 255)
02e792fb 1346 goto out_unlock;
60fc332c 1347 if (attrs->saturation > 1023)
02e792fb 1348 goto out_unlock;
02e792fb 1349
60fc332c
CW
1350 overlay->color_key = attrs->color_key;
1351 overlay->brightness = attrs->brightness;
1352 overlay->contrast = attrs->contrast;
1353 overlay->saturation = attrs->saturation;
02e792fb 1354
8d74f656 1355 regs = intel_overlay_map_regs(overlay);
02e792fb
DV
1356 if (!regs) {
1357 ret = -ENOMEM;
1358 goto out_unlock;
1359 }
1360
1361 update_reg_attrs(overlay, regs);
1362
9bb2ff73 1363 intel_overlay_unmap_regs(overlay, regs);
02e792fb
DV
1364
1365 if (attrs->flags & I915_OVERLAY_UPDATE_GAMMA) {
a6c45cf0 1366 if (IS_GEN2(dev))
02e792fb 1367 goto out_unlock;
02e792fb
DV
1368
1369 if (overlay->active) {
1370 ret = -EBUSY;
1371 goto out_unlock;
1372 }
1373
1374 ret = check_gamma(attrs);
60fc332c 1375 if (ret)
02e792fb
DV
1376 goto out_unlock;
1377
1378 I915_WRITE(OGAMC0, attrs->gamma0);
1379 I915_WRITE(OGAMC1, attrs->gamma1);
1380 I915_WRITE(OGAMC2, attrs->gamma2);
1381 I915_WRITE(OGAMC3, attrs->gamma3);
1382 I915_WRITE(OGAMC4, attrs->gamma4);
1383 I915_WRITE(OGAMC5, attrs->gamma5);
1384 }
02e792fb
DV
1385 }
1386
60fc332c 1387 ret = 0;
02e792fb
DV
1388out_unlock:
1389 mutex_unlock(&dev->struct_mutex);
1390 mutex_unlock(&dev->mode_config.mutex);
1391
1392 return ret;
1393}
1394
1395void intel_setup_overlay(struct drm_device *dev)
1396{
1397 drm_i915_private_t *dev_priv = dev->dev_private;
1398 struct intel_overlay *overlay;
05394f39 1399 struct drm_i915_gem_object *reg_bo;
02e792fb
DV
1400 struct overlay_registers *regs;
1401 int ret;
1402
31578148 1403 if (!HAS_OVERLAY(dev))
02e792fb
DV
1404 return;
1405
1406 overlay = kzalloc(sizeof(struct intel_overlay), GFP_KERNEL);
1407 if (!overlay)
1408 return;
1409 overlay->dev = dev;
1410
ac52bc56 1411 reg_bo = i915_gem_alloc_object(dev, PAGE_SIZE);
02e792fb
DV
1412 if (!reg_bo)
1413 goto out_free;
05394f39 1414 overlay->reg_bo = reg_bo;
02e792fb 1415
31578148 1416 if (OVERLAY_NEEDS_PHYSICAL(dev)) {
02e792fb 1417 ret = i915_gem_attach_phys_object(dev, reg_bo,
6eeefaf3 1418 I915_GEM_PHYS_OVERLAY_REGS,
a2930128 1419 PAGE_SIZE);
02e792fb
DV
1420 if (ret) {
1421 DRM_ERROR("failed to attach phys overlay regs\n");
1422 goto out_free_bo;
1423 }
05394f39 1424 overlay->flip_addr = reg_bo->phys_obj->handle->busaddr;
31578148 1425 } else {
75e9e915 1426 ret = i915_gem_object_pin(reg_bo, PAGE_SIZE, true);
02e792fb
DV
1427 if (ret) {
1428 DRM_ERROR("failed to pin overlay register bo\n");
1429 goto out_free_bo;
1430 }
05394f39 1431 overlay->flip_addr = reg_bo->gtt_offset;
0ddc1289
CW
1432
1433 ret = i915_gem_object_set_to_gtt_domain(reg_bo, true);
1434 if (ret) {
1435 DRM_ERROR("failed to move overlay register bo into the GTT\n");
1436 goto out_unpin_bo;
1437 }
02e792fb
DV
1438 }
1439
1440 /* init all values */
1441 overlay->color_key = 0x0101fe;
1442 overlay->brightness = -19;
1443 overlay->contrast = 75;
1444 overlay->saturation = 146;
1445
8d74f656 1446 regs = intel_overlay_map_regs(overlay);
02e792fb
DV
1447 if (!regs)
1448 goto out_free_bo;
1449
1450 memset(regs, 0, sizeof(struct overlay_registers));
1451 update_polyphase_filter(regs);
02e792fb
DV
1452 update_reg_attrs(overlay, regs);
1453
9bb2ff73 1454 intel_overlay_unmap_regs(overlay, regs);
02e792fb
DV
1455
1456 dev_priv->overlay = overlay;
1457 DRM_INFO("initialized overlay support\n");
1458 return;
1459
0ddc1289
CW
1460out_unpin_bo:
1461 i915_gem_object_unpin(reg_bo);
02e792fb 1462out_free_bo:
05394f39 1463 drm_gem_object_unreference(&reg_bo->base);
02e792fb
DV
1464out_free:
1465 kfree(overlay);
1466 return;
1467}
1468
1469void intel_cleanup_overlay(struct drm_device *dev)
1470{
722506f0 1471 drm_i915_private_t *dev_priv = dev->dev_private;
02e792fb 1472
62cf4e6f
CW
1473 if (!dev_priv->overlay)
1474 return;
02e792fb 1475
62cf4e6f
CW
1476 /* The bo's should be free'd by the generic code already.
1477 * Furthermore modesetting teardown happens beforehand so the
1478 * hardware should be off already */
1479 BUG_ON(dev_priv->overlay->active);
1480
1481 drm_gem_object_unreference_unlocked(&dev_priv->overlay->reg_bo->base);
1482 kfree(dev_priv->overlay);
02e792fb 1483}
6ef3d427 1484
3bd3c932
CW
1485#ifdef CONFIG_DEBUG_FS
1486#include <linux/seq_file.h>
1487
6ef3d427
CW
1488struct intel_overlay_error_state {
1489 struct overlay_registers regs;
1490 unsigned long base;
1491 u32 dovsta;
1492 u32 isr;
1493};
1494
3bd3c932 1495static struct overlay_registers *
c48c43e4 1496intel_overlay_map_regs_atomic(struct intel_overlay *overlay)
3bd3c932 1497{
c48c43e4 1498 drm_i915_private_t *dev_priv = overlay->dev->dev_private;
3bd3c932
CW
1499 struct overlay_registers *regs;
1500
1501 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
1502 regs = overlay->reg_bo->phys_obj->handle->vaddr;
1503 else
1504 regs = io_mapping_map_atomic_wc(dev_priv->mm.gtt_mapping,
c48c43e4 1505 overlay->reg_bo->gtt_offset);
3bd3c932
CW
1506
1507 return regs;
1508}
1509
1510static void intel_overlay_unmap_regs_atomic(struct intel_overlay *overlay,
3bd3c932
CW
1511 struct overlay_registers *regs)
1512{
1513 if (!OVERLAY_NEEDS_PHYSICAL(overlay->dev))
c48c43e4 1514 io_mapping_unmap_atomic(regs);
3bd3c932
CW
1515}
1516
1517
6ef3d427
CW
1518struct intel_overlay_error_state *
1519intel_overlay_capture_error_state(struct drm_device *dev)
1520{
1521 drm_i915_private_t *dev_priv = dev->dev_private;
1522 struct intel_overlay *overlay = dev_priv->overlay;
1523 struct intel_overlay_error_state *error;
1524 struct overlay_registers __iomem *regs;
1525
1526 if (!overlay || !overlay->active)
1527 return NULL;
1528
1529 error = kmalloc(sizeof(*error), GFP_ATOMIC);
1530 if (error == NULL)
1531 return NULL;
1532
1533 error->dovsta = I915_READ(DOVSTA);
1534 error->isr = I915_READ(ISR);
31578148 1535 if (OVERLAY_NEEDS_PHYSICAL(overlay->dev))
6ef3d427 1536 error->base = (long) overlay->reg_bo->phys_obj->handle->vaddr;
31578148
CW
1537 else
1538 error->base = (long) overlay->reg_bo->gtt_offset;
6ef3d427
CW
1539
1540 regs = intel_overlay_map_regs_atomic(overlay);
1541 if (!regs)
1542 goto err;
1543
1544 memcpy_fromio(&error->regs, regs, sizeof(struct overlay_registers));
c48c43e4 1545 intel_overlay_unmap_regs_atomic(overlay, regs);
6ef3d427
CW
1546
1547 return error;
1548
1549err:
1550 kfree(error);
1551 return NULL;
1552}
1553
1554void
1555intel_overlay_print_error_state(struct seq_file *m, struct intel_overlay_error_state *error)
1556{
1557 seq_printf(m, "Overlay, status: 0x%08x, interrupt: 0x%08x\n",
1558 error->dovsta, error->isr);
1559 seq_printf(m, " Register file at 0x%08lx:\n",
1560 error->base);
1561
1562#define P(x) seq_printf(m, " " #x ": 0x%08x\n", error->regs.x)
1563 P(OBUF_0Y);
1564 P(OBUF_1Y);
1565 P(OBUF_0U);
1566 P(OBUF_0V);
1567 P(OBUF_1U);
1568 P(OBUF_1V);
1569 P(OSTRIDE);
1570 P(YRGB_VPH);
1571 P(UV_VPH);
1572 P(HORZ_PH);
1573 P(INIT_PHS);
1574 P(DWINPOS);
1575 P(DWINSZ);
1576 P(SWIDTH);
1577 P(SWIDTHSW);
1578 P(SHEIGHT);
1579 P(YRGBSCALE);
1580 P(UVSCALE);
1581 P(OCLRC0);
1582 P(OCLRC1);
1583 P(DCLRKV);
1584 P(DCLRKM);
1585 P(SCLRKVH);
1586 P(SCLRKVL);
1587 P(SCLRKEN);
1588 P(OCONFIG);
1589 P(OCMD);
1590 P(OSTART_0Y);
1591 P(OSTART_1Y);
1592 P(OSTART_0U);
1593 P(OSTART_0V);
1594 P(OSTART_1U);
1595 P(OSTART_1V);
1596 P(OTILEOFF_0Y);
1597 P(OTILEOFF_1Y);
1598 P(OTILEOFF_0U);
1599 P(OTILEOFF_0V);
1600 P(OTILEOFF_1U);
1601 P(OTILEOFF_1V);
1602 P(FASTHSCALE);
1603 P(UVSCALEV);
1604#undef P
1605}
3bd3c932 1606#endif