2 * Copyright © 2008-2012 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
24 * Eric Anholt <eric@anholt.net>
25 * Chris Wilson <chris@chris-wilson.co.uk>
30 #include <drm/i915_drm.h>
/* Size helpers: KB(x) multiplies x by 1024; MB(x) multiplies KB(x) by a further 1024. */
33 #define KB(x) ((x) * 1024)
34 #define MB(x) (KB(x) * 1024)
37 * The BIOS typically reserves some of the system's memory for the exclusive
38 * use of the integrated graphics. This memory is no longer available for
39 * use by the OS and so the user finds that his system has less memory
40 * available than he put in. We refer to this memory as stolen.
42 * The BIOS will allocate its framebuffer from the stolen memory. Our
43 * goal is to try to reuse that object for our own fbcon which must always
44 * be available for panics. Anything else we can reuse the stolen memory
/*
 * Insert @node into the stolen-memory range manager (dev_priv->mm.stolen),
 * passing @start and @end as the range bounds and DRM_MM_INSERT_BEST as the
 * insertion mode.
 *
 * The allocator is first tested with drm_mm_initialized(); the insertion
 * itself is performed with dev_priv->mm.stolen_lock held.
 *
 * NOTE(review): this excerpt is missing lines -- the action taken when the
 * allocator is not initialised, the size/alignment arguments of the insert
 * call and the final return statement are not visible here.
 */
48 int i915_gem_stolen_insert_node_in_range(struct drm_i915_private
*dev_priv
,
49 struct drm_mm_node
*node
, u64 size
,
50 unsigned alignment
, u64 start
, u64 end
)
54 if (!drm_mm_initialized(&dev_priv
->mm
.stolen
))
57 mutex_lock(&dev_priv
->mm
.stolen_lock
);
58 ret
= drm_mm_insert_node_in_range(&dev_priv
->mm
.stolen
, node
,
60 start
, end
, DRM_MM_INSERT_BEST
);
61 mutex_unlock(&dev_priv
->mm
.stolen_lock
);
/*
 * Convenience wrapper: forwards @dev_priv, @node, @size and an alignment
 * value to i915_gem_stolen_insert_node_in_range() with the range bounds
 * 0 and U64_MAX, and returns that call's result.
 *
 * NOTE(review): the tail of the parameter list (where "alignment" is
 * presumably declared) is missing from this excerpt.
 */
66 int i915_gem_stolen_insert_node(struct drm_i915_private
*dev_priv
,
67 struct drm_mm_node
*node
, u64 size
,
70 return i915_gem_stolen_insert_node_in_range(dev_priv
, node
, size
,
71 alignment
, 0, U64_MAX
);
/*
 * Remove @node from its range manager via drm_mm_remove_node(), holding
 * dev_priv->mm.stolen_lock around the call.
 */
74 void i915_gem_stolen_remove_node(struct drm_i915_private
*dev_priv
,
75 struct drm_mm_node
*node
)
77 mutex_lock(&dev_priv
->mm
.stolen_lock
);
78 drm_mm_remove_node(node
);
79 mutex_unlock(&dev_priv
->mm
.stolen_lock
);
/*
 * Work out the address (dma_addr_t) at which stolen memory begins.
 *
 * Steps visible in this excerpt:
 *  - gen >= 3: read the INTEL_BSM dword from the GPU's PCI config space and
 *    mask it with INTEL_BSM_MASK.
 *  - i865G: base = (toud << 16) + tseg_size, using config reads from the
 *    device at devfn 0:0 on the same bus.
 *  - i85x, i845G, i830: base = tom - tseg_size - ggtt->stolen_size.
 *  - base == 0, or base + ggtt->stolen_size overflowing, is tested.
 *  - gen <= 4 except G33/Pineview/G4X: the GTT location is derived from
 *    PGTBL_CTL (length ggtt_total_entries() * 4); if it lies inside the
 *    stolen range, the larger remaining piece is kept and both base and
 *    ggtt->stolen_size are adjusted to it.
 *  - The range is claimed with devm_request_mem_region(); a second request
 *    is made starting at base + 1 with the size reduced by one. If the
 *    result is NULL on anything other than gen3, a conflict is logged with
 *    DRM_ERROR.
 *
 * NOTE(review): many lines are missing from this excerpt (local
 * declarations, the register offsets passed to the bridge reads, the
 * tseg_size assignments, every return statement and some comment
 * delimiters), so the exact return values cannot be confirmed from here.
 */
82 static dma_addr_t
i915_stolen_to_dma(struct drm_i915_private
*dev_priv
)
84 struct pci_dev
*pdev
= dev_priv
->drm
.pdev
;
85 struct i915_ggtt
*ggtt
= &dev_priv
->ggtt
;
89 /* Almost universally we can find the Graphics Base of Stolen Memory
90 * at register BSM (0x5c) in the igfx configuration space. On a few
91 * (desktop) machines this is also mirrored in the bridge device at
92 * different locations, or in the MCHBAR.
94 * On 865 we just check the TOUD register.
96 * On 830/845/85x the stolen memory base isn't available in any
97 * register. We need to calculate it as TOM-TSEG_SIZE-stolen_size.
101 if (INTEL_GEN(dev_priv
) >= 3) {
104 pci_read_config_dword(pdev
, INTEL_BSM
, &bsm
);
106 base
= bsm
& INTEL_BSM_MASK
;
107 } else if (IS_I865G(dev_priv
)) {
112 pci_bus_read_config_byte(pdev
->bus
, PCI_DEVFN(0, 0),
115 if (tmp
& TSEG_ENABLE
) {
116 switch (tmp
& I845_TSEG_SIZE_MASK
) {
117 case I845_TSEG_SIZE_512K
:
120 case I845_TSEG_SIZE_1M
:
126 pci_bus_read_config_word(pdev
->bus
, PCI_DEVFN(0, 0),
129 base
= (toud
<< 16) + tseg_size
;
130 } else if (IS_I85X(dev_priv
)) {
135 pci_bus_read_config_byte(pdev
->bus
, PCI_DEVFN(0, 0),
138 if (tmp
& TSEG_ENABLE
)
141 pci_bus_read_config_byte(pdev
->bus
, PCI_DEVFN(0, 1),
145 base
= tom
- tseg_size
- ggtt
->stolen_size
;
146 } else if (IS_I845G(dev_priv
)) {
151 pci_bus_read_config_byte(pdev
->bus
, PCI_DEVFN(0, 0),
154 if (tmp
& TSEG_ENABLE
) {
155 switch (tmp
& I845_TSEG_SIZE_MASK
) {
156 case I845_TSEG_SIZE_512K
:
159 case I845_TSEG_SIZE_1M
:
165 pci_bus_read_config_byte(pdev
->bus
, PCI_DEVFN(0, 0),
169 base
= tom
- tseg_size
- ggtt
->stolen_size
;
170 } else if (IS_I830(dev_priv
)) {
175 pci_bus_read_config_byte(pdev
->bus
, PCI_DEVFN(0, 0),
178 if (tmp
& TSEG_ENABLE
) {
179 if (tmp
& I830_TSEG_SIZE_1M
)
185 pci_bus_read_config_byte(pdev
->bus
, PCI_DEVFN(0, 0),
189 base
= tom
- tseg_size
- ggtt
->stolen_size
;
192 if (base
== 0 || add_overflows(base
, ggtt
->stolen_size
))
195 /* make sure we don't clobber the GTT if it's within stolen memory */
196 if (INTEL_GEN(dev_priv
) <= 4 &&
197 !IS_G33(dev_priv
) && !IS_PINEVIEW(dev_priv
) && !IS_G4X(dev_priv
)) {
199 dma_addr_t start
, end
;
201 { .start
= base
, .end
= base
+ ggtt
->stolen_size
, },
202 { .start
= base
, .end
= base
+ ggtt
->stolen_size
, },
204 u64 ggtt_start
, ggtt_end
;
206 ggtt_start
= I915_READ(PGTBL_CTL
);
207 if (IS_GEN4(dev_priv
))
208 ggtt_start
= (ggtt_start
& PGTBL_ADDRESS_LO_MASK
) |
209 (ggtt_start
& PGTBL_ADDRESS_HI_MASK
) << 28;
211 ggtt_start
&= PGTBL_ADDRESS_LO_MASK
;
212 ggtt_end
= ggtt_start
+ ggtt_total_entries(ggtt
) * 4;
214 if (ggtt_start
>= stolen
[0].start
&& ggtt_start
< stolen
[0].end
)
215 stolen
[0].end
= ggtt_start
;
216 if (ggtt_end
> stolen
[1].start
&& ggtt_end
<= stolen
[1].end
)
217 stolen
[1].start
= ggtt_end
;
219 /* pick the larger of the two chunks */
220 if (stolen
[0].end
- stolen
[0].start
>
221 stolen
[1].end
- stolen
[1].start
) {
222 base
= stolen
[0].start
;
223 ggtt
->stolen_size
= stolen
[0].end
- stolen
[0].start
;
225 base
= stolen
[1].start
;
226 ggtt
->stolen_size
= stolen
[1].end
- stolen
[1].start
;
229 if (stolen
[0].start
!= stolen
[1].start
||
230 stolen
[0].end
!= stolen
[1].end
) {
231 dma_addr_t end
= base
+ ggtt
->stolen_size
- 1;
233 DRM_DEBUG_KMS("GTT within stolen memory at 0x%llx-0x%llx\n",
234 (unsigned long long)ggtt_start
,
235 (unsigned long long)ggtt_end
- 1);
236 DRM_DEBUG_KMS("Stolen memory adjusted to %pad - %pad\n",
242 /* Verify that nothing else uses this physical address. Stolen
243 * memory should be reserved by the BIOS and hidden from the
244 * kernel. So if the region is already marked as busy, something
245 * is seriously wrong.
247 r
= devm_request_mem_region(dev_priv
->drm
.dev
, base
, ggtt
->stolen_size
,
248 "Graphics Stolen Memory");
251 * One more attempt but this time requesting region from
252 * base + 1, as we have seen that this resolves the region
253 * conflict with the PCI Bus.
254 * This is a BIOS w/a: Some BIOS wrap stolen in the root
255 * PCI bus, but have an off-by-one error. Hence retry the
256 * reservation starting from 1 instead of 0.
258 r
= devm_request_mem_region(dev_priv
->drm
.dev
, base
+ 1,
259 ggtt
->stolen_size
- 1,
260 "Graphics Stolen Memory");
262 * GEN3 firmware likes to smash pci bridges into the stolen
263 * range. Apparently this works.
265 if (r
== NULL
&& !IS_GEN3(dev_priv
)) {
266 dma_addr_t end
= base
+ ggtt
->stolen_size
;
268 DRM_ERROR("conflict detected with stolen region: [%pad - %pad]\n",
/*
 * Tear down the stolen-memory range manager for @dev by calling
 * drm_mm_takedown() on dev_priv->mm.stolen.
 *
 * The manager is first tested with drm_mm_initialized(); NOTE(review): the
 * statement guarded by that test is missing from this excerpt (presumably
 * an early return -- confirm against the full file).
 */
277 void i915_gem_cleanup_stolen(struct drm_device
*dev
)
279 struct drm_i915_private
*dev_priv
= to_i915(dev
);
281 if (!drm_mm_initialized(&dev_priv
->mm
.stolen
))
284 drm_mm_takedown(&dev_priv
->mm
.stolen
);
/*
 * Report the reserved part of stolen memory through @base and @size.
 *
 * The register read is CTG_STOLEN_RESERVED when IS_GM45() is true and
 * ELK_STOLEN_RESERVED otherwise. The value stored through @base is the
 * G4X_STOLEN_RESERVED_ADDR2_MASK field shifted left by 16; a WARN_ON fires
 * if the ADDR1 field compares lower than that value. The value stored
 * through @size is the distance from that base to the top of stolen memory
 * (dev_priv->mm.stolen_base + ggtt->stolen_size).
 *
 * NOTE(review): the in-body comment mentions a zero-base case; the code
 * handling it is not visible in this excerpt.
 */
287 static void g4x_get_stolen_reserved(struct drm_i915_private
*dev_priv
,
288 dma_addr_t
*base
, u32
*size
)
290 struct i915_ggtt
*ggtt
= &dev_priv
->ggtt
;
291 uint32_t reg_val
= I915_READ(IS_GM45(dev_priv
) ?
292 CTG_STOLEN_RESERVED
:
293 ELK_STOLEN_RESERVED
);
294 dma_addr_t stolen_top
= dev_priv
->mm
.stolen_base
+ ggtt
->stolen_size
;
296 *base
= (reg_val
& G4X_STOLEN_RESERVED_ADDR2_MASK
) << 16;
298 WARN_ON((reg_val
& G4X_STOLEN_RESERVED_ADDR1_MASK
) < *base
);
300 /* On these platforms, the register doesn't have a size field, so the
301 * size is the distance between the base and the top of the stolen
302 * memory. We also have the genuine case where base is zero and there's
303 * nothing reserved. */
307 *size
= stolen_top
- *base
;
/*
 * Decode GEN6_STOLEN_RESERVED: the value stored through @base is the
 * register masked with GEN6_STOLEN_RESERVED_ADDR_MASK, and the size field
 * (GEN6_STOLEN_RESERVED_SIZE_MASK) is switched over the 1M, 512K, 256K and
 * 128K encodings. MISSING_CASE() is invoked on the size field for an
 * encoding that is not one of those.
 *
 * NOTE(review): the assignments to the size output inside each case are
 * missing from this excerpt.
 */
310 static void gen6_get_stolen_reserved(struct drm_i915_private
*dev_priv
,
311 dma_addr_t
*base
, u32
*size
)
313 uint32_t reg_val
= I915_READ(GEN6_STOLEN_RESERVED
);
315 *base
= reg_val
& GEN6_STOLEN_RESERVED_ADDR_MASK
;
317 switch (reg_val
& GEN6_STOLEN_RESERVED_SIZE_MASK
) {
318 case GEN6_STOLEN_RESERVED_1M
:
321 case GEN6_STOLEN_RESERVED_512K
:
324 case GEN6_STOLEN_RESERVED_256K
:
327 case GEN6_STOLEN_RESERVED_128K
:
332 MISSING_CASE(reg_val
& GEN6_STOLEN_RESERVED_SIZE_MASK
);
/*
 * Decode GEN6_STOLEN_RESERVED using the GEN7 field layout: the value stored
 * through @base is the register masked with GEN7_STOLEN_RESERVED_ADDR_MASK,
 * and the size field (GEN7_STOLEN_RESERVED_SIZE_MASK) is switched over the
 * 1M and 256K encodings, with MISSING_CASE() for anything else.
 *
 * NOTE(review): the assignments to the size output inside each case are
 * missing from this excerpt.
 */
336 static void gen7_get_stolen_reserved(struct drm_i915_private
*dev_priv
,
337 dma_addr_t
*base
, u32
*size
)
339 uint32_t reg_val
= I915_READ(GEN6_STOLEN_RESERVED
);
341 *base
= reg_val
& GEN7_STOLEN_RESERVED_ADDR_MASK
;
343 switch (reg_val
& GEN7_STOLEN_RESERVED_SIZE_MASK
) {
344 case GEN7_STOLEN_RESERVED_1M
:
347 case GEN7_STOLEN_RESERVED_256K
:
352 MISSING_CASE(reg_val
& GEN7_STOLEN_RESERVED_SIZE_MASK
);
/*
 * Decode GEN6_STOLEN_RESERVED using the GEN8 size encodings: the value
 * stored through @base is the register masked with
 * GEN6_STOLEN_RESERVED_ADDR_MASK, and the size field
 * (GEN8_STOLEN_RESERVED_SIZE_MASK) is switched over the 1M, 2M, 4M and 8M
 * encodings. The 2M, 4M and 8M cases store 2, 4 and 8 MiB respectively
 * through @size; a further 8 MiB assignment immediately precedes
 * MISSING_CASE() (presumably the default label -- its line is not visible).
 *
 * NOTE(review): the 1M assignment, the break statements and the default
 * label are missing from this excerpt.
 */
356 static void chv_get_stolen_reserved(struct drm_i915_private
*dev_priv
,
357 dma_addr_t
*base
, u32
*size
)
359 uint32_t reg_val
= I915_READ(GEN6_STOLEN_RESERVED
);
361 *base
= reg_val
& GEN6_STOLEN_RESERVED_ADDR_MASK
;
363 switch (reg_val
& GEN8_STOLEN_RESERVED_SIZE_MASK
) {
364 case GEN8_STOLEN_RESERVED_1M
:
367 case GEN8_STOLEN_RESERVED_2M
:
368 *size
= 2 * 1024 * 1024;
370 case GEN8_STOLEN_RESERVED_4M
:
371 *size
= 4 * 1024 * 1024;
373 case GEN8_STOLEN_RESERVED_8M
:
374 *size
= 8 * 1024 * 1024;
377 *size
= 8 * 1024 * 1024;
378 MISSING_CASE(reg_val
& GEN8_STOLEN_RESERVED_SIZE_MASK
);
/*
 * Report the reserved part of stolen memory through @base and @size from
 * GEN6_STOLEN_RESERVED: the base is the register masked with
 * GEN6_STOLEN_RESERVED_ADDR_MASK, and the size is the distance from that
 * base to the top of stolen memory
 * (dev_priv->mm.stolen_base + ggtt->stolen_size).
 *
 * NOTE(review): the in-body comment mentions a zero-base case; the code
 * handling it is not visible in this excerpt.
 */
382 static void bdw_get_stolen_reserved(struct drm_i915_private
*dev_priv
,
383 dma_addr_t
*base
, u32
*size
)
385 struct i915_ggtt
*ggtt
= &dev_priv
->ggtt
;
386 uint32_t reg_val
= I915_READ(GEN6_STOLEN_RESERVED
);
387 dma_addr_t stolen_top
;
389 stolen_top
= dev_priv
->mm
.stolen_base
+ ggtt
->stolen_size
;
391 *base
= reg_val
& GEN6_STOLEN_RESERVED_ADDR_MASK
;
393 /* On these platforms, the register doesn't have a size field, so the
394 * size is the distance between the base and the top of the stolen
395 * memory. We also have the genuine case where base is zero and there's
396 * nothing reserved. */
400 *size
= stolen_top
- *base
;
/*
 * Set up the stolen-memory allocator for @dev_priv.
 *
 * Steps visible in this excerpt:
 *  - initialise dev_priv->mm.stolen_lock;
 *  - log a DRM_INFO message when intel_vgpu_active() is true, or when
 *    intel_vtd_active() is true on gen < 8 (both messages say stolen
 *    memory is being disabled);
 *  - test ggtt->stolen_size for zero;
 *  - obtain dev_priv->mm.stolen_base from i915_stolen_to_dma() and test it
 *    for zero;
 *  - pick a per-generation helper (g4x/gen6/gen7/chv/bdw) to obtain
 *    reserved_base and reserved_size, or assume a 1 MiB reservation at the
 *    top of stolen for older platforms;
 *  - when reserved_base is zero, treat it as stolen_top;
 *  - log a debug message if the reserved area falls outside
 *    [stolen_base, stolen_top];
 *  - record the reserved base/size in @ggtt, compute the usable size
 *    (skipping the first 4096 bytes on gen >= 8) and call drm_mm_init() on
 *    dev_priv->mm.stolen with that start and size.
 *
 * NOTE(review): the return statements, the case labels of the switch and
 * several other lines are missing from this excerpt, so return values and
 * the exact platform-to-helper mapping cannot be confirmed from here.
 */
403 int i915_gem_init_stolen(struct drm_i915_private
*dev_priv
)
405 struct i915_ggtt
*ggtt
= &dev_priv
->ggtt
;
406 dma_addr_t reserved_base
, stolen_top
;
407 u32 reserved_total
, reserved_size
;
408 u32 stolen_usable_start
;
410 mutex_init(&dev_priv
->mm
.stolen_lock
);
412 if (intel_vgpu_active(dev_priv
)) {
413 DRM_INFO("iGVT-g active, disabling use of stolen memory\n");
417 if (intel_vtd_active() && INTEL_GEN(dev_priv
) < 8) {
418 DRM_INFO("DMAR active, disabling use of stolen memory\n");
422 if (ggtt
->stolen_size
== 0)
425 dev_priv
->mm
.stolen_base
= i915_stolen_to_dma(dev_priv
);
426 if (dev_priv
->mm
.stolen_base
== 0)
429 stolen_top
= dev_priv
->mm
.stolen_base
+ ggtt
->stolen_size
;
433 switch (INTEL_INFO(dev_priv
)->gen
) {
438 if (IS_G4X(dev_priv
))
439 g4x_get_stolen_reserved(dev_priv
,
440 &reserved_base
, &reserved_size
);
443 /* Assume the gen6 maximum for the older platforms. */
444 reserved_size
= 1024 * 1024;
445 reserved_base
= stolen_top
- reserved_size
;
448 gen6_get_stolen_reserved(dev_priv
,
449 &reserved_base
, &reserved_size
);
452 gen7_get_stolen_reserved(dev_priv
,
453 &reserved_base
, &reserved_size
);
457 chv_get_stolen_reserved(dev_priv
,
458 &reserved_base
, &reserved_size
);
460 bdw_get_stolen_reserved(dev_priv
,
461 &reserved_base
, &reserved_size
);
465 /* It is possible for the reserved base to be zero, but the register
466 * field for size doesn't have a zero option. */
467 if (reserved_base
== 0) {
469 reserved_base
= stolen_top
;
472 if (reserved_base
< dev_priv
->mm
.stolen_base
||
473 reserved_base
+ reserved_size
> stolen_top
) {
474 dma_addr_t reserved_top
= reserved_base
+ reserved_size
;
475 DRM_DEBUG_KMS("Stolen reserved area [%pad - %pad] outside stolen memory [%pad - %pad]\n",
476 &reserved_base
, &reserved_top
,
477 &dev_priv
->mm
.stolen_base
, &stolen_top
);
481 ggtt
->stolen_reserved_base
= reserved_base
;
482 ggtt
->stolen_reserved_size
= reserved_size
;
484 /* It is possible for the reserved area to end before the end of stolen
485 * memory, so just consider the start. */
486 reserved_total
= stolen_top
- reserved_base
;
488 DRM_DEBUG_KMS("Memory reserved for graphics device: %uK, usable: %uK\n",
489 ggtt
->stolen_size
>> 10,
490 (ggtt
->stolen_size
- reserved_total
) >> 10);
492 stolen_usable_start
= 0;
493 /* WaSkipStolenMemoryFirstPage:bdw+ */
494 if (INTEL_GEN(dev_priv
) >= 8)
495 stolen_usable_start
= 4096;
497 ggtt
->stolen_usable_size
=
498 ggtt
->stolen_size
- reserved_total
- stolen_usable_start
;
500 /* Basic memrange allocator for stolen space. */
501 drm_mm_init(&dev_priv
->mm
.stolen
, stolen_usable_start
,
502 ggtt
->stolen_usable_size
);
/*
 * Build a single-entry sg_table describing @size bytes of stolen memory
 * starting @offset bytes from dev_priv->mm.stolen_base.
 *
 * GEM_BUG_ON() checks that (@offset, @size) does not overflow
 * ggtt.stolen_size. The table is allocated with kmalloc() and
 * sg_alloc_table(..., 1, ...); ERR_PTR(-ENOMEM) is returned on the two
 * visible failure paths. The entry's DMA address is set to
 * stolen_base + @offset and its DMA length to @size.
 *
 * NOTE(review): the declaration of "st", the NULL test after kmalloc(),
 * the cleanup on sg_alloc_table() failure, the assignment of "sg" and the
 * final return are missing from this excerpt.
 */
507 static struct sg_table
*
508 i915_pages_create_for_stolen(struct drm_device
*dev
,
509 u32 offset
, u32 size
)
511 struct drm_i915_private
*dev_priv
= to_i915(dev
);
513 struct scatterlist
*sg
;
515 GEM_BUG_ON(range_overflows(offset
, size
, dev_priv
->ggtt
.stolen_size
));
517 /* We hide that we have no struct page backing our stolen object
518 * by wrapping the contiguous physical allocation with a fake
519 * dma mapping in a single scatterlist.
522 st
= kmalloc(sizeof(*st
), GFP_KERNEL
);
524 return ERR_PTR(-ENOMEM
);
526 if (sg_alloc_table(st
, 1, GFP_KERNEL
)) {
528 return ERR_PTR(-ENOMEM
);
535 sg_dma_address(sg
) = (dma_addr_t
)dev_priv
->mm
.stolen_base
+ offset
;
536 sg_dma_len(sg
) = size
;
/*
 * get_pages hook for stolen objects: returns the sg_table produced by
 * i915_pages_create_for_stolen() for @obj's device.
 *
 * NOTE(review): the remaining arguments of that call are missing from this
 * excerpt.
 */
541 static struct sg_table
*
542 i915_gem_object_get_pages_stolen(struct drm_i915_gem_object
*obj
)
544 return i915_pages_create_for_stolen(obj
->base
.dev
,
/*
 * put_pages hook for stolen objects: releases @pages with sg_free_table().
 *
 * NOTE(review): lines following the sg_free_table() call are missing from
 * this excerpt, so any further cleanup of @pages cannot be confirmed here.
 */
549 static void i915_gem_object_put_pages_stolen(struct drm_i915_gem_object
*obj
,
550 struct sg_table
*pages
)
552 /* Should only be called from i915_gem_object_release_stolen() */
553 sg_free_table(pages
);
/*
 * release hook for stolen objects: takes the node pointer out of
 * obj->stolen with fetch_and_zero(), unpins the object's pages via
 * __i915_gem_object_unpin_pages() and removes the node from the stolen
 * allocator with i915_gem_stolen_remove_node().
 *
 * NOTE(review): the return-type line and some body lines are missing from
 * this excerpt; whether the node itself is freed here cannot be confirmed.
 */
558 i915_gem_object_release_stolen(struct drm_i915_gem_object
*obj
)
560 struct drm_i915_private
*dev_priv
= to_i915(obj
->base
.dev
);
561 struct drm_mm_node
*stolen
= fetch_and_zero(&obj
->stolen
);
565 __i915_gem_object_unpin_pages(obj
);
567 i915_gem_stolen_remove_node(dev_priv
, stolen
);
/*
 * Object operations for stolen-backed GEM objects: wires the get_pages,
 * put_pages and release hooks to the *_stolen handlers defined above.
 */
571 static const struct drm_i915_gem_object_ops i915_gem_object_stolen_ops
= {
572 .get_pages
= i915_gem_object_get_pages_stolen
,
573 .put_pages
= i915_gem_object_put_pages_stolen
,
574 .release
= i915_gem_object_release_stolen
,
/*
 * Wrap an already-allocated stolen node in a GEM object.
 *
 * Allocates the object with i915_gem_object_alloc(), initialises it as a
 * private GEM object of stolen->size bytes using
 * i915_gem_object_stolen_ops, stores @stolen in obj->stolen, sets the read
 * domains to CPU | GTT, picks I915_CACHE_LLC when HAS_LLC() is true
 * (I915_CACHE_NONE otherwise), marks the object cache_coherent and pins
 * its pages. i915_gem_object_free() is called on a path that follows the
 * pin attempt.
 *
 * NOTE(review): the allocation-failure check, the return statements and
 * the label preceding i915_gem_object_free() are missing from this excerpt.
 */
577 static struct drm_i915_gem_object
*
578 _i915_gem_object_create_stolen(struct drm_i915_private
*dev_priv
,
579 struct drm_mm_node
*stolen
)
581 struct drm_i915_gem_object
*obj
;
583 obj
= i915_gem_object_alloc(dev_priv
);
587 drm_gem_private_object_init(&dev_priv
->drm
, &obj
->base
, stolen
->size
);
588 i915_gem_object_init(obj
, &i915_gem_object_stolen_ops
);
590 obj
->stolen
= stolen
;
591 obj
->base
.read_domains
= I915_GEM_DOMAIN_CPU
| I915_GEM_DOMAIN_GTT
;
592 obj
->cache_level
= HAS_LLC(dev_priv
) ? I915_CACHE_LLC
: I915_CACHE_NONE
;
593 obj
->cache_coherent
= true; /* assumptions! more like cache_oblivious */
595 if (i915_gem_object_pin_pages(obj
))
601 i915_gem_object_free(obj
);
/*
 * Allocate @size bytes from stolen memory and wrap them in a GEM object.
 *
 * The stolen allocator is tested with drm_mm_initialized(); a drm_mm_node
 * is allocated with kzalloc() and inserted with
 * i915_gem_stolen_insert_node() using an alignment of 4096; the object is
 * then built by _i915_gem_object_create_stolen(). The node is removed again
 * via i915_gem_stolen_remove_node() on a path following object creation.
 *
 * NOTE(review): the error checks, the return statements and the freeing of
 * the node are missing from this excerpt, so the return value on failure
 * cannot be confirmed from here.
 */
605 struct drm_i915_gem_object
*
606 i915_gem_object_create_stolen(struct drm_i915_private
*dev_priv
, u32 size
)
608 struct drm_i915_gem_object
*obj
;
609 struct drm_mm_node
*stolen
;
612 if (!drm_mm_initialized(&dev_priv
->mm
.stolen
))
618 stolen
= kzalloc(sizeof(*stolen
), GFP_KERNEL
);
622 ret
= i915_gem_stolen_insert_node(dev_priv
, stolen
, size
, 4096);
628 obj
= _i915_gem_object_create_stolen(dev_priv
, stolen
);
632 i915_gem_stolen_remove_node(dev_priv
, stolen
);
637 struct drm_i915_gem_object
*
638 i915_gem_object_create_stolen_for_preallocated(struct drm_i915_private
*dev_priv
,
643 struct i915_ggtt
*ggtt
= &dev_priv
->ggtt
;
644 struct drm_i915_gem_object
*obj
;
645 struct drm_mm_node
*stolen
;
646 struct i915_vma
*vma
;
649 if (!drm_mm_initialized(&dev_priv
->mm
.stolen
))
652 lockdep_assert_held(&dev_priv
->drm
.struct_mutex
);
654 DRM_DEBUG_KMS("creating preallocated stolen object: stolen_offset=%x, gtt_offset=%x, size=%x\n",
655 stolen_offset
, gtt_offset
, size
);
657 /* KISS and expect everything to be page-aligned */
658 if (WARN_ON(size
== 0) ||
659 WARN_ON(!IS_ALIGNED(size
, I915_GTT_PAGE_SIZE
)) ||
660 WARN_ON(!IS_ALIGNED(stolen_offset
, I915_GTT_MIN_ALIGNMENT
)))
663 stolen
= kzalloc(sizeof(*stolen
), GFP_KERNEL
);
667 stolen
->start
= stolen_offset
;
669 mutex_lock(&dev_priv
->mm
.stolen_lock
);
670 ret
= drm_mm_reserve_node(&dev_priv
->mm
.stolen
, stolen
);
671 mutex_unlock(&dev_priv
->mm
.stolen_lock
);
673 DRM_DEBUG_KMS("failed to allocate stolen space\n");
678 obj
= _i915_gem_object_create_stolen(dev_priv
, stolen
);
680 DRM_DEBUG_KMS("failed to allocate stolen object\n");
681 i915_gem_stolen_remove_node(dev_priv
, stolen
);
686 /* Some objects just need physical mem from stolen space */
687 if (gtt_offset
== I915_GTT_OFFSET_NONE
)
690 ret
= i915_gem_object_pin_pages(obj
);
694 vma
= i915_vma_instance(obj
, &ggtt
->base
, NULL
);
700 /* To simplify the initialisation sequence between KMS and GTT,
701 * we allow construction of the stolen object prior to
702 * setting up the GTT space. The actual reservation will occur
705 ret
= i915_gem_gtt_reserve(&ggtt
->base
, &vma
->node
,
706 size
, gtt_offset
, obj
->cache_level
,
709 DRM_DEBUG_KMS("failed to allocate stolen GTT space\n");
713 GEM_BUG_ON(!drm_mm_node_allocated(&vma
->node
));
715 vma
->pages
= obj
->mm
.pages
;
716 vma
->flags
|= I915_VMA_GLOBAL_BIND
;
717 __i915_vma_set_map_and_fenceable(vma
);
718 list_move_tail(&vma
->vm_link
, &ggtt
->base
.inactive_list
);
719 list_move_tail(&obj
->global_link
, &dev_priv
->mm
.bound_list
);
725 i915_gem_object_unpin_pages(obj
);
727 i915_gem_object_put(obj
);