/*
 * Copyright 2014 Advanced Micro Devices, Inc.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 */
/*
 * Authors:
 *    Christian König <christian.koenig@amd.com>
 */
#include <linux/firmware.h>
#include <linux/module.h>
#include <linux/mmu_notifier.h>
#include <linux/interval_tree.h>
#include <drm/drmP.h>
#include <drm/drm.h>

#include "amdgpu.h"
struct amdgpu_mn {
        /* constant after initialisation */
        struct amdgpu_device    *adev;
        struct mm_struct        *mm;
        struct mmu_notifier     mn;

        /* only used on destruction */
        struct work_struct      work;

        /* protected by adev->mn_lock */
        struct hlist_node       node;

        /* objects protected by lock */
        struct mutex            lock;
        struct rb_root          objects;
};
struct amdgpu_mn_node {
        struct interval_tree_node       it;
        struct list_head                bos;
};
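
/*
 * Summary of how the structures above are used by the rest of this file:
 * one amdgpu_mn exists per mm_struct and is looked up via adev->mn_hash
 * under adev->mn_lock; each amdgpu_mn_node covers one userptr address
 * range in rmn->objects (an interval tree) and chains the BOs backed by
 * that range on node->bos. Whenever both locks are needed, adev->mn_lock
 * is always taken before rmn->lock.
 */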
/**
 * amdgpu_mn_destroy - destroy the rmn
 *
 * @work: previously scheduled work item
 *
 * Lazily destroys the notifier from a work item.
 */
static void amdgpu_mn_destroy(struct work_struct *work)
{
        struct amdgpu_mn *rmn = container_of(work, struct amdgpu_mn, work);
        struct amdgpu_device *adev = rmn->adev;
        struct amdgpu_mn_node *node, *next_node;
        struct amdgpu_bo *bo, *next_bo;

        mutex_lock(&adev->mn_lock);
        mutex_lock(&rmn->lock);
        hash_del(&rmn->node);
        rbtree_postorder_for_each_entry_safe(node, next_node, &rmn->objects,
                                             it.rb) {
                list_for_each_entry_safe(bo, next_bo, &node->bos, mn_list) {
                        bo->mn = NULL;
                        list_del_init(&bo->mn_list);
                }
                kfree(node);
        }
        mutex_unlock(&rmn->lock);
        mutex_unlock(&adev->mn_lock);
        mmu_notifier_unregister_no_release(&rmn->mn, rmn->mm);
        kfree(rmn);
}
/**
 * amdgpu_mn_release - callback to notify about mm destruction
 *
 * @mn: our notifier
 * @mm: the mm this callback is about
 *
 * Schedule a work item to lazily destroy our notifier.
 */
static void amdgpu_mn_release(struct mmu_notifier *mn,
                              struct mm_struct *mm)
{
        struct amdgpu_mn *rmn = container_of(mn, struct amdgpu_mn, mn);

        INIT_WORK(&rmn->work, amdgpu_mn_destroy);
        schedule_work(&rmn->work);
}
/**
 * amdgpu_mn_invalidate_node - unmap all BOs of a node
 *
 * @node: the node with the BOs to unmap
 * @start: start of the affected address range
 * @end: end of the affected address range
 *
 * We block for all BOs and unmap them by moving them
 * into the system domain again.
 */
static void amdgpu_mn_invalidate_node(struct amdgpu_mn_node *node,
                                      unsigned long start,
                                      unsigned long end)
{
        struct amdgpu_bo *bo;
        long r;

        list_for_each_entry(bo, &node->bos, mn_list) {

                if (!amdgpu_ttm_tt_affect_userptr(bo->tbo.ttm, start, end))
                        continue;

                r = amdgpu_bo_reserve(bo, true);
                if (r) {
                        DRM_ERROR("(%ld) failed to reserve user bo\n", r);
                        continue;
                }

                r = reservation_object_wait_timeout_rcu(bo->tbo.resv,
                        true, false, MAX_SCHEDULE_TIMEOUT);
                if (r <= 0)
                        DRM_ERROR("(%ld) failed to wait for user bo\n", r);

                amdgpu_ttm_placement_from_domain(bo, AMDGPU_GEM_DOMAIN_CPU);
                r = ttm_bo_validate(&bo->tbo, &bo->placement, false, false);
                if (r)
                        DRM_ERROR("(%ld) failed to validate user bo\n", r);

                amdgpu_bo_unreserve(bo);
        }
}
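
/*
 * Validating the BO into AMDGPU_GEM_DOMAIN_CPU above makes TTM drop the
 * GTT binding, so the GPU no longer references the user pages by the time
 * the notifier callback returns and the kernel changes or frees them.
 */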
/**
 * amdgpu_mn_invalidate_page - callback to notify about mm change
 *
 * @mn: our notifier
 * @mm: the mm this callback is about
 * @address: address of the invalidated page
 *
 * Invalidation of a single page. Blocks for all BOs mapping it
 * and unmaps them by moving them into the system domain again.
 */
static void amdgpu_mn_invalidate_page(struct mmu_notifier *mn,
                                      struct mm_struct *mm,
                                      unsigned long address)
{
        struct amdgpu_mn *rmn = container_of(mn, struct amdgpu_mn, mn);
        struct interval_tree_node *it;

        mutex_lock(&rmn->lock);

        it = interval_tree_iter_first(&rmn->objects, address, address);
        if (it) {
                struct amdgpu_mn_node *node;

                node = container_of(it, struct amdgpu_mn_node, it);
                amdgpu_mn_invalidate_node(node, address, address);
        }

        mutex_unlock(&rmn->lock);
}
/**
 * amdgpu_mn_invalidate_range_start - callback to notify about mm change
 *
 * @mn: our notifier
 * @mm: the mm this callback is about
 * @start: start of updated range
 * @end: end of updated range
 *
 * We block for all BOs between start and end to be idle and
 * unmap them by moving them into the system domain again.
 */
static void amdgpu_mn_invalidate_range_start(struct mmu_notifier *mn,
                                             struct mm_struct *mm,
                                             unsigned long start,
                                             unsigned long end)
{
        struct amdgpu_mn *rmn = container_of(mn, struct amdgpu_mn, mn);
        struct interval_tree_node *it;

        /* notification is exclusive, but interval is inclusive */
        end -= 1;

        mutex_lock(&rmn->lock);

        it = interval_tree_iter_first(&rmn->objects, start, end);
        while (it) {
                struct amdgpu_mn_node *node;

                node = container_of(it, struct amdgpu_mn_node, it);
                it = interval_tree_iter_next(it, start, end);

                amdgpu_mn_invalidate_node(node, start, end);
        }

        mutex_unlock(&rmn->lock);
}
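
/*
 * The interval tree helpers used above (interval_tree_iter_first/next)
 * treat both bounds as inclusive, while the mmu_notifier range end is
 * exclusive; that is why the callback subtracts one from 'end' before
 * doing the lookup.
 */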
static const struct mmu_notifier_ops amdgpu_mn_ops = {
        .release = amdgpu_mn_release,
        .invalidate_page = amdgpu_mn_invalidate_page,
        .invalidate_range_start = amdgpu_mn_invalidate_range_start,
};
/**
 * amdgpu_mn_get - create notifier context
 *
 * @adev: amdgpu device pointer
 *
 * Creates a notifier context for current->mm.
 */
static struct amdgpu_mn *amdgpu_mn_get(struct amdgpu_device *adev)
{
        struct mm_struct *mm = current->mm;
        struct amdgpu_mn *rmn;
        int r;

        mutex_lock(&adev->mn_lock);
        if (down_write_killable(&mm->mmap_sem)) {
                mutex_unlock(&adev->mn_lock);
                return ERR_PTR(-EINTR);
        }

        hash_for_each_possible(adev->mn_hash, rmn, node, (unsigned long)mm)
                if (rmn->mm == mm)
                        goto release_locks;

        rmn = kzalloc(sizeof(*rmn), GFP_KERNEL);
        if (!rmn) {
                rmn = ERR_PTR(-ENOMEM);
                goto release_locks;
        }

        rmn->adev = adev;
        rmn->mm = mm;
        rmn->mn.ops = &amdgpu_mn_ops;
        mutex_init(&rmn->lock);
        rmn->objects = RB_ROOT;

        r = __mmu_notifier_register(&rmn->mn, mm);
        if (r)
                goto free_rmn;

        hash_add(adev->mn_hash, &rmn->node, (unsigned long)mm);

release_locks:
        up_write(&mm->mmap_sem);
        mutex_unlock(&adev->mn_lock);

        return rmn;

free_rmn:
        up_write(&mm->mmap_sem);
        mutex_unlock(&adev->mn_lock);
        kfree(rmn);

        return ERR_PTR(r);
}
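
/*
 * __mmu_notifier_register() expects mmap_sem to already be held for
 * writing, which is why amdgpu_mn_get() takes it explicitly; adev->mn_lock
 * additionally serializes the mn_hash lookup and insert against the lazy
 * destruction in amdgpu_mn_destroy().
 */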
/**
 * amdgpu_mn_register - register a BO for notifier updates
 *
 * @bo: amdgpu buffer object
 * @addr: userptr addr we should monitor
 *
 * Registers an MMU notifier for the given BO at the specified address.
 * Returns 0 on success, -ERRNO if anything goes wrong.
 */
int amdgpu_mn_register(struct amdgpu_bo *bo, unsigned long addr)
{
        unsigned long end = addr + amdgpu_bo_size(bo) - 1;
        struct amdgpu_device *adev = amdgpu_ttm_adev(bo->tbo.bdev);
        struct amdgpu_mn *rmn;
        struct amdgpu_mn_node *node = NULL;
        struct list_head bos;
        struct interval_tree_node *it;

        rmn = amdgpu_mn_get(adev);
        if (IS_ERR(rmn))
                return PTR_ERR(rmn);

        INIT_LIST_HEAD(&bos);

        mutex_lock(&rmn->lock);

        /* merge all existing nodes overlapping [addr, end] into one */
        while ((it = interval_tree_iter_first(&rmn->objects, addr, end))) {
                kfree(node);
                node = container_of(it, struct amdgpu_mn_node, it);
                interval_tree_remove(&node->it, &rmn->objects);
                addr = min(it->start, addr);
                end = max(it->last, end);
                list_splice(&node->bos, &bos);
        }

        if (!node) {
                node = kmalloc(sizeof(struct amdgpu_mn_node), GFP_KERNEL);
                if (!node) {
                        mutex_unlock(&rmn->lock);
                        return -ENOMEM;
                }
        }

        bo->mn = rmn;

        node->it.start = addr;
        node->it.last = end;
        INIT_LIST_HEAD(&node->bos);
        list_splice(&bos, &node->bos);
        list_add(&bo->mn_list, &node->bos);

        interval_tree_insert(&node->it, &rmn->objects);

        mutex_unlock(&rmn->lock);

        return 0;
}
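
/*
 * Usage sketch (illustrative only; 'args->addr' stands in for whatever
 * user address the caller has): after creating a userptr BO the caller
 * does
 *
 *      r = amdgpu_mn_register(bo, args->addr);
 *      if (r)
 *              goto error_free;
 *
 * and calls amdgpu_mn_unregister(bo) below again when the BO is destroyed.
 */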
/**
 * amdgpu_mn_unregister - unregister a BO for notifier updates
 *
 * @bo: amdgpu buffer object
 *
 * Remove any registration of MMU notifier updates from the buffer object.
 */
void amdgpu_mn_unregister(struct amdgpu_bo *bo)
{
        struct amdgpu_device *adev = amdgpu_ttm_adev(bo->tbo.bdev);
        struct amdgpu_mn *rmn;
        struct list_head *head;

        mutex_lock(&adev->mn_lock);

        rmn = bo->mn;
        if (rmn == NULL) {
                mutex_unlock(&adev->mn_lock);
                return;
        }

        mutex_lock(&rmn->lock);

        /* save the next list entry for later */
        head = bo->mn_list.next;

        bo->mn = NULL;
        list_del_init(&bo->mn_list);

        if (list_empty(head)) {
                struct amdgpu_mn_node *node;

                node = container_of(head, struct amdgpu_mn_node, bos);
                interval_tree_remove(&node->it, &rmn->objects);
                kfree(node);
        }

        mutex_unlock(&rmn->lock);
        mutex_unlock(&adev->mn_lock);
}