2 * Copyright 2014 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
23 #include "amdgpu_amdkfd.h"
24 #include "amd_shared.h"
27 #include "amdgpu_gfx.h"
28 #include <linux/module.h>
/*
 * Interface tables exchanged between amdgpu (KGD) and amdkfd (KFD).
 * kfd2kgd is assigned in amdgpu_amdkfd_load_interface(); the address of
 * kgd2kfd is passed to kgd2kfd_init() in amdgpu_amdkfd_init(), and the
 * pointer is then used to call into KFD (probe, device_init, suspend,
 * resume, ...).
 *
 * NOTE(review): kgd2kfd_init_p is declared here with a bool return type,
 * while amdgpu_amdkfd_init() declares a pointer of the same name with an
 * int return type under CONFIG_HSA_AMD_MODULE. That one looks like a local
 * that shadows this declaration -- confirm whether this one is still needed.
 */
30 const struct kfd2kgd_calls
*kfd2kgd
;
31 const struct kgd2kfd_calls
*kgd2kfd
;
32 bool (*kgd2kfd_init_p
)(unsigned, const struct kgd2kfd_calls
**);
/*
 * amdgpu_amdkfd_init - obtain the kgd2kfd call table from amdkfd.
 *
 * With CONFIG_HSA_AMD_MODULE the kgd2kfd_init symbol is looked up at run
 * time with symbol_request() and the result is compared against NULL
 * before it is called; with CONFIG_HSA_AMD kgd2kfd_init() is called
 * directly. Both paths pass KFD_INTERFACE_VERSION and the address of the
 * kgd2kfd pointer, and store the result in ret.
 *
 * NOTE(review): the condition that leads to symbol_put() and the return
 * statements are not visible in this view -- confirm the error handling
 * against the complete function.
 */
34 int amdgpu_amdkfd_init(void)
38 #if defined(CONFIG_HSA_AMD_MODULE)
39 int (*kgd2kfd_init_p
)(unsigned, const struct kgd2kfd_calls
**);
41 kgd2kfd_init_p
= symbol_request(kgd2kfd_init
);
43 if (kgd2kfd_init_p
== NULL
)
46 ret
= kgd2kfd_init_p(KFD_INTERFACE_VERSION
, &kgd2kfd
);
48 symbol_put(kgd2kfd_init
);
52 #elif defined(CONFIG_HSA_AMD)
53 ret
= kgd2kfd_init(KFD_INTERFACE_VERSION
, &kgd2kfd
);
/*
 * amdgpu_amdkfd_load_interface - select the kfd2kgd function table.
 *
 * Switches on adev->asic_type and sets the file-scope kfd2kgd pointer from
 * amdgpu_amdkfd_gfx_7_get_functions() (this assignment follows the
 * CONFIG_DRM_AMDGPU_CIK #ifdef) or amdgpu_amdkfd_gfx_8_0_get_functions().
 *
 * NOTE(review): the case labels and the bool return values are not visible
 * in this view -- confirm which ASICs map to which table and what is
 * returned for unsupported ones.
 */
64 bool amdgpu_amdkfd_load_interface(struct amdgpu_device
*adev
)
66 switch (adev
->asic_type
) {
67 #ifdef CONFIG_DRM_AMDGPU_CIK
69 kfd2kgd
= amdgpu_amdkfd_gfx_7_get_functions();
73 kfd2kgd
= amdgpu_amdkfd_gfx_8_0_get_functions();
/*
 * amdgpu_amdkfd_fini - tear down the amdkfd interface.
 *
 * Releases the kgd2kfd_init symbol with symbol_put(), the counterpart of
 * the symbol_request() in amdgpu_amdkfd_init().
 *
 * NOTE(review): any guard around this call is not visible in this view --
 * confirm it only runs when the symbol reference is actually held.
 */
82 void amdgpu_amdkfd_fini(void)
86 symbol_put(kgd2kfd_init
);
/*
 * amdgpu_amdkfd_device_probe - ask KFD to probe this device.
 *
 * Calls kgd2kfd->probe() with adev cast to struct kgd_dev * as the first
 * argument and stores the returned handle in adev->kfd.
 *
 * NOTE(review): the remaining probe() arguments are cut off in this view.
 */
90 void amdgpu_amdkfd_device_probe(struct amdgpu_device
*adev
)
93 adev
->kfd
= kgd2kfd
->probe((struct kgd_dev
*)adev
,
/*
 * amdgpu_amdkfd_device_init - describe the resources KFD may use and hand
 * them to kgd2kfd->device_init() together with adev->kfd.
 *
 * Fills a struct kgd2kfd_shared_resources:
 *  - compute_vmid_bitmap is 0xFF00; num_pipe_per_mec and
 *    num_queue_per_pipe are copied from adev->gfx.mec;
 *  - queue_bitmap is built with bitmap_complement() from
 *    adev->gfx.mec.queue_bitmap; if the KIQ ring is ready, the bit that
 *    amdgpu_gfx_queue_to_bit() reports for it is cleared as well;
 *  - every bit from num_pipe_per_mec * num_queue_per_pipe up to
 *    KGD_MAX_QUEUES is cleared in a clear_bit() loop, since only the
 *    first MEC can have compute queues;
 *  - the doorbell physical address, aperture size and start offset are
 *    filled in by amdgpu_doorbell_get_kfd_info().
 */
97 void amdgpu_amdkfd_device_init(struct amdgpu_device
*adev
)
102 struct kgd2kfd_shared_resources gpu_resources
= {
103 .compute_vmid_bitmap
= 0xFF00,
104 .num_pipe_per_mec
= adev
->gfx
.mec
.num_pipe_per_mec
,
105 .num_queue_per_pipe
= adev
->gfx
.mec
.num_queue_per_pipe
108 /* this is going to have a few of the MSBs set that we need to
110 bitmap_complement(gpu_resources
.queue_bitmap
,
111 adev
->gfx
.mec
.queue_bitmap
,
114 /* remove the KIQ bit as well */
115 if (adev
->gfx
.kiq
.ring
.ready
)
116 clear_bit(amdgpu_gfx_queue_to_bit(adev
,
117 adev
->gfx
.kiq
.ring
.me
- 1,
118 adev
->gfx
.kiq
.ring
.pipe
,
119 adev
->gfx
.kiq
.ring
.queue
),
120 gpu_resources
.queue_bitmap
);
122 /* According to linux/bitmap.h we shouldn't use bitmap_clear if
123 * nbits is not compile time constant */
124 last_valid_bit
= 1 /* only first MEC can have compute queues */
125 * adev
->gfx
.mec
.num_pipe_per_mec
126 * adev
->gfx
.mec
.num_queue_per_pipe
;
127 for (i
= last_valid_bit
; i
< KGD_MAX_QUEUES
; ++i
)
128 clear_bit(i
, gpu_resources
.queue_bitmap
);
130 amdgpu_doorbell_get_kfd_info(adev
,
131 &gpu_resources
.doorbell_physical_address
,
132 &gpu_resources
.doorbell_aperture_size
,
133 &gpu_resources
.doorbell_start_offset
);
135 kgd2kfd
->device_init(adev
->kfd
, &gpu_resources
);
/*
 * amdgpu_amdkfd_device_fini - tell KFD the device is going away.
 *
 * Forwards adev->kfd to kgd2kfd->device_exit().
 *
 * NOTE(review): any guard on adev->kfd is not visible in this view.
 */
139 void amdgpu_amdkfd_device_fini(struct amdgpu_device
*adev
)
142 kgd2kfd
->device_exit(adev
->kfd
);
/*
 * amdgpu_amdkfd_interrupt - forward an interrupt ring entry to KFD.
 *
 * Passes adev->kfd and the caller's ih_ring_entry pointer unchanged to
 * kgd2kfd->interrupt().
 *
 * NOTE(review): any guard on adev->kfd is not visible in this view.
 */
147 void amdgpu_amdkfd_interrupt(struct amdgpu_device
*adev
,
148 const void *ih_ring_entry
)
151 kgd2kfd
->interrupt(adev
->kfd
, ih_ring_entry
);
/*
 * amdgpu_amdkfd_suspend - forward a suspend request to KFD.
 *
 * Calls kgd2kfd->suspend() with adev->kfd.
 *
 * NOTE(review): any guard on adev->kfd is not visible in this view.
 */
154 void amdgpu_amdkfd_suspend(struct amdgpu_device
*adev
)
157 kgd2kfd
->suspend(adev
->kfd
);
/*
 * amdgpu_amdkfd_resume - forward a resume request to KFD.
 *
 * Calls kgd2kfd->resume() with adev->kfd and stores its result in r.
 *
 * NOTE(review): the initial value of r, any guard on adev->kfd and the
 * return statement are not visible in this view.
 */
160 int amdgpu_amdkfd_resume(struct amdgpu_device
*adev
)
165 r
= kgd2kfd
->resume(adev
->kfd
);
/*
 * alloc_gtt_mem - allocate a buffer object for amdkfd and report its GPU
 * address and kernel CPU mapping.
 *
 * kgd is cast to struct amdgpu_device * and mem_obj to struct kgd_mem **.
 * gpu_addr and cpu_ptr must not be NULL (enforced with BUG_ON). A struct
 * kgd_mem is kmalloc'ed and stored through mem_obj; the BO is created with
 * AMDGPU_GEM_DOMAIN_GTT and AMDGPU_GEM_CREATE_CPU_GTT_USWC, then reserved,
 * pinned and kmapped. *gpu_addr and *cpu_ptr are written from the kgd_mem
 * fields and the BO is unreserved again.
 *
 * The error labels fall through in reverse order of setup: unpin,
 * unreserve, then drop the BO reference.
 *
 * NOTE(review): no check of the kmalloc() result and no kfree() of the
 * kgd_mem on the error paths are visible in this view -- confirm that
 * *mem cannot be NULL-dereferenced or leaked when a step fails.
 */
170 int alloc_gtt_mem(struct kgd_dev
*kgd
, size_t size
,
171 void **mem_obj
, uint64_t *gpu_addr
,
174 struct amdgpu_device
*adev
= (struct amdgpu_device
*)kgd
;
175 struct kgd_mem
**mem
= (struct kgd_mem
**) mem_obj
;
179 BUG_ON(gpu_addr
== NULL
);
180 BUG_ON(cpu_ptr
== NULL
);
182 *mem
= kmalloc(sizeof(struct kgd_mem
), GFP_KERNEL
);
186 r
= amdgpu_bo_create(adev
, size
, PAGE_SIZE
, true, AMDGPU_GEM_DOMAIN_GTT
,
187 AMDGPU_GEM_CREATE_CPU_GTT_USWC
, NULL
, NULL
, &(*mem
)->bo
);
190 "failed to allocate BO for amdkfd (%d)\n", r
);
195 r
= amdgpu_bo_reserve((*mem
)->bo
, true);
197 dev_err(adev
->dev
, "(%d) failed to reserve bo for amdkfd\n", r
);
198 goto allocate_mem_reserve_bo_failed
;
201 r
= amdgpu_bo_pin((*mem
)->bo
, AMDGPU_GEM_DOMAIN_GTT
,
204 dev_err(adev
->dev
, "(%d) failed to pin bo for amdkfd\n", r
);
205 goto allocate_mem_pin_bo_failed
;
207 *gpu_addr
= (*mem
)->gpu_addr
;
209 r
= amdgpu_bo_kmap((*mem
)->bo
, &(*mem
)->cpu_ptr
);
212 "(%d) failed to map bo to kernel for amdkfd\n", r
);
213 goto allocate_mem_kmap_bo_failed
;
215 *cpu_ptr
= (*mem
)->cpu_ptr
;
217 amdgpu_bo_unreserve((*mem
)->bo
);
221 allocate_mem_kmap_bo_failed
:
222 amdgpu_bo_unpin((*mem
)->bo
);
223 allocate_mem_pin_bo_failed
:
224 amdgpu_bo_unreserve((*mem
)->bo
);
225 allocate_mem_reserve_bo_failed
:
226 amdgpu_bo_unref(&(*mem
)->bo
);
/*
 * free_gtt_mem - release a buffer obtained from alloc_gtt_mem().
 *
 * mem_obj is cast to struct kgd_mem *. The BO is reserved, kunmapped,
 * unpinned, unreserved and finally its reference is dropped, mirroring
 * the setup order in alloc_gtt_mem(). The kgd parameter is not used by
 * the visible statements.
 *
 * NOTE(review): the return value of amdgpu_bo_reserve() is ignored here;
 * confirm that kunmap/unpin are safe if the reserve fails.
 */
231 void free_gtt_mem(struct kgd_dev
*kgd
, void *mem_obj
)
233 struct kgd_mem
*mem
= (struct kgd_mem
*) mem_obj
;
237 amdgpu_bo_reserve(mem
->bo
, true);
238 amdgpu_bo_kunmap(mem
->bo
);
239 amdgpu_bo_unpin(mem
->bo
);
240 amdgpu_bo_unreserve(mem
->bo
);
241 amdgpu_bo_unref(&(mem
->bo
));
/*
 * get_vmem_size - report the device's VRAM size to KFD.
 *
 * Casts kgd to struct amdgpu_device * and returns adev->mc.real_vram_size.
 */
245 uint64_t get_vmem_size(struct kgd_dev
*kgd
)
247 struct amdgpu_device
*adev
=
248 (struct amdgpu_device
*)kgd
;
252 return adev
->mc
.real_vram_size
;
/*
 * get_gpu_clock_counter - read the GPU clock counter for KFD.
 *
 * If the gfx function table provides a get_gpu_clock_counter hook, the
 * value it returns for adev is returned.
 *
 * NOTE(review): the value returned when the hook is absent is not visible
 * in this view.
 */
255 uint64_t get_gpu_clock_counter(struct kgd_dev
*kgd
)
257 struct amdgpu_device
*adev
= (struct amdgpu_device
*)kgd
;
259 if (adev
->gfx
.funcs
->get_gpu_clock_counter
)
260 return adev
->gfx
.funcs
->get_gpu_clock_counter(adev
);
/*
 * get_max_engine_clock_in_mhz - report the maximum engine clock in MHz.
 *
 * Reads the sclk field of adev->pm.dpm.dyn_state.max_clock_voltage_on_ac
 * and converts it to MHz with an integer division.
 */
264 uint32_t get_max_engine_clock_in_mhz(struct kgd_dev
*kgd
)
266 struct amdgpu_device
*adev
= (struct amdgpu_device
*)kgd
;
268 /* The sclk is in units of 10 kHz, so dividing by 100 yields MHz */
269 return adev
->pm
.dpm
.dyn_state
.max_clock_voltage_on_ac
.sclk
/ 100;