2 * Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Kevin Tian <kevin.tian@intel.com>
25 * Eddie Dong <eddie.dong@intel.com>
28 * Niu Bing <bing.niu@intel.com>
29 * Zhi Wang <zhi.a.wang@intel.com>
37 #include "hypercall.h"
40 #include "interrupt.h"
45 #include "scheduler.h"
46 #include "sched_policy.h"
48 #include "cmd_parser.h"
50 #define GVT_MAX_VGPU 8
53 INTEL_GVT_HYPERVISOR_XEN
= 0,
54 INTEL_GVT_HYPERVISOR_KVM
,
57 struct intel_gvt_host
{
60 struct intel_gvt_mpt
*mpt
;
63 extern struct intel_gvt_host intel_gvt_host
;
65 /* Describe per-platform limitations. */
66 struct intel_gvt_device_info
{
67 u32 max_support_vgpus
;
71 unsigned long msi_cap_offset
;
74 u32 gtt_entry_size_shift
;
75 int gmadr_bytes_in_cmd
;
79 /* GM resources owned by a vGPU */
80 struct intel_vgpu_gm
{
83 struct drm_mm_node low_gm_node
;
84 struct drm_mm_node high_gm_node
;
87 #define INTEL_GVT_MAX_NUM_FENCES 32
89 /* Fences owned by a vGPU */
90 struct intel_vgpu_fence
{
91 struct drm_i915_fence_reg
*regs
[INTEL_GVT_MAX_NUM_FENCES
];
96 struct intel_vgpu_mmio
{
99 bool disable_warn_untrack
;
102 #define INTEL_GVT_MAX_CFG_SPACE_SZ 256
103 #define INTEL_GVT_MAX_BAR_NUM 4
105 struct intel_vgpu_pci_bar
{
110 struct intel_vgpu_cfg_space
{
111 unsigned char virtual_cfg_space
[INTEL_GVT_MAX_CFG_SPACE_SZ
];
112 struct intel_vgpu_pci_bar bar
[INTEL_GVT_MAX_BAR_NUM
];
115 #define vgpu_cfg_space(vgpu) ((vgpu)->cfg_space.virtual_cfg_space)
117 #define INTEL_GVT_MAX_PIPE 4
119 struct intel_vgpu_irq
{
120 bool irq_warn_once
[INTEL_GVT_EVENT_MAX
];
121 DECLARE_BITMAP(flip_done_event
[INTEL_GVT_MAX_PIPE
],
122 INTEL_GVT_EVENT_MAX
);
125 struct intel_vgpu_opregion
{
127 u32 gfn
[INTEL_GVT_OPREGION_PAGES
];
128 struct page
*pages
[INTEL_GVT_OPREGION_PAGES
];
/*
 * Address of the opregion member of the object @vgpu points to. The argument
 * is parenthesized so any pointer-valued expression (e.g. &obj) is accepted.
 */
#define vgpu_opregion(vgpu) (&((vgpu)->opregion))
133 #define INTEL_GVT_MAX_PORT 5
135 struct intel_vgpu_display
{
136 struct intel_vgpu_i2c_edid i2c_edid
;
137 struct intel_vgpu_port ports
[INTEL_GVT_MAX_PORT
];
138 struct intel_vgpu_sbi sbi
;
141 struct vgpu_sched_ctl
{
146 struct intel_gvt
*gvt
;
148 unsigned long handle
; /* vGPU handle used by hypervisor MPT modules */
152 unsigned int resetting_eng
;
154 struct vgpu_sched_ctl sched_ctl
;
156 struct intel_vgpu_fence fence
;
157 struct intel_vgpu_gm gm
;
158 struct intel_vgpu_cfg_space cfg_space
;
159 struct intel_vgpu_mmio mmio
;
160 struct intel_vgpu_irq irq
;
161 struct intel_vgpu_gtt gtt
;
162 struct intel_vgpu_opregion opregion
;
163 struct intel_vgpu_display display
;
164 struct intel_vgpu_execlist execlist
[I915_NUM_ENGINES
];
165 struct list_head workload_q_head
[I915_NUM_ENGINES
];
166 struct kmem_cache
*workloads
;
167 atomic_t running_workload_num
;
168 DECLARE_BITMAP(tlb_handle_pending
, I915_NUM_ENGINES
);
169 struct i915_gem_context
*shadow_ctx
;
171 #if IS_ENABLED(CONFIG_DRM_I915_GVT_KVMGT)
173 struct mdev_device
*mdev
;
174 struct vfio_region
*region
;
176 struct eventfd_ctx
*intx_trigger
;
177 struct eventfd_ctx
*msi_trigger
;
178 struct rb_root cache
;
179 struct mutex cache_lock
;
180 struct notifier_block iommu_notifier
;
181 struct notifier_block group_notifier
;
183 struct work_struct release_work
;
189 struct intel_gvt_gm
{
190 unsigned long vgpu_allocated_low_gm_size
;
191 unsigned long vgpu_allocated_high_gm_size
;
194 struct intel_gvt_fence
{
195 unsigned long vgpu_allocated_fence_num
;
198 /* Special MMIO blocks. */
199 struct gvt_mmio_block
{
207 #define INTEL_GVT_MMIO_HASH_BITS 11
209 struct intel_gvt_mmio
{
211 /* Register contains RO bits */
212 #define F_RO (1 << 0)
213 /* Register contains graphics address */
214 #define F_GMADR (1 << 1)
215 /* Mode mask registers with high 16 bits as the mask bits */
216 #define F_MODE_MASK (1 << 2)
217 /* This reg can be accessed by GPU commands */
218 #define F_CMD_ACCESS (1 << 3)
219 /* This reg has been accessed by a VM */
220 #define F_ACCESSED (1 << 4)
221 /* This reg has been accessed through GPU commands */
222 #define F_CMD_ACCESSED (1 << 5)
223 /* This reg could be accessed by unaligned address */
224 #define F_UNALIGN (1 << 6)
226 struct gvt_mmio_block
*mmio_block
;
227 unsigned int num_mmio_block
;
229 DECLARE_HASHTABLE(mmio_info_table
, INTEL_GVT_MMIO_HASH_BITS
);
230 unsigned int num_tracked_mmio
;
233 struct intel_gvt_firmware
{
236 bool firmware_loaded
;
239 struct intel_gvt_opregion
{
244 #define NR_MAX_INTEL_VGPU_TYPES 20
245 struct intel_vgpu_type
{
247 unsigned int avail_instance
;
248 unsigned int low_gm_size
;
249 unsigned int high_gm_size
;
252 enum intel_vgpu_edid resolution
;
257 struct drm_i915_private
*dev_priv
;
258 struct idr vgpu_idr
; /* vGPU IDR pool */
260 struct intel_gvt_device_info device_info
;
261 struct intel_gvt_gm gm
;
262 struct intel_gvt_fence fence
;
263 struct intel_gvt_mmio mmio
;
264 struct intel_gvt_firmware firmware
;
265 struct intel_gvt_irq irq
;
266 struct intel_gvt_gtt gtt
;
267 struct intel_gvt_opregion opregion
;
268 struct intel_gvt_workload_scheduler scheduler
;
269 struct notifier_block shadow_ctx_notifier_block
[I915_NUM_ENGINES
];
270 DECLARE_HASHTABLE(cmd_table
, GVT_CMD_HASH_BITS
);
271 struct intel_vgpu_type
*types
;
272 unsigned int num_types
;
273 struct intel_vgpu
*idle_vgpu
;
275 struct task_struct
*service_thread
;
276 wait_queue_head_t service_thread_wq
;
277 unsigned long service_request
;
280 static inline struct intel_gvt
*to_gvt(struct drm_i915_private
*i915
)
286 INTEL_GVT_REQUEST_EMULATE_VBLANK
= 0,
288 /* Scheduling triggered by timer */
289 INTEL_GVT_REQUEST_SCHED
= 1,
291 /* Scheduling triggered by event */
292 INTEL_GVT_REQUEST_EVENT_SCHED
= 2,
295 static inline void intel_gvt_request_service(struct intel_gvt
*gvt
,
298 set_bit(service
, (void *)&gvt
->service_request
);
299 wake_up(&gvt
->service_thread_wq
);
302 void intel_gvt_free_firmware(struct intel_gvt
*gvt
);
303 int intel_gvt_load_firmware(struct intel_gvt
*gvt
);
/*
 * Megabyte <-> byte conversion helpers, and the host low/high GM sizes
 * expressed in bytes (128MB and 384MB).
 *
 * MB_TO_BYTES() widens its argument to 64 bits before shifting: the type of
 * a shift result follows the (promoted) left operand, so a suffix on the
 * shift count alone does not stop a plain int argument such as 4096 from
 * overflowing. BYTES_TO_MB() keeps the type of its argument.
 */
#define MB_TO_BYTES(mb) ((unsigned long long)(mb) << 20)
#define BYTES_TO_MB(b) ((b) >> 20)

#define HOST_LOW_GM_SIZE MB_TO_BYTES(128)
#define HOST_HIGH_GM_SIZE MB_TO_BYTES(384)
/*
 * Aperture/GM space definitions for the GVT device.
 *
 * Each macro expects a pointer whose target has a dev_priv member. The
 * argument is parenthesized in every expansion so that any pointer-valued
 * expression (for example &obj) can be passed safely.
 */
#define gvt_aperture_sz(gvt)	  ((gvt)->dev_priv->ggtt.mappable_end)
#define gvt_aperture_pa_base(gvt) ((gvt)->dev_priv->ggtt.mappable_base)

#define gvt_ggtt_gm_sz(gvt)	  ((gvt)->dev_priv->ggtt.base.total)
/*
 * GM size in PAGE_SHIFT-sized pages, times 8 (<< 3).
 * NOTE(review): presumably 8 bytes per GTT entry - confirm.
 */
#define gvt_ggtt_sz(gvt) \
	((((gvt)->dev_priv->ggtt.base.total) >> PAGE_SHIFT) << 3)
/* Part of the GM that is not covered by the aperture. */
#define gvt_hidden_sz(gvt)	  (gvt_ggtt_gm_sz(gvt) - gvt_aperture_sz(gvt))

/* The aperture range starts at graphics address 0 (inclusive end). */
#define gvt_aperture_gmadr_base(gvt) (0)
#define gvt_aperture_gmadr_end(gvt) (gvt_aperture_gmadr_base(gvt) \
				     + gvt_aperture_sz(gvt) - 1)

/* The hidden range begins right after the aperture (inclusive end). */
#define gvt_hidden_gmadr_base(gvt) (gvt_aperture_gmadr_base(gvt) \
				    + gvt_aperture_sz(gvt))
#define gvt_hidden_gmadr_end(gvt) (gvt_hidden_gmadr_base(gvt) \
				   + gvt_hidden_sz(gvt) - 1)

#define gvt_fence_sz(gvt) ((gvt)->dev_priv->num_fence_regs)
/*
 * Aperture/GM space definitions for a vGPU.
 *
 * Each macro takes a pointer to the vGPU object and reads its gm / fence
 * members. The argument is parenthesized in every expansion so that any
 * pointer-valued expression (for example &obj) can be passed safely.
 * All *_end values are inclusive (base + size - 1).
 */
#define vgpu_aperture_offset(vgpu)	((vgpu)->gm.low_gm_node.start)
#define vgpu_hidden_offset(vgpu)	((vgpu)->gm.high_gm_node.start)
#define vgpu_aperture_sz(vgpu)		((vgpu)->gm.aperture_sz)
#define vgpu_hidden_sz(vgpu)		((vgpu)->gm.hidden_sz)

/* Aperture base of the owning GVT device plus this vGPU's aperture offset. */
#define vgpu_aperture_pa_base(vgpu) \
	(gvt_aperture_pa_base((vgpu)->gvt) + vgpu_aperture_offset(vgpu))

#define vgpu_ggtt_gm_sz(vgpu) ((vgpu)->gm.aperture_sz + (vgpu)->gm.hidden_sz)

#define vgpu_aperture_pa_end(vgpu) \
	(vgpu_aperture_pa_base(vgpu) + vgpu_aperture_sz(vgpu) - 1)

#define vgpu_aperture_gmadr_base(vgpu) (vgpu_aperture_offset(vgpu))
#define vgpu_aperture_gmadr_end(vgpu) \
	(vgpu_aperture_gmadr_base(vgpu) + vgpu_aperture_sz(vgpu) - 1)

#define vgpu_hidden_gmadr_base(vgpu) (vgpu_hidden_offset(vgpu))
#define vgpu_hidden_gmadr_end(vgpu) \
	(vgpu_hidden_gmadr_base(vgpu) + vgpu_hidden_sz(vgpu) - 1)

#define vgpu_fence_base(vgpu) ((vgpu)->fence.base)
#define vgpu_fence_sz(vgpu) ((vgpu)->fence.size)
358 struct intel_vgpu_creation_params
{
360 __u64 low_gm_sz
; /* in MB */
361 __u64 high_gm_sz
; /* in MB */
370 int intel_vgpu_alloc_resource(struct intel_vgpu
*vgpu
,
371 struct intel_vgpu_creation_params
*param
);
372 void intel_vgpu_reset_resource(struct intel_vgpu
*vgpu
);
373 void intel_vgpu_free_resource(struct intel_vgpu
*vgpu
);
374 void intel_vgpu_write_fence(struct intel_vgpu
*vgpu
,
375 u32 fence
, u64 value
);
/*
 * Macros for easily accessing vGPU virtual (vreg) / shadow (sreg) registers.
 *
 * Each macro expands to an lvalue of the indicated width (8/16/32/64 bits;
 * the unsuffixed forms are 32-bit) located INTEL_GVT_MMIO_OFFSET(reg) past
 * the start of vgpu->mmio.vreg or vgpu->mmio.sreg.
 * NOTE(review): the offset is in bytes only if vreg/sreg are byte-granular
 * pointers (void * / char *) - confirm against struct intel_vgpu_mmio.
 * The vgpu argument is parenthesized so that any pointer-valued expression
 * (for example &obj) can be passed safely.
 */
#define vgpu_vreg(vgpu, reg) \
	(*(u32 *)((vgpu)->mmio.vreg + INTEL_GVT_MMIO_OFFSET(reg)))
#define vgpu_vreg8(vgpu, reg) \
	(*(u8 *)((vgpu)->mmio.vreg + INTEL_GVT_MMIO_OFFSET(reg)))
#define vgpu_vreg16(vgpu, reg) \
	(*(u16 *)((vgpu)->mmio.vreg + INTEL_GVT_MMIO_OFFSET(reg)))
#define vgpu_vreg64(vgpu, reg) \
	(*(u64 *)((vgpu)->mmio.vreg + INTEL_GVT_MMIO_OFFSET(reg)))
#define vgpu_sreg(vgpu, reg) \
	(*(u32 *)((vgpu)->mmio.sreg + INTEL_GVT_MMIO_OFFSET(reg)))
#define vgpu_sreg8(vgpu, reg) \
	(*(u8 *)((vgpu)->mmio.sreg + INTEL_GVT_MMIO_OFFSET(reg)))
#define vgpu_sreg16(vgpu, reg) \
	(*(u16 *)((vgpu)->mmio.sreg + INTEL_GVT_MMIO_OFFSET(reg)))
#define vgpu_sreg64(vgpu, reg) \
	(*(u64 *)((vgpu)->mmio.sreg + INTEL_GVT_MMIO_OFFSET(reg)))
/*
 * Walk the entries of gvt->vgpu_idr with idr_for_each_entry(), guarding the
 * loop body with for_each_if() on the current entry's ->active field.
 * @gvt:  pointer to the object holding vgpu_idr
 * @vgpu: iteration cursor, assigned each entry in turn
 * @id:   integer cursor handed to idr_for_each_entry()
 * The vgpu argument is parenthesized in the ->active test so that any
 * pointer-valued expression can be used as the cursor.
 */
#define for_each_active_vgpu(gvt, vgpu, id) \
	idr_for_each_entry((&(gvt)->vgpu_idr), (vgpu), (id)) \
		for_each_if((vgpu)->active)
399 static inline void intel_vgpu_write_pci_bar(struct intel_vgpu
*vgpu
,
400 u32 offset
, u32 val
, bool low
)
404 /* BAR offset should be 32-bit aligned */
405 offset
= rounddown(offset
, 4);
406 pval
= (u32
*)(vgpu_cfg_space(vgpu
) + offset
);
410 * only update bit 31 - bit 4,
411 * leave the bit 3 - bit 0 unchanged.
413 *pval
= (val
& GENMASK(31, 4)) | (*pval
& GENMASK(3, 0));
419 int intel_gvt_init_vgpu_types(struct intel_gvt
*gvt
);
420 void intel_gvt_clean_vgpu_types(struct intel_gvt
*gvt
);
422 struct intel_vgpu
*intel_gvt_create_idle_vgpu(struct intel_gvt
*gvt
);
423 void intel_gvt_destroy_idle_vgpu(struct intel_vgpu
*vgpu
);
424 struct intel_vgpu
*intel_gvt_create_vgpu(struct intel_gvt
*gvt
,
425 struct intel_vgpu_type
*type
);
426 void intel_gvt_destroy_vgpu(struct intel_vgpu
*vgpu
);
427 void intel_gvt_reset_vgpu_locked(struct intel_vgpu
*vgpu
, bool dmlr
,
428 unsigned int engine_mask
);
429 void intel_gvt_reset_vgpu(struct intel_vgpu
*vgpu
);
430 void intel_gvt_activate_vgpu(struct intel_vgpu
*vgpu
);
431 void intel_gvt_deactivate_vgpu(struct intel_vgpu
*vgpu
);
/*
 * Graphics memory address (gmadr) range checks.
 *
 * The vgpu_* variants compare an address against the aperture / hidden
 * ranges of one vGPU, the gvt_* variants against those of the GVT device;
 * both bounds are inclusive. gmadr is parenthesized in every expansion so
 * that a compound argument (e.g. "addr & mask") is compared as a whole.
 * gmadr is evaluated more than once, so avoid arguments with side effects.
 */
#define vgpu_gmadr_is_aperture(vgpu, gmadr) \
	(((gmadr) >= vgpu_aperture_gmadr_base(vgpu)) && \
	 ((gmadr) <= vgpu_aperture_gmadr_end(vgpu)))

#define vgpu_gmadr_is_hidden(vgpu, gmadr) \
	(((gmadr) >= vgpu_hidden_gmadr_base(vgpu)) && \
	 ((gmadr) <= vgpu_hidden_gmadr_end(vgpu)))

/* Valid means: inside either the aperture or the hidden range. */
#define vgpu_gmadr_is_valid(vgpu, gmadr) \
	((vgpu_gmadr_is_aperture(vgpu, gmadr) || \
	  (vgpu_gmadr_is_hidden(vgpu, gmadr))))

#define gvt_gmadr_is_aperture(gvt, gmadr) \
	(((gmadr) >= gvt_aperture_gmadr_base(gvt)) && \
	 ((gmadr) <= gvt_aperture_gmadr_end(gvt)))

#define gvt_gmadr_is_hidden(gvt, gmadr) \
	(((gmadr) >= gvt_hidden_gmadr_base(gvt)) && \
	 ((gmadr) <= gvt_hidden_gmadr_end(gvt)))

#define gvt_gmadr_is_valid(gvt, gmadr) \
	(gvt_gmadr_is_aperture(gvt, gmadr) || \
	 gvt_gmadr_is_hidden(gvt, gmadr))
458 bool intel_gvt_ggtt_validate_range(struct intel_vgpu
*vgpu
, u64 addr
, u32 size
);
459 int intel_gvt_ggtt_gmadr_g2h(struct intel_vgpu
*vgpu
, u64 g_addr
, u64
*h_addr
);
460 int intel_gvt_ggtt_gmadr_h2g(struct intel_vgpu
*vgpu
, u64 h_addr
, u64
*g_addr
);
461 int intel_gvt_ggtt_index_g2h(struct intel_vgpu
*vgpu
, unsigned long g_index
,
462 unsigned long *h_index
);
463 int intel_gvt_ggtt_h2g_index(struct intel_vgpu
*vgpu
, unsigned long h_index
,
464 unsigned long *g_index
);
466 void intel_vgpu_init_cfg_space(struct intel_vgpu
*vgpu
,
468 void intel_vgpu_reset_cfg_space(struct intel_vgpu
*vgpu
);
470 int intel_vgpu_emulate_cfg_read(struct intel_vgpu
*vgpu
, unsigned int offset
,
471 void *p_data
, unsigned int bytes
);
473 int intel_vgpu_emulate_cfg_write(struct intel_vgpu
*vgpu
, unsigned int offset
,
474 void *p_data
, unsigned int bytes
);
476 void intel_gvt_clean_opregion(struct intel_gvt
*gvt
);
477 int intel_gvt_init_opregion(struct intel_gvt
*gvt
);
479 void intel_vgpu_clean_opregion(struct intel_vgpu
*vgpu
);
480 int intel_vgpu_init_opregion(struct intel_vgpu
*vgpu
, u32 gpa
);
482 int intel_vgpu_emulate_opregion_request(struct intel_vgpu
*vgpu
, u32 swsci
);
483 void populate_pvinfo_page(struct intel_vgpu
*vgpu
);
485 struct intel_gvt_ops
{
486 int (*emulate_cfg_read
)(struct intel_vgpu
*, unsigned int, void *,
488 int (*emulate_cfg_write
)(struct intel_vgpu
*, unsigned int, void *,
490 int (*emulate_mmio_read
)(struct intel_vgpu
*, u64
, void *,
492 int (*emulate_mmio_write
)(struct intel_vgpu
*, u64
, void *,
494 struct intel_vgpu
*(*vgpu_create
)(struct intel_gvt
*,
495 struct intel_vgpu_type
*);
496 void (*vgpu_destroy
)(struct intel_vgpu
*);
497 void (*vgpu_reset
)(struct intel_vgpu
*);
498 void (*vgpu_activate
)(struct intel_vgpu
*);
499 void (*vgpu_deactivate
)(struct intel_vgpu
*);
504 GVT_FAILSAFE_UNSUPPORTED_GUEST
,
505 GVT_FAILSAFE_INSUFFICIENT_RESOURCE
,
508 static inline void mmio_hw_access_pre(struct drm_i915_private
*dev_priv
)
510 intel_runtime_pm_get(dev_priv
);
513 static inline void mmio_hw_access_post(struct drm_i915_private
*dev_priv
)
515 intel_runtime_pm_put(dev_priv
);
519 * intel_gvt_mmio_set_accessed - mark a MMIO as accessed
521 * @offset: register offset
524 static inline void intel_gvt_mmio_set_accessed(
525 struct intel_gvt
*gvt
, unsigned int offset
)
527 gvt
->mmio
.mmio_attribute
[offset
>> 2] |= F_ACCESSED
;
531 * intel_gvt_mmio_is_cmd_access - check whether a MMIO could be accessed by command
533 * @offset: register offset
536 static inline bool intel_gvt_mmio_is_cmd_access(
537 struct intel_gvt
*gvt
, unsigned int offset
)
539 return gvt
->mmio
.mmio_attribute
[offset
>> 2] & F_CMD_ACCESS
;
543 * intel_gvt_mmio_is_unalign - check whether a MMIO could be accessed unaligned
545 * @offset: register offset
548 static inline bool intel_gvt_mmio_is_unalign(
549 struct intel_gvt
*gvt
, unsigned int offset
)
551 return gvt
->mmio
.mmio_attribute
[offset
>> 2] & F_UNALIGN
;
555 * intel_gvt_mmio_set_cmd_accessed - mark a MMIO as accessed by command
557 * @offset: register offset
560 static inline void intel_gvt_mmio_set_cmd_accessed(
561 struct intel_gvt
*gvt
, unsigned int offset
)
563 gvt
->mmio
.mmio_attribute
[offset
>> 2] |= F_CMD_ACCESSED
;
567 * intel_gvt_mmio_has_mode_mask - check whether a MMIO has a mode mask
569 * @offset: register offset
572 * True if a MMIO has a mode mask in its higher 16 bits, false if it doesn't.
575 static inline bool intel_gvt_mmio_has_mode_mask(
576 struct intel_gvt
*gvt
, unsigned int offset
)
578 return gvt
->mmio
.mmio_attribute
[offset
>> 2] & F_MODE_MASK
;