@@ -1637,6 +1637,8 @@ static void i915_driver_release(struct drm_device *dev)
disable_rpm_wakeref_asserts(rpm);
+ i915_destroy_vgpu(dev_priv);
+
i915_gem_driver_release(dev_priv);
i915_ggtt_driver_release(dev_priv);
@@ -973,7 +973,9 @@ struct i915_virtual_gpu {
bool active;
u32 caps;
u32 pv_caps;
-};
+
+ struct i915_virtual_gpu_pv *pv;
+} __packed;
/* used in computing the new watermarks state */
struct intel_wm_config {
@@ -48,6 +48,7 @@ enum vgt_g2v_type {
VGT_G2V_PPGTT_L4_PAGE_TABLE_DESTROY,
VGT_G2V_EXECLIST_CONTEXT_CREATE,
VGT_G2V_EXECLIST_CONTEXT_DESTROY,
+ VGT_G2V_SHARED_PAGE_SETUP,
VGT_G2V_MAX,
};
@@ -112,7 +113,9 @@ struct vgt_if {
u32 pv_caps;
- u32 rsv7[0x200 - 25]; /* pad to one page */
+ u64 shared_page_gpa;
+
+ u32 rsv7[0x200 - 27]; /* pad to one page */
} __packed;
#define vgtif_offset(x) (offsetof(struct vgt_if, x))
@@ -107,6 +107,17 @@ void i915_detect_vgpu(struct drm_i915_private *dev_priv)
pci_iounmap(pdev, shared_area);
}
+/**
+ * i915_destroy_vgpu - release the vGPU PV shared page state
+ * @dev_priv: i915 device private
+ *
+ * Frees the shared page and the PV bookkeeping structure referenced by
+ * dev_priv->vgpu.pv. Does nothing when intel_vgpu_active() is false or no
+ * PV state has been installed. The pointer in dev_priv is cleared, so a
+ * repeated call is a no-op.
+ *
+ * NOTE(review): the host was given the page's physical address at setup
+ * time and is not told here that the page is going away - confirm that the
+ * host cannot touch the page after this point.
+ */
+void i915_destroy_vgpu(struct drm_i915_private *dev_priv)
+{
+	struct i915_virtual_gpu_pv *pv = dev_priv->vgpu.pv;
+
+	if (!intel_vgpu_active(dev_priv) || !pv)
+		return;
+
+	/* Unpublish first so nothing can reach the memory once it is freed. */
+	dev_priv->vgpu.pv = NULL;
+
+	__free_page(virt_to_page(pv->shared_page));
+	kfree(pv);
+}
+
bool intel_vgpu_has_full_ppgtt(struct drm_i915_private *dev_priv)
{
return dev_priv->vgpu.caps & VGT_CAPS_FULL_PPGTT;
@@ -311,6 +322,84 @@ int intel_vgt_balloon(struct i915_ggtt *ggtt)
* i915 vgpu PV support for Linux
*/
+/*
+ * intel_vgpu_setup_shared_page - set up the shared page for vGPU PV features
+ * @dev_priv: i915 device private
+ * @shared_area: mapping of the PVINFO (struct vgt_if) page
+ *
+ * Allocates one zeroed page and the guest-side bookkeeping structure, writes
+ * the page's physical address to the shared_page_gpa field of PVINFO, reads
+ * it back to verify, sends VGT_G2V_SHARED_PAGE_SETUP through g2v_notify and
+ * then checks the PV version found at the start of the page.
+ *
+ * On success dev_priv->vgpu.pv points at the new state with ->enabled set.
+ *
+ * Returns 0 on success, -ENOMEM if an allocation fails, or -EIO if the
+ * address read-back or the version check fails. On failure everything
+ * allocated here is freed and dev_priv->vgpu.pv is left untouched.
+ */
+static int intel_vgpu_setup_shared_page(struct drm_i915_private *dev_priv,
+					void __iomem *shared_area)
+{
+	void __iomem *addr;
+	struct i915_virtual_gpu_pv *pv;
+	struct gvt_shared_page *base;
+	u64 gpa;
+	u16 ver_maj, ver_min;
+	int ret;
+
+	/*
+	 * We allocate 1 page shared between guest and GVT for data exchange.
+	 *
+	 *   0       +-------------------------------+
+	 *           | head                          |
+	 *   PAGE/8  +-------------------------------+
+	 *           | PV ELSP                       |
+	 *   PAGE/4  +-------------------------------+
+	 *           | desc (SEND)                   |
+	 *           |                               |
+	 *   PAGE/2  +-------------------------------+
+	 *           | cmds (SEND)                   |
+	 *           |                               |
+	 *           |                               |
+	 *           |                               |
+	 *   PAGE    +-------------------------------+
+	 *
+	 * 0 offset: PV version area
+	 * PAGE/8 offset: per engine workload submission data area
+	 * PAGE/4 offset: PV command buffer command descriptor area
+	 * PAGE/2 offset: PV command buffer command data area
+	 */
+
+	base = (struct gvt_shared_page *)get_zeroed_page(GFP_KERNEL);
+	if (!base) {
+		dev_info(dev_priv->drm.dev, "out of memory for shared memory\n");
+		return -ENOMEM;
+	}
+
+	/*
+	 * Do every guest-side allocation before the page is handed to the
+	 * host, so an OOM here cannot leave the host holding the address of
+	 * a page we are about to free.
+	 */
+	pv = kzalloc(sizeof(*pv), GFP_KERNEL);
+	if (!pv) {
+		ret = -ENOMEM;
+		goto err_free_page;
+	}
+
+	/* pass guest memory pa address to GVT and then read back to verify */
+	gpa = __pa(base);
+	addr = shared_area + vgtif_offset(shared_page_gpa);
+	writeq(gpa, addr);
+	if (gpa != readq(addr)) {
+		dev_info(dev_priv->drm.dev, "passed shared_page_gpa failed\n");
+		ret = -EIO;
+		goto err_free_pv;
+	}
+
+	/* tell the host that the shared page address is in place */
+	addr = shared_area + vgtif_offset(g2v_notify);
+	writel(VGT_G2V_SHARED_PAGE_SETUP, addr);
+
+	/*
+	 * The page was zeroed at allocation, so a matching version here is
+	 * presumably filled in by the host while handling the notification.
+	 */
+	ver_maj = base->ver_major;
+	ver_min = base->ver_minor;
+	if (ver_maj != PV_MAJOR || ver_min != PV_MINOR) {
+		dev_info(dev_priv->drm.dev, "VGPU PV version incompatible\n");
+		ret = -EIO;
+		goto err_free_pv;
+	}
+
+	DRM_INFO("vgpu PV ver major %d and minor %d\n", ver_maj, ver_min);
+	pv->shared_page = base;
+	pv->enabled = true;
+	dev_priv->vgpu.pv = pv;
+	return 0;
+
+err_free_pv:
+	kfree(pv);
+err_free_page:
+	__free_page(virt_to_page(base));
+	return ret;
+}
+
/**
* intel_vgpu_check_pv_caps - detect virtual GPU PV capabilities
* @dev_priv: i915 device private
@@ -339,5 +428,11 @@ bool intel_vgpu_check_pv_caps(struct drm_i915_private *dev_priv,
if (!pvcaps)
return false;
+ if (intel_vgpu_setup_shared_page(dev_priv, shared_area)) {
+ dev_priv->vgpu.pv_caps = 0;
+ writel(0, shared_area + vgtif_offset(pv_caps));
+ return false;
+ }
+
return true;
}
@@ -27,7 +27,25 @@
#include "i915_drv.h"
#include "i915_pvinfo.h"
+#define PV_MAJOR 1
+#define PV_MINOR 0
+
+/*
+ * 4KB page shared between GVT and the VM; it could be allocated by the guest
+ * driver or sit at a fixed location in the PCI BAR 0 region. Offset 0 holds the PV version.
+ */
+struct gvt_shared_page {
+ u16 ver_major; /* compared against PV_MAJOR in intel_vgpu_setup_shared_page() */
+ u16 ver_minor; /* compared against PV_MINOR in intel_vgpu_setup_shared_page() */
+};
+
+struct i915_virtual_gpu_pv { /* guest-side PV state, referenced from i915_virtual_gpu.pv */
+ struct gvt_shared_page *shared_page; /* page allocated at setup; freed by i915_destroy_vgpu() */
+ bool enabled; /* set to true once shared page setup has succeeded */
+};
+
void i915_detect_vgpu(struct drm_i915_private *dev_priv);
+void i915_destroy_vgpu(struct drm_i915_private *dev_priv);
bool intel_vgpu_has_full_ppgtt(struct drm_i915_private *dev_priv);
To enable vgpu pv features, we need to set up a shared memory page which will be used for data exchange and is directly accessed by both the guest and the backend i915 driver, to avoid emulation trap cost. The guest i915 driver allocates this page and then passes its physical address to the backend i915 driver through a PVINFO register, so that the backend i915 driver can access this shared page memory without any trap cost, with the help of the hypervisor's read-guest-gpa functionality. The guest i915 driver sends a VGT_G2V_SHARED_PAGE_SETUP notification to the host GVT once the shared memory setup has finished. The layout of the shared_page, which is used for the pv features implementation, is also defined in this patch. v0: RFC. v1: addressed RFC comment to move both shared_page_lock and shared_page to i915_virtual_gpu structure. v2: packed i915_virtual_gpu structure. v3: added SHARED_PAGE_SETUP g2v notification for pv shared_page setup. v4: added intel_vgpu_setup_shared_page() in i915_vgpu_pv.c. v5: per engine desc data in shared memory. v6: added version support in shared memory (Zhenyu). v7: added new function i915_destroy_vgpu to free shared memory. Signed-off-by: Xiaolin Zhang <xiaolin.zhang@intel.com> --- drivers/gpu/drm/i915/i915_drv.c | 2 + drivers/gpu/drm/i915/i915_drv.h | 4 +- drivers/gpu/drm/i915/i915_pvinfo.h | 5 +- drivers/gpu/drm/i915/i915_vgpu.c | 95 ++++++++++++++++++++++++++++++++++++++ drivers/gpu/drm/i915/i915_vgpu.h | 18 ++++++++ 5 files changed, 122 insertions(+), 2 deletions(-)