BACKPORT: FROMLIST: gunyah: vm_mgr: Add ioctls to support basic non-proxy VM boot

Add remaining ioctls to support non-proxy VM boot:

 - Gunyah Resource Manager uses the VM's devicetree to configure the
   virtual machine. The location of the devicetree in the guest's
   virtual memory can be declared via the SET_DTB_CONFIG ioctl.
 - Trigger start of the virtual machine with VM_START ioctl.

Co-developed-by: Prakruthi Deepak Heragu <quic_pheragu@quicinc.com>
Signed-off-by: Prakruthi Deepak Heragu <quic_pheragu@quicinc.com>
Signed-off-by: Elliot Berman <quic_eberman@quicinc.com>

Bug: 268234781
Link: https://lore.kernel.org/all/20230304010632.2127470-14-quic_eberman@quicinc.com/
Change-Id: Iade2105969dc9bde2274e124696a5fb914478236
[Elliot: fixup gh_vm_free flow to align with future v12 patch]
Signed-off-by: Elliot Berman <quic_eberman@quicinc.com>
This commit is contained in:
Elliot Berman
2022-10-17 16:24:17 -07:00
committed by Aleksei Vetrov
parent afe9d3b501
commit fa4e7824da
5 changed files with 287 additions and 13 deletions

View File

@@ -9,37 +9,124 @@
#include <linux/file.h>
#include <linux/gunyah_rsc_mgr.h>
#include <linux/miscdevice.h>
#include <linux/mm.h>
#include <linux/module.h>
#include <uapi/linux/gunyah.h>
#include "vm_mgr.h"
/*
 * Handle a GH_RM_NOTIFICATION_VM_STATUS notification on behalf of @ghvm.
 *
 * @data is treated as a struct gh_rm_vm_status_payload. A payload for a
 * different vmid is passed over with NOTIFY_OK. For this VM, only a transition
 * to GH_RM_VM_STATUS_RESET is recorded (under status_lock), after which anyone
 * sleeping on vm_status_wait is woken. Returns NOTIFY_DONE for every payload
 * addressed to this VM.
 */
static int gh_vm_rm_notification_status(struct gh_vm *ghvm, void *data)
{
	struct gh_rm_vm_status_payload *status = data;

	if (status->vmid != ghvm->vmid)
		return NOTIFY_OK;

	/* All other state transitions are synchronous to a corresponding RM call */
	if (status->vm_status != GH_RM_VM_STATUS_RESET)
		return NOTIFY_DONE;

	down_write(&ghvm->status_lock);
	ghvm->vm_status = status->vm_status;
	up_write(&ghvm->status_lock);
	wake_up(&ghvm->vm_status_wait);

	return NOTIFY_DONE;
}
static int gh_vm_rm_notification_exited(struct gh_vm *ghvm, void *data)
{
struct gh_rm_vm_exited_payload *payload = data;
if (payload->vmid != ghvm->vmid)
return NOTIFY_OK;
down_write(&ghvm->status_lock);
ghvm->vm_status = GH_RM_VM_STATUS_EXITED;
up_write(&ghvm->status_lock);
return NOTIFY_DONE;
}
/*
 * Notifier callback installed in gh_vm.nb.
 *
 * Recovers the owning gh_vm from @nb and dispatches on @action: VM status and
 * VM exited notifications go to their dedicated handlers, everything else is
 * answered with NOTIFY_OK.
 */
static int gh_vm_rm_notification(struct notifier_block *nb, unsigned long action, void *data)
{
	struct gh_vm *ghvm = container_of(nb, struct gh_vm, nb);

	if (action == GH_RM_NOTIFICATION_VM_STATUS)
		return gh_vm_rm_notification_status(ghvm, data);

	if (action == GH_RM_NOTIFICATION_VM_EXITED)
		return gh_vm_rm_notification_exited(ghvm, data);

	return NOTIFY_OK;
}
/*
 * Stop @ghvm if it is currently running and mark it as exited.
 *
 * The whole sequence runs with status_lock held for writing. A failing
 * gh_rm_vm_stop() is only logged; vm_status is set to GH_RM_VM_STATUS_EXITED
 * regardless of the previous state or of the stop result.
 */
static void gh_vm_stop(struct gh_vm *ghvm)
{
	down_write(&ghvm->status_lock);

	if (ghvm->vm_status == GH_RM_VM_STATUS_RUNNING) {
		int err = gh_rm_vm_stop(ghvm->rm, ghvm->vmid);

		if (err)
			dev_warn(ghvm->parent, "Failed to stop VM: %d\n", err);
	}

	ghvm->vm_status = GH_RM_VM_STATUS_EXITED;
	up_write(&ghvm->status_lock);
}
/*
 * Work handler that tears down a gh_vm; the VM is recovered from its embedded
 * free_work member.
 *
 * NOTE(review): this span appears to interleave the removed and the added
 * lines of the change (the reclaim loop and the vmid deallocation each show up
 * twice, once around and once inside the switch). Confirm against the applied
 * file before relying on the exact statement order shown here.
 */
static void gh_vm_free(struct work_struct *work)
{
struct gh_vm *ghvm = container_of(work, struct gh_vm, free_work);
struct gh_vm_mem *mapping, *tmp;
int ret;
mutex_lock(&ghvm->mm_lock);
list_for_each_entry_safe(mapping, tmp, &ghvm->memory_mappings, list) {
gh_vm_mem_reclaim(ghvm, mapping);
kfree(mapping);
/*
 * Teardown is staged by the current vm_status: each case performs its own
 * step and then falls through to the steps needed by the earlier states.
 */
switch (ghvm->vm_status) {
case GH_RM_VM_STATUS_RUNNING:
gh_vm_stop(ghvm);
fallthrough;
case GH_RM_VM_STATUS_INIT_FAILED:
case GH_RM_VM_STATUS_EXITED:
ret = gh_rm_vm_reset(ghvm->rm, ghvm->vmid);
if (ret)
dev_err(ghvm->parent, "Failed to reset the vm: %d\n", ret);
/*
 * Sleeps until vm_status reads GH_RM_VM_STATUS_RESET; the status notification
 * handler is what stores that value and wakes vm_status_wait.
 * NOTE(review): the wait is entered even when gh_rm_vm_reset() failed --
 * confirm a RESET notification is still guaranteed in that case.
 */
wait_event(ghvm->vm_status_wait, ghvm->vm_status == GH_RM_VM_STATUS_RESET);
fallthrough;
case GH_RM_VM_STATUS_LOAD:
/* Reclaim and free every recorded memory mapping under mm_lock. */
mutex_lock(&ghvm->mm_lock);
list_for_each_entry_safe(mapping, tmp, &ghvm->memory_mappings, list) {
gh_vm_mem_reclaim(ghvm, mapping);
kfree(mapping);
}
mutex_unlock(&ghvm->mm_lock);
fallthrough;
case GH_RM_VM_STATUS_NO_STATE:
/* A failed vmid deallocation is only logged; teardown continues. */
ret = gh_rm_dealloc_vmid(ghvm->rm, ghvm->vmid);
if (ret)
dev_warn(ghvm->parent, "Failed to deallocate vmid: %d\n", ret);
gh_rm_notifier_unregister(ghvm->rm, &ghvm->nb);
gh_rm_put(ghvm->rm);
kfree(ghvm);
break;
default:
/*
 * Unknown state: mappings are not reclaimed and the vmid is not deallocated,
 * but the notifier, the RM reference and the gh_vm itself are still released.
 */
dev_err(ghvm->parent, "VM is unknown state: %d. VM will not be cleaned up.\n",
ghvm->vm_status);
gh_rm_notifier_unregister(ghvm->rm, &ghvm->nb);
gh_rm_put(ghvm->rm);
kfree(ghvm);
break;
}
mutex_unlock(&ghvm->mm_lock);
ret = gh_rm_dealloc_vmid(ghvm->rm, ghvm->vmid);
if (ret)
pr_warn("Failed to deallocate vmid: %d\n", ret);
put_gh_rm(ghvm->rm);
kfree(ghvm);
}
static __must_check struct gh_vm *gh_vm_alloc(struct gh_rm *rm)
{
struct gh_vm *ghvm;
int vmid;
int vmid, ret;
vmid = gh_rm_alloc_vmid(rm, 0);
if (vmid < 0)
@@ -55,13 +142,129 @@ static __must_check struct gh_vm *gh_vm_alloc(struct gh_rm *rm)
ghvm->vmid = vmid;
ghvm->rm = rm;
init_waitqueue_head(&ghvm->vm_status_wait);
ghvm->nb.notifier_call = gh_vm_rm_notification;
ret = gh_rm_notifier_register(rm, &ghvm->nb);
if (ret) {
gh_rm_put(rm);
gh_rm_dealloc_vmid(rm, vmid);
kfree(ghvm);
return ERR_PTR(ret);
}
mutex_init(&ghvm->mm_lock);
INIT_LIST_HEAD(&ghvm->memory_mappings);
init_rwsem(&ghvm->status_lock);
INIT_WORK(&ghvm->free_work, gh_vm_free);
ghvm->vm_status = GH_RM_VM_STATUS_LOAD;
return ghvm;
}
/*
 * Bring @ghvm from GH_RM_VM_STATUS_LOAD to GH_RM_VM_STATUS_RUNNING.
 *
 * With status_lock held for writing, every recorded memory mapping is lent or
 * shared to the VM, the mapping containing the configured DTB range is looked
 * up, and the VM is configured, initialized and started through the resource
 * manager.
 *
 * Returns 0 when the VM was started, or when it was not in the LOAD state to
 * begin with (nothing is done in that case). On any failure a negative errno
 * is returned and vm_status is set to GH_RM_VM_STATUS_INIT_FAILED.
 */
static int gh_vm_start(struct gh_vm *ghvm)
{
	struct gh_vm_mem *mapping;
	u64 dtb_offset;
	u32 mem_handle;
	int ret;

	down_write(&ghvm->status_lock);
	if (ghvm->vm_status != GH_RM_VM_STATUS_LOAD) {
		up_write(&ghvm->status_lock);
		return 0;
	}

	mutex_lock(&ghvm->mm_lock);
	list_for_each_entry(mapping, &ghvm->memory_mappings, list) {
		switch (mapping->share_type) {
		case VM_MEM_LEND:
			ret = gh_rm_mem_lend(ghvm->rm, &mapping->parcel);
			break;
		case VM_MEM_SHARE:
			ret = gh_rm_mem_share(ghvm->rm, &mapping->parcel);
			break;
		default:
			/* Never leave ret uninitialized for an unexpected share type */
			ret = -EINVAL;
			break;
		}
		if (ret) {
			dev_warn(ghvm->parent, "Failed to %s parcel %d: %d\n",
				 mapping->share_type == VM_MEM_LEND ? "lend" : "share",
				 mapping->parcel.label,
				 ret);
			/* The err path only releases status_lock; drop mm_lock here */
			mutex_unlock(&ghvm->mm_lock);
			goto err;
		}
	}
	mutex_unlock(&ghvm->mm_lock);

	mapping = gh_vm_mem_find_by_addr(ghvm, ghvm->dtb_config.guest_phys_addr,
					 ghvm->dtb_config.size);
	if (IS_ERR(mapping)) {
		/*
		 * gh_vm_mem_find_by_addr() returns an ERR_PTR when taking
		 * mm_lock was interrupted; it must not be dereferenced.
		 */
		ret = PTR_ERR(mapping);
		goto err;
	}
	if (!mapping) {
		dev_warn(ghvm->parent, "Failed to find the memory_handle for DTB\n");
		ret = -EINVAL;
		goto err;
	}

	mem_handle = mapping->parcel.mem_handle;
	dtb_offset = ghvm->dtb_config.guest_phys_addr - mapping->guest_phys_addr;

	ret = gh_rm_vm_configure(ghvm->rm, ghvm->vmid, ghvm->auth, mem_handle,
				 0, 0, dtb_offset, ghvm->dtb_config.size);
	if (ret) {
		dev_warn(ghvm->parent, "Failed to configure VM: %d\n", ret);
		goto err;
	}

	ret = gh_rm_vm_init(ghvm->rm, ghvm->vmid);
	ghvm->vm_status = GH_RM_VM_STATUS_RESET;
	if (ret) {
		dev_warn(ghvm->parent, "Failed to initialize VM: %d\n", ret);
		goto err;
	}

	ret = gh_rm_vm_start(ghvm->rm, ghvm->vmid);
	if (ret) {
		dev_warn(ghvm->parent, "Failed to start VM: %d\n", ret);
		goto err;
	}

	ghvm->vm_status = GH_RM_VM_STATUS_RUNNING;
	up_write(&ghvm->status_lock);
	return ret;
err:
	ghvm->vm_status = GH_RM_VM_STATUS_INIT_FAILED;
	/* gh_vm_free will handle releasing resources and reclaiming memory */
	up_write(&ghvm->status_lock);
	return ret;
}
/*
 * Make sure @ghvm is running, starting it first if it is still in the LOAD
 * state.
 *
 * Returns 0 when the VM is in GH_RM_VM_STATUS_RUNNING, -ENODEV when it is in
 * any other state after the start attempt, the error from gh_vm_start() when
 * starting failed, or the error from down_read_interruptible() when taking
 * status_lock was interrupted.
 */
static int gh_vm_ensure_started(struct gh_vm *ghvm)
{
	int ret;

	ret = down_read_interruptible(&ghvm->status_lock);
	if (ret)
		return ret;

	/* Unlikely because VM is typically started */
	if (unlikely(ghvm->vm_status == GH_RM_VM_STATUS_LOAD)) {
		/* gh_vm_start() takes status_lock for writing, so drop it first */
		up_read(&ghvm->status_lock);
		ret = gh_vm_start(ghvm);
		if (ret)
			return ret; /* lock already released above */
		/*
		 * gh_vm_start() is guaranteed to bring status out of
		 * GH_RM_VM_STATUS_LOAD, thus an infinitely recursive call is
		 * not possible
		 */
		return gh_vm_ensure_started(ghvm);
	}

	/* Unlikely because VM is typically running */
	if (unlikely(ghvm->vm_status != GH_RM_VM_STATUS_RUNNING))
		ret = -ENODEV;

	up_read(&ghvm->status_lock);
	return ret;
}
static long gh_vm_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
{
struct gh_vm *ghvm = filp->private_data;
@@ -85,6 +288,25 @@ static long gh_vm_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
r = gh_vm_mem_alloc(ghvm, &region);
break;
}
case GH_VM_SET_DTB_CONFIG: {
struct gh_vm_dtb_config dtb_config;
if (copy_from_user(&dtb_config, argp, sizeof(dtb_config)))
return -EFAULT;
dtb_config.size = PAGE_ALIGN(dtb_config.size);
if (dtb_config.guest_phys_addr + dtb_config.size < dtb_config.guest_phys_addr)
return -EOVERFLOW;
ghvm->dtb_config = dtb_config;
r = 0;
break;
}
case GH_VM_START: {
r = gh_vm_ensure_started(ghvm);
break;
}
default:
r = -ENOTTY;
break;

View File

@@ -10,6 +10,8 @@
#include <linux/list.h>
#include <linux/miscdevice.h>
#include <linux/mutex.h>
#include <linux/rwsem.h>
#include <linux/wait.h>
#include <uapi/linux/gunyah.h>
@@ -34,6 +36,13 @@ struct gh_vm {
u16 vmid;
struct gh_rm *rm;
struct device *parent;
enum gh_rm_vm_auth_mechanism auth;
struct gh_vm_dtb_config dtb_config;
struct notifier_block nb;
enum gh_rm_vm_status vm_status;
wait_queue_head_t vm_status_wait;
struct rw_semaphore status_lock;
struct work_struct free_work;
struct mutex mm_lock;
@@ -44,5 +53,6 @@ int gh_vm_mem_alloc(struct gh_vm *ghvm, struct gh_userspace_memory_region *regio
void gh_vm_mem_reclaim(struct gh_vm *ghvm, struct gh_vm_mem *mapping);
int gh_vm_mem_free(struct gh_vm *ghvm, u32 label);
struct gh_vm_mem *gh_vm_mem_find_by_label(struct gh_vm *ghvm, u32 label);
struct gh_vm_mem *gh_vm_mem_find_by_addr(struct gh_vm *ghvm, u64 guest_phys_addr, u32 size);
#endif

View File

@@ -47,6 +47,29 @@ void gh_vm_mem_reclaim(struct gh_vm *ghvm, struct gh_vm_mem *mapping)
list_del(&mapping->list);
}
/*
 * Find the memory mapping of @ghvm that fully contains the guest physical
 * range [@guest_phys_addr, @guest_phys_addr + @size).
 *
 * The mapping list is walked with mm_lock held. Returns the first mapping
 * that contains the range, NULL when no mapping does, or an ERR_PTR() carrying
 * the error from mutex_lock_interruptible() when the lock could not be taken.
 */
struct gh_vm_mem *gh_vm_mem_find_by_addr(struct gh_vm *ghvm, u64 guest_phys_addr, u32 size)
{
	struct gh_vm_mem *iter, *found = NULL;
	int ret;

	ret = mutex_lock_interruptible(&ghvm->mm_lock);
	if (ret)
		return ERR_PTR(ret);

	list_for_each_entry(iter, &ghvm->memory_mappings, list) {
		/* Range starts below this mapping */
		if (guest_phys_addr < iter->guest_phys_addr)
			continue;
		/* Range ends beyond this mapping */
		if (guest_phys_addr + size > iter->guest_phys_addr +
		    (iter->npages << PAGE_SHIFT))
			continue;

		found = iter;
		break;
	}

	mutex_unlock(&ghvm->mm_lock);
	return found;
}
struct gh_vm_mem *gh_vm_mem_find_by_label(struct gh_vm *ghvm, u32 label)
{
struct gh_vm_mem *mapping;

View File

@@ -29,6 +29,12 @@ struct gh_rm_vm_exited_payload {
#define GH_RM_NOTIFICATION_VM_EXITED 0x56100001
enum gh_rm_vm_status {
/**
* RM doesn't have a state where load partially failed because
* only Linux
*/
GH_RM_VM_STATUS_LOAD_FAILED = -1,
GH_RM_VM_STATUS_NO_STATE = 0,
GH_RM_VM_STATUS_INIT = 1,
GH_RM_VM_STATUS_READY = 2,

View File

@@ -49,4 +49,17 @@ struct gh_userspace_memory_region {
#define GH_VM_SET_USER_MEM_REGION _IOW(GH_IOCTL_TYPE, 0x1, \
struct gh_userspace_memory_region)
/**
 * struct gh_vm_dtb_config - Set the location of the VM's devicetree blob
 * @guest_phys_addr: Address of the VM's devicetree in guest memory.
 * @size: Maximum size of the devicetree. The GH_VM_SET_DTB_CONFIG handler
 *        rounds this up to a page boundary before storing it.
 *
 * Passed as the argument of the GH_VM_SET_DTB_CONFIG ioctl. The handler
 * rejects the configuration with -EOVERFLOW when @guest_phys_addr plus the
 * page-aligned @size wraps around.
 */
struct gh_vm_dtb_config {
__u64 guest_phys_addr;
__u64 size;
};
#define GH_VM_SET_DTB_CONFIG _IOW(GH_IOCTL_TYPE, 0x2, struct gh_vm_dtb_config)
#define GH_VM_START _IO(GH_IOCTL_TYPE, 0x3)
#endif