diff options
Diffstat (limited to 'virtio_loopback_driver.c')
-rw-r--r-- | virtio_loopback_driver.c | 465 |
1 files changed, 321 insertions, 144 deletions
diff --git a/virtio_loopback_driver.c b/virtio_loopback_driver.c index d822a3e..4284f0a 100644 --- a/virtio_loopback_driver.c +++ b/virtio_loopback_driver.c @@ -1,7 +1,22 @@ // SPDX-License-Identifier: GPL-2.0-or-later /* + * Virtio loopback device driver + * * Copyright 2022-2024 Virtual Open Systems SAS * + * Authors: + * Timos Ampelikiotis <t.ampelikiotis@virtualopensystems.com> + * Anna Panagopoulou <anna@virtualopensystems.com> + * Alvise Rigo <a.rigo@virtualopensystems.com> + * + * This module allows virtio devices to be used in a non-virtualized + * environment, coupled with vhost-user device (user-space drivers). + * + * This module is responsible to assign the virtio-loopback transport driver + * to a group of virtio drivers in order to be able to share notifications and + * the vrings (without copies) with the corresponding vhost-user devices in + * the user-space. + * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or @@ -11,10 +26,6 @@ * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. - * - * You should have received a copy of the GNU General Public License - * along with this program; if not, write to the Free Software Foundation, - * Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */ #define pr_fmt(fmt) "virtio-loopback: " fmt @@ -23,46 +34,43 @@ #include "virtio_loopback_driver.h" /* Features */ -MODULE_LICENSE("GPL v2"); +MODULE_LICENSE("GPL"); /* The global data for the loopback */ -struct loopback_device_data loopback_data; -struct loopback_devices_array loopback_devices; +static struct loopback_device_data loopback_data; +static struct loopback_devices_array loopback_devices; /* - * This functions registers all mmap calls done by the user-space into an array + * This function registers all mmap calls done by the user-space into an array */ -static void add_share_mmap(struct file *filp, uint64_t pfn, uint64_t vm_start, uint64_t size) +static void add_share_mmap(struct file *filp, uint64_t pfn, + uint64_t vm_start, uint64_t size) { - struct file_priv_data *file_data = (struct file_priv_data *)(filp->private_data); + struct file_priv_data *file_data = + (struct file_priv_data *)(filp->private_data); struct mmap_data *mm_data = (struct mmap_data *)file_data->mm_data; - pr_debug("Add new mmaping! index: %d\n", mm_data->mmap_index); - pr_debug("pfn: 0x%llx", pfn); - pr_debug("vm_start: 0x%llx", vm_start); - pr_debug("size: 0x%llx", size); - mm_data->share_mmap_list[mm_data->mmap_index].pfn = pfn; mm_data->share_mmap_list[mm_data->mmap_index].vm_start = vm_start; mm_data->share_mmap_list[mm_data->mmap_index].size = size; - mm_data->share_mmap_list[mm_data->mmap_index].uid = task_pid_nr(current); + mm_data->share_mmap_list[mm_data->mmap_index].uid = + task_pid_nr(current); mm_data->mmap_index++; } /* - * This functions removes a record from mmap array + * This function removes a record from mmap array */ static void share_mmap_rem(struct vm_area_struct *vma) { struct file *file = vma->vm_file; - struct file_priv_data *file_data = (struct file_priv_data *)(file->private_data); + struct file_priv_data *file_data = + (struct file_priv_data *)(file->private_data); struct mmap_data *mm_data = (struct mmap_data *)file_data->mm_data; int i; for (i = 0; i < MMAP_LIMIT; i++) { if (mm_data->share_mmap_list[i].vm_start == vma->vm_start) { - pr_debug("share_mmap with pa: 0x%llx and size: %x is deleted from the list\n", - mm_data->share_mmap_list[i].pfn, mm_data->share_mmap_list[i].size); mm_data->share_mmap_list[i].uid = 0; mm_data->share_mmap_list[i].pfn = 0; mm_data->share_mmap_list[i].vm_start = 0; @@ -73,87 +81,130 @@ static void share_mmap_rem(struct vm_area_struct *vma) static void print_mmap_idx(struct mmap_data *mm_data, int i) { - pr_debug("share_mmap_list[%d].uid %x\n", i, mm_data->share_mmap_list[i].uid); - pr_debug("share_mmap_list[%d].pfn %llx\n", i, mm_data->share_mmap_list[i].pfn); - pr_debug("share_mmap_list[%d].vm_start %llx\n", i, mm_data->share_mmap_list[i].vm_start); - pr_debug("share_mmap_list[%d].size %x\n", i, mm_data->share_mmap_list[i].size); + pr_debug("share_mmap_list[%d].uid %x\n", i, + mm_data->share_mmap_list[i].uid); + pr_debug("share_mmap_list[%d].pfn %llx\n", i, + mm_data->share_mmap_list[i].pfn); + pr_debug("share_mmap_list[%d].vm_start %llx\n", i, + mm_data->share_mmap_list[i].vm_start); + pr_debug("share_mmap_list[%d].size %x\n", i, + mm_data->share_mmap_list[i].size); } +/** + * print_mmaps - Debug function to print details of all active mmap entries + * @mm_data: Pointer to the mmap_data structure containing mmap details + * + * This function iterates through the `share_mmap_list` array in the given + * `mm_data` structure and logs the details of each active mmap entry by + * calling `print_mmap_idx`. The number of entries printed is determined as: + * - `MMAP_LIMIT` if `mmap_index` is `0`. + * - The value of `mmap_index` otherwise. + * + * Note: + * - The function uses `pr_debug` for logging, so enable debugging to see + * the output. + * - Ensure that `mm_data` is properly initialized before calling this + * function to avoid accessing invalid memory. + */ + static void print_mmaps(struct mmap_data *mm_data) { - int i, limit = mm_data->mmap_index == 0 ? MMAP_LIMIT : mm_data->mmap_index; + int i, limit = + mm_data->mmap_index == 0 ? MMAP_LIMIT : mm_data->mmap_index; for (i = 0; i < limit; i++) print_mmap_idx(mm_data, i); } -/* - * This function return the corresponding user-space address of a pfn - * based on the mapping done during the initialization +/** + * share_mmap_exist_vma_return_correct_pfn - Calculate corrected PFN for a + * given address. + * @mm_data: Pointer to struct containing memory mapping data + * @addr: Address for which to calculate the corrected PFN + * + * This function iterates through the list of shared memory mappings in + * `mm_data` and checks if the given `addr` lies within any of the mappings. + * If it does, it computes the corrected PFN based on the mapping's start + * address, size, and PFN. + * + * Returns: + * - The corrected PFN if the address falls within a mapping. + * - 0 if the address does not match any mapping. */ -static uint64_t share_mmap_exist_vma_return_correct_pfn(struct mmap_data *mm_data, uint64_t addr) +static uint64_t share_mmap_exist_vma_return_correct_pfn( + struct mmap_data *mm_data, + uint64_t addr) { int i; uint64_t corrected_pfn; for (i = 0; i < MMAP_LIMIT; i++) { if ((mm_data->share_mmap_list[i].vm_start <= addr) && - (addr < mm_data->share_mmap_list[i].vm_start + mm_data->share_mmap_list[i].size)) { - pr_debug("addr (0x%llx) exist in: 0x%llx - 0x%llx\n", addr, mm_data->share_mmap_list[i].vm_start, - mm_data->share_mmap_list[i].vm_start + mm_data->share_mmap_list[i].size); - pr_debug("((addr - share_mmap_list[i].vm_start) / PAGE_SIZE): 0x%llx\n", - ((addr - mm_data->share_mmap_list[i].vm_start) / PAGE_SIZE)); - pr_debug("share_mmap_list[i].pfn: 0x%llx\n", mm_data->share_mmap_list[i].pfn); - corrected_pfn = ((addr - mm_data->share_mmap_list[i].vm_start) / PAGE_SIZE) + mm_data->share_mmap_list[i].pfn; + (addr < mm_data->share_mmap_list[i].vm_start + + mm_data->share_mmap_list[i].size)) { + corrected_pfn = ((addr - + mm_data->share_mmap_list[i].vm_start) + / PAGE_SIZE) + + mm_data->share_mmap_list[i].pfn; return corrected_pfn; } } return 0; } -static void pf_mmap_close(struct vm_area_struct *vma) -{ - pr_debug("unmap\t-> vma->vm_start: 0x%lx\n", vma->vm_start); - pr_debug("unmap\t-> size: %lu\n", vma->vm_end - vma->vm_start); - share_mmap_rem(vma); -} - +/** + * pf_mmap_fault - Handle page faults for the device mmap area + * @vmf: Pointer to the `vm_fault` structure containing fault information + * + * This function is called during a page fault to find and insert the correct + * page for the faulting address. It calculates the corrected PFN using the + * provided mmap data of the device and updates the faulting page. + * + * Returns: + * - 0 if successful. + * - `VM_FAULT_SIGBUS` on failure. + */ static vm_fault_t pf_mmap_fault(struct vm_fault *vmf) { uint64_t corrected_pfn; pfn_t corr_pfn_struct; struct page *page; - int ret = 0; struct file *file = vmf->vma->vm_file; - struct file_priv_data *file_data = (struct file_priv_data *)(file->private_data); - struct mmap_data *mm_data = (struct mmap_data *)file_data->mm_data; + struct file_priv_data *file_data = + (struct file_priv_data *)(file->private_data); + struct mmap_data *mm_data = + (struct mmap_data *)file_data->mm_data; - pr_debug("----- Page fault: %lld -----\n", mm_data->sum_pgfaults); + /* Count the total number of page_faults for debugging purpose */ mm_data->sum_pgfaults++; /* Find the corrected pfn */ - corrected_pfn = share_mmap_exist_vma_return_correct_pfn(mm_data, vmf->address); + corrected_pfn = share_mmap_exist_vma_return_correct_pfn(mm_data, + vmf->address); corr_pfn_struct.val = corrected_pfn; - /* Some debug prints */ - pr_debug("vma->vm_start: 0x%lx\n", vmf->vma->vm_start); - pr_debug("vma->vm_pgoff: 0x%lx\n", vmf->vma->vm_pgoff); - pr_debug("vmf->address: 0x%lx\n", vmf->address); - pr_debug("corrected_pfn: 0x%llx\n", corrected_pfn); - pr_debug("pfn_valid(corrected_pfn): 0x%x\n", pfn_valid(corrected_pfn)); - - BUG_ON(!pfn_valid(corrected_pfn)); + /* Ensure the PFN is valid */ + if (unlikely(!pfn_valid(corrected_pfn))) { + pr_err("Invalid PFN: %llu\n", corrected_pfn); + return VM_FAULT_SIGBUS; + } /* After finding the page, correct the vmf->page */ page = pfn_to_page(corrected_pfn); - BUG_ON(!virt_addr_valid(page_address(page))); + if (unlikely(!virt_addr_valid(page_address(page)))) { + pr_err("Invalid page address for PFN: %llu\n", corrected_pfn); + return VM_FAULT_SIGBUS; + } /* Insert the correct page */ - ret = vmf_insert_pfn(vmf->vma, vmf->address, corrected_pfn); - pr_debug("vmf_insert_pfn -> ret: %d\n", ret); + return vmf_insert_pfn(vmf->vma, vmf->address, corrected_pfn); +} - return ret; +static void pf_mmap_close(struct vm_area_struct *vma) +{ + share_mmap_rem(vma); } const struct vm_operations_struct pf_mmap_ops = { @@ -161,12 +212,26 @@ const struct vm_operations_struct pf_mmap_ops = { .fault = pf_mmap_fault, }; +/** + * pf_mmap_vm_page - Set up memory mapping for a file + * @filp: Pointer to the file structure for the mapping + * @vma: Pointer to the VM area structure representing the memory mapping + * + * This function sets up a user-space area by associating a physical frame + * number (PFN) with the virtual address range. It updates internal data + * structures to track the mapping and sets appropriate VM flags. + * + * Returns: + * - 0 on success. + * - Negative error code on failure. + */ static int pf_mmap_vm_page(struct file *filp, struct vm_area_struct *vma) { uint64_t size = (unsigned long)(vma->vm_end - vma->vm_start); - struct file_priv_data *file_data = (struct file_priv_data *)(filp->private_data); + struct file_priv_data *file_data = + (struct file_priv_data *)(filp->private_data); struct mmap_data *mm_data = (struct mmap_data *)file_data->mm_data; - uint64_t pfn = ((mm_data->cur_ram_idx++) * 0x40000); + uint64_t pfn = ((mm_data->cur_ram_idx++) * (size >> PAGE_SHIFT)); #if LINUX_VERSION_CODE < KERNEL_VERSION(6, 3, 0) vma->vm_flags |= VM_PFNMAP; @@ -177,15 +242,32 @@ static int pf_mmap_vm_page(struct file *filp, struct vm_area_struct *vma) return 0; } +/** + * mmap_vqs_com_struct - Map virtqueue or communication structure to user space + * @filp: Pointer to the file structure associated with the mapping + * @vma: Pointer to the VM area structure describing the memory region + * + * This function maps either the virtqueue data or the communication structure + * to the user space using `remap_pfn_range`. The choice of what to map depends + * on the `share_communication_struct` flag in the mmap data structure. + * + * Returns: + * - 0 on success. + * - Negative error code on failure. + */ static int mmap_vqs_com_struct(struct file *filp, struct vm_area_struct *vma) { int ret = 0; unsigned long size = (unsigned long)(vma->vm_end - vma->vm_start); - struct file_priv_data *file_data = (struct file_priv_data *)(filp->private_data); - struct device_data *dev_data = (struct device_data *)file_data->dev_data; + struct file_priv_data *file_data = + (struct file_priv_data *)(filp->private_data); + struct device_data *dev_data = + (struct device_data *)file_data->dev_data; struct mmap_data *mmap_data = (struct mmap_data *)file_data->mm_data; - struct mmap_info *com_mmap_virt = (struct mmap_info *)(file_data->dev_data->info)->data; - uint64_t com_mmap_pfn = ((uint64_t)virt_to_phys(com_mmap_virt)) >> PAGE_SHIFT; + struct mmap_info *com_mmap_virt = + (struct mmap_info *)(file_data->dev_data->info)->data; + uint64_t com_mmap_pfn = + ((uint64_t)virt_to_phys(com_mmap_virt)) >> PAGE_SHIFT; uint64_t starting_pfn; if (mmap_data->share_communication_struct) { @@ -201,68 +283,79 @@ static int mmap_vqs_com_struct(struct file *filp, struct vm_area_struct *vma) starting_pfn = dev_data->vq_data.vq_pfn; } - ret = remap_pfn_range(vma, vma->vm_start, starting_pfn, size, vma->vm_page_prot); + ret = remap_pfn_range(vma, vma->vm_start, starting_pfn, size, + vma->vm_page_prot); if (ret != 0) { pr_err("Mmap error\n"); print_mmaps(mmap_data); - goto out; + } else { + add_share_mmap(filp, starting_pfn, vma->vm_start, size); } - add_share_mmap(filp, starting_pfn, vma->vm_start, size); - -out: return ret; } +/** + * op_mmap - Map vring buffers, virtqueue or communication structure + * to user space. + * @filp: Pointer to the file structure associated with the mapping + * @vma: Pointer to the VM area structure describing the memory region + * + * This function checks if the incoming mmap sys_call is related to a) vrings + * or b) virtqueues / communication structure data (depending on + * `share_communication_struct` and `share_vqs` variables. Then calls + * `mmap_vqs_com_struct` and `pf_mmap_vm_page` correspondingly in order + * to apply a different mapping logic. + * + * Returns: + * - 0 on success. + * - Negative error code on failure. + */ static int op_mmap(struct file *filp, struct vm_area_struct *vma) { - struct file_priv_data *file_data = (struct file_priv_data *)(filp->private_data); + struct file_priv_data *file_data = + (struct file_priv_data *)(filp->private_data); struct mmap_data *mmap_data = (struct mmap_data *)file_data->mm_data; int ret = 0; - pr_debug("MMAP SYS_CALL -> vma->vm_pgoff: 0x%lx", vma->vm_pgoff); vma->vm_ops = &pf_mmap_ops; - if (mmap_data->share_communication_struct || mmap_data->share_vqs) { + if (mmap_data->share_communication_struct || mmap_data->share_vqs) ret = mmap_vqs_com_struct(filp, vma); - goto out; - } - - ret = pf_mmap_vm_page(filp, vma); + else + ret = pf_mmap_vm_page(filp, vma); -out: return ret; } -/* Defined for future work */ static ssize_t loopback_write(struct file *file, - const char __user *user_buffer, - size_t size, - loff_t *offset) + const char __user *user_buffer, + size_t size, + loff_t *offset) { ssize_t len = sizeof(int); - pr_debug("loopback write function\n"); if (len <= 0) return 0; return len; } -/* Defined for future work */ static ssize_t loopback_read(struct file *file, - char __user *user_buffer, - size_t size, loff_t *offset) + char __user *user_buffer, + size_t size, loff_t *offset) { - pr_debug("loopback read function\n"); return 0; } +/* + * The lseek sys_call is needed only by the vhost-user device + * located in vhost-device crate. + */ static loff_t loopback_seek(struct file *file, loff_t offset, int whence) { loff_t new_pos; - pr_debug("loopback seek function!\n"); switch (whence) { case SEEK_SET: new_pos = offset; @@ -288,13 +381,14 @@ static int register_virtio_loopback_dev(uint32_t device_id) struct platform_device *pdev; int err = 0; - pr_info("Received request to register a new virtio-loopback-dev\n"); + pr_info("Received request to register a new loopback transport\n"); /* Register a new loopback-transport device */ - pdev = platform_device_register_simple("loopback-transport", device_id, NULL, 0); + pdev = platform_device_register_simple("loopback-transport", + device_id, NULL, 0); if (IS_ERR(pdev)) { err = PTR_ERR(pdev); - pr_err("failed to register loopback-transport device: %d\n", err); + pr_err("Failed to register transport device: %d\n", err); } return err; @@ -304,15 +398,14 @@ static int register_virtio_loopback_dev(uint32_t device_id) int insert_entry_data(struct virtio_loopback_device *vl_dev, int id) { int err = 0; - /* Read and that value atomically */ + /* Read that value atomically */ uint32_t max_used_dev_idx = atomic_read(&loopback_devices.device_num); /* Store the new vl_dev */ - if ((id <= MAX_PDEV) && (max_used_dev_idx < MAX_PDEV)) { + if ((id <= MAX_PDEV) && (max_used_dev_idx < MAX_PDEV)) loopback_devices.devices[id] = vl_dev; - } else { + else err = -ENOMEM; - } /* Mark the request as completed and free registration */ complete(&loopback_devices.reg_vl_dev_completion[id]); @@ -320,7 +413,8 @@ int insert_entry_data(struct virtio_loopback_device *vl_dev, int id) } /* Helper function to mark an entry as active */ -static struct virtio_loopback_device *activate_entry_data(struct device_data *data, uint32_t curr_dev_id) +static struct virtio_loopback_device * +activate_entry_data(struct device_data *data, uint32_t curr_dev_id) { struct virtio_loopback_device *vl_dev = NULL; @@ -334,36 +428,83 @@ static struct virtio_loopback_device *activate_entry_data(struct device_data *da return vl_dev; } -static int start_loopback(struct file_priv_data *file_data, uint32_t curr_dev_id) +static int start_loopback(struct file_priv_data *file_data, + uint32_t curr_dev_id) { struct virtio_loopback_device *vl_dev; - int rc; + int ret; /* Activate the entry */ vl_dev = activate_entry_data(file_data->dev_data, curr_dev_id); if (vl_dev) { file_data->vl_dev_irq = vl_dev; /* Register the activated vl_dev in the system */ - rc = loopback_register_virtio_dev(vl_dev); + ret = loopback_register_virtio_dev(vl_dev); } else { pr_debug("No available entry found!\n"); file_data->vl_dev_irq = NULL; - rc = -EFAULT; + ret = -EFAULT; } - return rc; + return ret; } -static long loopback_ioctl(struct file *file, - unsigned int cmd, unsigned long arg) +/** + * loopback_ioctl - Handle various ioctl commands for loopback device + * @file: Pointer to the file structure associated with the device + * @cmd: The ioctl command code + * @arg: User-space argument associated with the command + * + * This function processes various ioctl commands to configure and control the + * loopback device. The supported commands include: + * + * - `EFD_INIT`: The user-space adapter component shares an eventfd with the + * loopback device. This eventfd is triggered by the device each time a + * read / write operation is requested via the communication data structure. + * + * - `WAKEUP`: Sets a flag in the device's internal structure and wakes up any + * read / write process waiting on the communication wait queue. + * + * - `START_LOOPBACK`: Registers and starts a new loopback device, assigning a + * unique device ID and waiting for its probe function to complete before + * returning to user space. + * + * - `IRQ`: Handles an interrupt request by triggering the device's interrupt + * logic with the provided IRQ number. + * + * - `SHARE_VQS`: Shares a specified virtqueue (selected via a queue index) + * between the user-space application and the loopback device. + * + * - `SHARE_COM_STRUCT`: Notifies the loopback-device that the next mmap call + * will request the communication structure to be as shared between + * user-space and the loopback device. + * + * - `SHARE_VQS_NOTIF`: The user-space uses this command to share the eventfd + * associated with a specific virtqueue. This eventfd will be triggered each + * time the virtio device calls the `notify` function. In this way the + * by-pass the user-space adapter component and delivered directly to the + * vhost-user devices in user-space. + * + * If an unknown `cmd` is provided, the function logs an error and returns + * `-ENOTTY` to indicate an unsupported ioctl command. + * + * Returns: + * - `0` on success. + * - Negative error codes (`-EFAULT`, `-ENOTTY`, or others) on failure. + */ +static long loopback_ioctl(struct file *file, unsigned int cmd, + unsigned long arg) { struct efd_data efd_data; int irq, err; uint32_t queue_sel; - struct file_priv_data *file_data = (struct file_priv_data *)(file->private_data); + struct file_priv_data *file_data = + (struct file_priv_data *)(file->private_data); struct mmap_data *mm_data = (struct mmap_data *)file_data->mm_data; - struct device_data *dev_data = (struct device_data *)file_data->dev_data; + struct device_data *dev_data = + (struct device_data *)file_data->dev_data; uint32_t curr_avail_dev_id; + struct vq_notifier vq_notifier; switch (cmd) { case EFD_INIT: { @@ -378,12 +519,12 @@ static long loopback_ioctl(struct file *file, rcu_read_lock(); #if LINUX_VERSION_CODE < KERNEL_VERSION(5, 11, 220) - efd_file = fcheck_files(userspace_task->files, efd_data.efd[0]); + efd_file = fcheck_files(userspace_task->files, efd_data.efd[0]); #else #if LINUX_VERSION_CODE < KERNEL_VERSION(6, 7, 0) - efd_file = files_lookup_fd_rcu(userspace_task->files, efd_data.efd[0]); + efd_file = files_lookup_fd_rcu(userspace_task->files, efd_data.efd[0]); #else - efd_file = files_lookup_fd_raw(userspace_task->files, efd_data.efd[0]); + efd_file = files_lookup_fd_raw(userspace_task->files, efd_data.efd[0]); #endif #endif rcu_read_unlock(); @@ -395,25 +536,32 @@ static long loopback_ioctl(struct file *file, break; } case WAKEUP: { - atomic_set(&((struct virtio_neg *)(dev_data->info->data))->done, 1); + atomic_set(&((struct virtio_neg *)(dev_data->info->data))->done, + 1); wake_up(&(dev_data)->wq); break; } case START_LOOPBACK: { - if (copy_from_user(&(file_data)->device_info, (struct virtio_device_info_struct *) arg, - sizeof(struct virtio_device_info_struct))) + if (copy_from_user(&(file_data)->device_info, + (struct virtio_device_info_struct *) arg, + sizeof(struct virtio_device_info_struct))) return -EFAULT; /* Read and increase that value atomically */ - curr_avail_dev_id = atomic_add_return(1, &loopback_devices.device_num) - 1; + curr_avail_dev_id = + atomic_add_return(1, &loopback_devices.device_num) - 1; /* Register a new loopback device */ err = register_virtio_loopback_dev(curr_avail_dev_id); if (err) return -EFAULT; - /* Wait for probe function to be called before return control to user-space app */ - wait_for_completion(&loopback_devices.reg_vl_dev_completion[curr_avail_dev_id]); + /* + * Wait for probe function to be called before return control + * to user-space app + */ + wait_for_completion( + &loopback_devices.reg_vl_dev_completion[curr_avail_dev_id]); /* Start the loopback */ err = start_loopback(file_data, curr_avail_dev_id); @@ -425,27 +573,55 @@ static long loopback_ioctl(struct file *file, case IRQ: if (copy_from_user(&irq, (int *) arg, sizeof(int))) return -EFAULT; - pr_debug("\nIRQ\n"); /* * Both of the interrupt ways work but a) is more stable * and b) has better performance: * a) vl_interrupt(NULL); * b) queue_work(interrupt_workqueue, &async_interrupt); */ - /* Call the function */ vl_interrupt(file_data->vl_dev_irq, irq); break; case SHARE_VQS: - if (copy_from_user(&queue_sel, (uint32_t *) arg, sizeof(uint32_t))) + if (copy_from_user(&queue_sel, (uint32_t *) arg, + sizeof(uint32_t))) return -EFAULT; - pr_debug("\n\nSHARE_VQS: %u\n\n", queue_sel); dev_data->vq_data.vq_pfn = dev_data->vq_data.vq_pfns[queue_sel]; - pr_debug("Selected pfn is: 0x%llx", dev_data->vq_data.vq_pfn); mm_data->share_vqs = true; break; case SHARE_COM_STRUCT: mm_data->share_communication_struct = true; break; + case SHARE_VQS_NOTIF: + + struct task_struct *userspace_task; + struct file *efd_file; + + if (copy_from_user(&vq_notifier, (struct vq_notifier *) arg, + sizeof(struct vq_notifier))) + return -EFAULT; + + userspace_task = + pid_task(find_vpid(vq_notifier.pid), PIDTYPE_PID); + + rcu_read_lock(); +#if LINUX_VERSION_CODE < KERNEL_VERSION(5, 11, 220) + efd_file = fcheck_files(userspace_task->files, vq_notifier.notifier_fd); +#else +#if LINUX_VERSION_CODE < KERNEL_VERSION(6, 7, 0) + efd_file = files_lookup_fd_rcu(userspace_task->files, vq_notifier.notifier_fd); +#else + efd_file = files_lookup_fd_raw(userspace_task->files, vq_notifier.notifier_fd); +#endif +#endif + rcu_read_unlock(); + + dev_data->vq_data.vq_notifiers[vq_notifier.vq_index] = + eventfd_ctx_fileget(efd_file); + if (!dev_data->vq_data.vq_notifiers[vq_notifier.vq_index]) + return -1; + /* Mark device notifiers as enabled */ + dev_data->vq_data.vq_notifiers_enabled = true; + break; default: pr_err("Unknown loopback ioctl: %u\n", cmd); return -ENOTTY; @@ -456,13 +632,15 @@ static long loopback_ioctl(struct file *file, static int loopback_open(struct inode *inode, struct file *file) { - uint32_t val_1gb = 1024 * 1024 * 1024; // 1GB + uint32_t val_1gb = 1024 * 1024 * 1024; struct virtio_neg device_neg = {.done = ATOMIC_INIT(0)}; /* Allocate file private data */ - struct file_priv_data *file_data = kmalloc(sizeof(struct file_priv_data), - GFP_KERNEL); - struct device_data *dev_data = kmalloc(sizeof(struct device_data), GFP_KERNEL); - struct mmap_data *mm_data = kmalloc(sizeof(struct mmap_data), GFP_KERNEL); + struct file_priv_data *file_data = + kmalloc(sizeof(struct file_priv_data), GFP_KERNEL); + struct device_data *dev_data = + kmalloc(sizeof(struct device_data), GFP_KERNEL); + struct mmap_data *mm_data = + kmalloc(sizeof(struct mmap_data), GFP_KERNEL); if (!file_data || !dev_data || !mm_data) goto error_kmalloc; @@ -486,6 +664,7 @@ static int loopback_open(struct inode *inode, struct file *file) /* Init vq_data */ dev_data->vq_data.vq_index = 0; dev_data->valid_eventfd = true; + dev_data->vq_data.vq_notifiers_enabled = false; file_data->dev_data = dev_data; /* Init file mmap_data */ @@ -510,11 +689,13 @@ error_kmalloc: static int loopback_release(struct inode *inode, struct file *file) { - struct file_priv_data *file_data = (struct file_priv_data *)(file->private_data); - struct device_data *dev_data = (struct device_data *)file_data->dev_data; + struct file_priv_data *file_data = + (struct file_priv_data *)(file->private_data); + struct device_data *dev_data = + (struct device_data *)file_data->dev_data; struct mmap_data *mm_data = (struct mmap_data *)file_data->mm_data; - pr_info("Release the device\n"); + pr_info("Releasing the device\n"); /* * This makes the read/write do not wait * for the virtio-loopback-adapter if @@ -527,7 +708,7 @@ static int loopback_release(struct inode *inode, struct file *file) /* Cancel any pending work */ cancel_work_sync(&file_data->vl_dev_irq->notify_work); /* Continue with the vl_dev unregister */ - virtio_loopback_remove(file_data->vl_dev_irq->pdev); + virtio_loopback_driver.remove(file_data->vl_dev_irq->pdev); file_data->vl_dev_irq = NULL; } /* Subsequently free the dev_data */ @@ -552,7 +733,7 @@ static const struct file_operations fops = { .read = loopback_read, .write = loopback_write, .open = loopback_open, - .unlocked_ioctl = loopback_ioctl, + .unlocked_ioctl = loopback_ioctl, .mmap = op_mmap, .llseek = loopback_seek, .release = loopback_release @@ -568,9 +749,9 @@ static int __init loopback_init(void) /* Set-up the loopback_data */ loopback_data.dev_major = MAJOR(dev); #if LINUX_VERSION_CODE < KERNEL_VERSION(6, 4, 0) - loopback_data.class = class_create(THIS_MODULE, "loopback"); + loopback_data.class = class_create(THIS_MODULE, "loopback"); #else - loopback_data.class = class_create("loopback"); + loopback_data.class = class_create("loopback"); #endif if (IS_ERR(loopback_data.class)) { pr_err("Failed to create class\n"); @@ -579,10 +760,8 @@ static int __init loopback_init(void) cdev_init(&loopback_data.cdev, &fops); loopback_data.cdev.owner = THIS_MODULE; cdev_add(&loopback_data.cdev, MKDEV(loopback_data.dev_major, 0), 1); - device_create(loopback_data.class, NULL, MKDEV(loopback_data.dev_major, 0), - NULL, "loopback"); - /* Create the workqueues of the loopback driver */ - loopback_data.notify_workqueue = create_singlethread_workqueue("notify_workqueue"); + device_create(loopback_data.class, NULL, + MKDEV(loopback_data.dev_major, 0), NULL, "loopback"); /* Register virtio_loopback_transport */ (void)platform_driver_register(&virtio_loopback_driver); @@ -600,14 +779,16 @@ static int __init loopback_init(void) static void __exit loopback_exit(void) { int i; - uint32_t max_used_device_num = atomic_read(&loopback_devices.device_num); + uint32_t max_used_device_num = + atomic_read(&loopback_devices.device_num); - pr_info("Exit driver!\n"); + pr_info("Exit virtio_loopback driver!\n"); - /* Unregister loopback device */ + /* Unregister loopback devices */ for (i = 0; i < max_used_device_num; i++) if (loopback_devices.devices[i]) - platform_device_unregister(loopback_devices.devices[i]->pdev); + platform_device_unregister( + loopback_devices.devices[i]->pdev); /* Unregister virtio_loopback_transport */ platform_driver_unregister(&virtio_loopback_driver); @@ -619,10 +800,6 @@ static void __exit loopback_exit(void) pr_debug("device_destroy!\n"); class_destroy(loopback_data.class); pr_debug("class_destroy!\n"); - - /* Destroy the notify workqueue */ - flush_workqueue(loopback_data.notify_workqueue); - destroy_workqueue(loopback_data.notify_workqueue); } module_init(loopback_init); |