| /* |
| * vhost-backend |
| * |
| * Copyright (c) 2013 Virtual Open Systems Sarl. |
| * |
| * This work is licensed under the terms of the GNU GPL, version 2 or later. |
| * See the COPYING file in the top-level directory. |
| * |
| */ |
| |
| #include "qemu/osdep.h" |
| #include "hw/virtio/vhost.h" |
| #include "hw/virtio/vhost-backend.h" |
| #include "qemu/error-report.h" |
| #include "qemu/main-loop.h" |
| #include "standard-headers/linux/vhost_types.h" |
| |
| #include "hw/virtio/vhost-vdpa.h" |
| #ifdef CONFIG_VHOST_KERNEL |
| #include <linux/vhost.h> |
| #include <sys/ioctl.h> |
| |
| static int vhost_kernel_call(struct vhost_dev *dev, unsigned long int request, |
| void *arg) |
| { |
| int fd = (uintptr_t) dev->opaque; |
| int ret; |
| |
| assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_KERNEL); |
| |
| ret = ioctl(fd, request, arg); |
| return ret < 0 ? -errno : ret; |
| } |
| |
| static int vhost_kernel_init(struct vhost_dev *dev, void *opaque, Error **errp) |
| { |
| assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_KERNEL); |
| |
| dev->opaque = opaque; |
| |
| return 0; |
| } |
| |
| static int vhost_kernel_cleanup(struct vhost_dev *dev) |
| { |
| int fd = (uintptr_t) dev->opaque; |
| |
| assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_KERNEL); |
| |
| return close(fd) < 0 ? -errno : 0; |
| } |
| |
| static int vhost_kernel_memslots_limit(struct vhost_dev *dev) |
| { |
| int limit = 64; |
| char *s; |
| |
| if (g_file_get_contents("/sys/module/vhost/parameters/max_mem_regions", |
| &s, NULL, NULL)) { |
| uint64_t val = g_ascii_strtoull(s, NULL, 10); |
| if (val < INT_MAX && val > 0) { |
| g_free(s); |
| return val; |
| } |
| error_report("ignoring invalid max_mem_regions value in vhost module:" |
| " %s", s); |
| } |
| g_free(s); |
| return limit; |
| } |
| |
| static int vhost_kernel_net_set_backend(struct vhost_dev *dev, |
| struct vhost_vring_file *file) |
| { |
| return vhost_kernel_call(dev, VHOST_NET_SET_BACKEND, file); |
| } |
| |
| static int vhost_kernel_scsi_set_endpoint(struct vhost_dev *dev, |
| struct vhost_scsi_target *target) |
| { |
| return vhost_kernel_call(dev, VHOST_SCSI_SET_ENDPOINT, target); |
| } |
| |
| static int vhost_kernel_scsi_clear_endpoint(struct vhost_dev *dev, |
| struct vhost_scsi_target *target) |
| { |
| return vhost_kernel_call(dev, VHOST_SCSI_CLEAR_ENDPOINT, target); |
| } |
| |
| static int vhost_kernel_scsi_get_abi_version(struct vhost_dev *dev, int *version) |
| { |
| return vhost_kernel_call(dev, VHOST_SCSI_GET_ABI_VERSION, version); |
| } |
| |
| static int vhost_kernel_set_log_base(struct vhost_dev *dev, uint64_t base, |
| struct vhost_log *log) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_LOG_BASE, &base); |
| } |
| |
| static int vhost_kernel_set_mem_table(struct vhost_dev *dev, |
| struct vhost_memory *mem) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_MEM_TABLE, mem); |
| } |
| |
| static int vhost_kernel_set_vring_addr(struct vhost_dev *dev, |
| struct vhost_vring_addr *addr) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_ADDR, addr); |
| } |
| |
| static int vhost_kernel_set_vring_endian(struct vhost_dev *dev, |
| struct vhost_vring_state *ring) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_ENDIAN, ring); |
| } |
| |
| static int vhost_kernel_set_vring_num(struct vhost_dev *dev, |
| struct vhost_vring_state *ring) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_NUM, ring); |
| } |
| |
| static int vhost_kernel_set_vring_base(struct vhost_dev *dev, |
| struct vhost_vring_state *ring) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_BASE, ring); |
| } |
| |
| static int vhost_kernel_get_vring_base(struct vhost_dev *dev, |
| struct vhost_vring_state *ring) |
| { |
| return vhost_kernel_call(dev, VHOST_GET_VRING_BASE, ring); |
| } |
| |
| static int vhost_kernel_set_vring_kick(struct vhost_dev *dev, |
| struct vhost_vring_file *file) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_KICK, file); |
| } |
| |
| static int vhost_kernel_set_vring_call(struct vhost_dev *dev, |
| struct vhost_vring_file *file) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_CALL, file); |
| } |
| |
| static int vhost_kernel_set_vring_err(struct vhost_dev *dev, |
| struct vhost_vring_file *file) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_ERR, file); |
| } |
| |
| static int vhost_kernel_set_vring_busyloop_timeout(struct vhost_dev *dev, |
| struct vhost_vring_state *s) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_VRING_BUSYLOOP_TIMEOUT, s); |
| } |
| |
| static int vhost_kernel_set_features(struct vhost_dev *dev, |
| uint64_t features) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_FEATURES, &features); |
| } |
| |
| static int vhost_kernel_set_backend_cap(struct vhost_dev *dev) |
| { |
| uint64_t features; |
| uint64_t f = 0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2; |
| int r; |
| |
| if (vhost_kernel_call(dev, VHOST_GET_BACKEND_FEATURES, &features)) { |
| return 0; |
| } |
| |
| features &= f; |
| r = vhost_kernel_call(dev, VHOST_SET_BACKEND_FEATURES, |
| &features); |
| if (r) { |
| return 0; |
| } |
| |
| dev->backend_cap = features; |
| |
| return 0; |
| } |
| |
| static int vhost_kernel_get_features(struct vhost_dev *dev, |
| uint64_t *features) |
| { |
| return vhost_kernel_call(dev, VHOST_GET_FEATURES, features); |
| } |
| |
| static int vhost_kernel_set_owner(struct vhost_dev *dev) |
| { |
| return vhost_kernel_call(dev, VHOST_SET_OWNER, NULL); |
| } |
| |
| static int vhost_kernel_reset_device(struct vhost_dev *dev) |
| { |
| return vhost_kernel_call(dev, VHOST_RESET_OWNER, NULL); |
| } |
| |
| static int vhost_kernel_get_vq_index(struct vhost_dev *dev, int idx) |
| { |
| assert(idx >= dev->vq_index && idx < dev->vq_index + dev->nvqs); |
| |
| return idx - dev->vq_index; |
| } |
| |
| static int vhost_kernel_vsock_set_guest_cid(struct vhost_dev *dev, |
| uint64_t guest_cid) |
| { |
| return vhost_kernel_call(dev, VHOST_VSOCK_SET_GUEST_CID, &guest_cid); |
| } |
| |
| static int vhost_kernel_vsock_set_running(struct vhost_dev *dev, int start) |
| { |
| return vhost_kernel_call(dev, VHOST_VSOCK_SET_RUNNING, &start); |
| } |
| |
| static void vhost_kernel_iotlb_read(void *opaque) |
| { |
| struct vhost_dev *dev = opaque; |
| ssize_t len; |
| |
| if (dev->backend_cap & |
| (0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2)) { |
| struct vhost_msg_v2 msg; |
| |
| while ((len = read((uintptr_t)dev->opaque, &msg, sizeof msg)) > 0) { |
| if (len < sizeof msg) { |
| error_report("Wrong vhost message len: %d", (int)len); |
| break; |
| } |
| if (msg.type != VHOST_IOTLB_MSG_V2) { |
| error_report("Unknown vhost iotlb message type"); |
| break; |
| } |
| |
| vhost_backend_handle_iotlb_msg(dev, &msg.iotlb); |
| } |
| } else { |
| struct vhost_msg msg; |
| |
| while ((len = read((uintptr_t)dev->opaque, &msg, sizeof msg)) > 0) { |
| if (len < sizeof msg) { |
| error_report("Wrong vhost message len: %d", (int)len); |
| break; |
| } |
| if (msg.type != VHOST_IOTLB_MSG) { |
| error_report("Unknown vhost iotlb message type"); |
| break; |
| } |
| |
| vhost_backend_handle_iotlb_msg(dev, &msg.iotlb); |
| } |
| } |
| } |
| |
| static int vhost_kernel_send_device_iotlb_msg(struct vhost_dev *dev, |
| struct vhost_iotlb_msg *imsg) |
| { |
| if (dev->backend_cap & (1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2)) { |
| struct vhost_msg_v2 msg = {}; |
| |
| msg.type = VHOST_IOTLB_MSG_V2; |
| msg.iotlb = *imsg; |
| |
| if (write((uintptr_t)dev->opaque, &msg, sizeof msg) != sizeof msg) { |
| error_report("Fail to update device iotlb"); |
| return -EFAULT; |
| } |
| } else { |
| struct vhost_msg msg = {}; |
| |
| msg.type = VHOST_IOTLB_MSG; |
| msg.iotlb = *imsg; |
| |
| if (write((uintptr_t)dev->opaque, &msg, sizeof msg) != sizeof msg) { |
| error_report("Fail to update device iotlb"); |
| return -EFAULT; |
| } |
| } |
| |
| return 0; |
| } |
| |
| static void vhost_kernel_set_iotlb_callback(struct vhost_dev *dev, |
| int enabled) |
| { |
| if (enabled) |
| qemu_set_fd_handler((uintptr_t)dev->opaque, |
| vhost_kernel_iotlb_read, NULL, dev); |
| else |
| qemu_set_fd_handler((uintptr_t)dev->opaque, NULL, NULL, NULL); |
| } |
| |
| const VhostOps kernel_ops = { |
| .backend_type = VHOST_BACKEND_TYPE_KERNEL, |
| .vhost_backend_init = vhost_kernel_init, |
| .vhost_backend_cleanup = vhost_kernel_cleanup, |
| .vhost_backend_memslots_limit = vhost_kernel_memslots_limit, |
| .vhost_net_set_backend = vhost_kernel_net_set_backend, |
| .vhost_scsi_set_endpoint = vhost_kernel_scsi_set_endpoint, |
| .vhost_scsi_clear_endpoint = vhost_kernel_scsi_clear_endpoint, |
| .vhost_scsi_get_abi_version = vhost_kernel_scsi_get_abi_version, |
| .vhost_set_log_base = vhost_kernel_set_log_base, |
| .vhost_set_mem_table = vhost_kernel_set_mem_table, |
| .vhost_set_vring_addr = vhost_kernel_set_vring_addr, |
| .vhost_set_vring_endian = vhost_kernel_set_vring_endian, |
| .vhost_set_vring_num = vhost_kernel_set_vring_num, |
| .vhost_set_vring_base = vhost_kernel_set_vring_base, |
| .vhost_get_vring_base = vhost_kernel_get_vring_base, |
| .vhost_set_vring_kick = vhost_kernel_set_vring_kick, |
| .vhost_set_vring_call = vhost_kernel_set_vring_call, |
| .vhost_set_vring_err = vhost_kernel_set_vring_err, |
| .vhost_set_vring_busyloop_timeout = |
| vhost_kernel_set_vring_busyloop_timeout, |
| .vhost_set_features = vhost_kernel_set_features, |
| .vhost_get_features = vhost_kernel_get_features, |
| .vhost_set_backend_cap = vhost_kernel_set_backend_cap, |
| .vhost_set_owner = vhost_kernel_set_owner, |
| .vhost_reset_device = vhost_kernel_reset_device, |
| .vhost_get_vq_index = vhost_kernel_get_vq_index, |
| .vhost_vsock_set_guest_cid = vhost_kernel_vsock_set_guest_cid, |
| .vhost_vsock_set_running = vhost_kernel_vsock_set_running, |
| .vhost_set_iotlb_callback = vhost_kernel_set_iotlb_callback, |
| .vhost_send_device_iotlb_msg = vhost_kernel_send_device_iotlb_msg, |
| }; |
| #endif |
| |
| int vhost_backend_update_device_iotlb(struct vhost_dev *dev, |
| uint64_t iova, uint64_t uaddr, |
| uint64_t len, |
| IOMMUAccessFlags perm) |
| { |
| struct vhost_iotlb_msg imsg; |
| |
| imsg.iova = iova; |
| imsg.uaddr = uaddr; |
| imsg.size = len; |
| imsg.type = VHOST_IOTLB_UPDATE; |
| |
| switch (perm) { |
| case IOMMU_RO: |
| imsg.perm = VHOST_ACCESS_RO; |
| break; |
| case IOMMU_WO: |
| imsg.perm = VHOST_ACCESS_WO; |
| break; |
| case IOMMU_RW: |
| imsg.perm = VHOST_ACCESS_RW; |
| break; |
| default: |
| return -EINVAL; |
| } |
| |
| if (dev->vhost_ops && dev->vhost_ops->vhost_send_device_iotlb_msg) |
| return dev->vhost_ops->vhost_send_device_iotlb_msg(dev, &imsg); |
| |
| return -ENODEV; |
| } |
| |
| int vhost_backend_invalidate_device_iotlb(struct vhost_dev *dev, |
| uint64_t iova, uint64_t len) |
| { |
| struct vhost_iotlb_msg imsg; |
| |
| imsg.iova = iova; |
| imsg.size = len; |
| imsg.type = VHOST_IOTLB_INVALIDATE; |
| |
| if (dev->vhost_ops && dev->vhost_ops->vhost_send_device_iotlb_msg) |
| return dev->vhost_ops->vhost_send_device_iotlb_msg(dev, &imsg); |
| |
| return -ENODEV; |
| } |
| |
| int vhost_backend_handle_iotlb_msg(struct vhost_dev *dev, |
| struct vhost_iotlb_msg *imsg) |
| { |
| int ret = 0; |
| |
| if (unlikely(!dev->vdev)) { |
| error_report("Unexpected IOTLB message when virtio device is stopped"); |
| return -EINVAL; |
| } |
| |
| switch (imsg->type) { |
| case VHOST_IOTLB_MISS: |
| ret = vhost_device_iotlb_miss(dev, imsg->iova, |
| imsg->perm != VHOST_ACCESS_RO); |
| break; |
| case VHOST_IOTLB_ACCESS_FAIL: |
| /* FIXME: report device iotlb error */ |
| error_report("Access failure IOTLB message type not supported"); |
| ret = -ENOTSUP; |
| break; |
| case VHOST_IOTLB_UPDATE: |
| case VHOST_IOTLB_INVALIDATE: |
| default: |
| error_report("Unexpected IOTLB message type"); |
| ret = -EINVAL; |
| break; |
| } |
| |
| return ret; |
| } |