blob: a85c199c76aa25559acf931621b84dd3dac6184d [file] [log] [blame]
Eric Auger0ea27302015-06-08 09:25:25 -06001/*
2 * vfio based device assignment support - platform devices
3 *
4 * Copyright Linaro Limited, 2014
5 *
6 * Authors:
7 * Kim Phillips <kim.phillips@linaro.org>
8 * Eric Auger <eric.auger@linaro.org>
9 *
10 * This work is licensed under the terms of the GNU GPL, version 2. See
11 * the COPYING file in the top-level directory.
12 *
13 * Based on vfio based PCI device assignment support:
14 * Copyright Red Hat, Inc. 2012
15 */
16
Peter Maydellc6eacb12016-01-26 18:17:14 +000017#include "qemu/osdep.h"
Zhenzhong Duana6c50e12023-11-21 16:44:11 +080018#include CONFIG_DEVICES /* CONFIG_IOMMUFD */
Markus Armbrusterda34e652016-03-14 09:01:28 +010019#include "qapi/error.h"
Eric Auger0ea27302015-06-08 09:25:25 -060020#include <sys/ioctl.h>
Leon Alraee2075272015-06-17 13:35:00 +010021#include <linux/vfio.h>
Eric Auger0ea27302015-06-08 09:25:25 -060022
23#include "hw/vfio/vfio-platform.h"
Zhenzhong Duana6c50e12023-11-21 16:44:11 +080024#include "sysemu/iommufd.h"
Markus Armbrusterd6454272019-08-12 07:23:45 +020025#include "migration/vmstate.h"
Eric Auger0ea27302015-06-08 09:25:25 -060026#include "qemu/error-report.h"
Daniel Brodsky6e8a3552020-04-03 21:21:08 -070027#include "qemu/lockable.h"
Markus Armbrusterdb725812019-08-12 07:23:50 +020028#include "qemu/main-loop.h"
Markus Armbruster0b8fa322019-05-23 16:35:07 +020029#include "qemu/module.h"
Eric Auger0ea27302015-06-08 09:25:25 -060030#include "qemu/range.h"
Eric Auger0ea27302015-06-08 09:25:25 -060031#include "exec/memory.h"
Philippe Mathieu-Daudéd7919372018-05-28 20:26:59 -030032#include "exec/address-spaces.h"
Eric Auger38559972015-06-08 09:25:26 -060033#include "qemu/queue.h"
Eric Auger0ea27302015-06-08 09:25:25 -060034#include "hw/sysbus.h"
35#include "trace.h"
Markus Armbruster64552b62019-08-12 07:23:42 +020036#include "hw/irq.h"
Eric Auger0ea27302015-06-08 09:25:25 -060037#include "hw/platform-bus.h"
Markus Armbrustera27bd6c2019-08-12 07:23:51 +020038#include "hw/qdev-properties.h"
Eric Augerfb5f8162015-07-06 12:15:14 -060039#include "sysemu/kvm.h"
Eric Auger0ea27302015-06-08 09:25:25 -060040
Eric Auger38559972015-06-08 09:25:26 -060041/*
42 * Functions used whatever the injection method
43 */
44
Eric Augera5b39cd2015-10-05 12:30:12 -060045static inline bool vfio_irq_is_automasked(VFIOINTp *intp)
46{
47 return intp->flags & VFIO_IRQ_INFO_AUTOMASKED;
48}
49
Eric Auger38559972015-06-08 09:25:26 -060050/**
51 * vfio_init_intp - allocate, initialize the IRQ struct pointer
52 * and add it into the list of IRQs
53 * @vbasedev: the VFIO device handle
54 * @info: irq info struct retrieved from VFIO driver
Eric Auger5ff74192016-10-17 10:58:00 -060055 * @errp: error object
Eric Auger38559972015-06-08 09:25:26 -060056 */
57static VFIOINTp *vfio_init_intp(VFIODevice *vbasedev,
Eric Auger5ff74192016-10-17 10:58:00 -060058 struct vfio_irq_info info, Error **errp)
Eric Auger38559972015-06-08 09:25:26 -060059{
60 int ret;
61 VFIOPlatformDevice *vdev =
62 container_of(vbasedev, VFIOPlatformDevice, vbasedev);
63 SysBusDevice *sbdev = SYS_BUS_DEVICE(vdev);
64 VFIOINTp *intp;
65
66 intp = g_malloc0(sizeof(*intp));
67 intp->vdev = vdev;
68 intp->pin = info.index;
69 intp->flags = info.flags;
70 intp->state = VFIO_IRQ_INACTIVE;
Eric Augerfb5f8162015-07-06 12:15:14 -060071 intp->kvm_accel = false;
Eric Auger38559972015-06-08 09:25:26 -060072
73 sysbus_init_irq(sbdev, &intp->qemuirq);
74
75 /* Get an eventfd for trigger */
Markus Armbrusterb21e2382022-03-15 15:41:56 +010076 intp->interrupt = g_new0(EventNotifier, 1);
Eric Augera22313d2015-10-05 12:30:12 -060077 ret = event_notifier_init(intp->interrupt, 0);
Eric Auger38559972015-06-08 09:25:26 -060078 if (ret) {
Eric Augera22313d2015-10-05 12:30:12 -060079 g_free(intp->interrupt);
Eric Auger38559972015-06-08 09:25:26 -060080 g_free(intp);
Eric Auger5ff74192016-10-17 10:58:00 -060081 error_setg_errno(errp, -ret,
Li Qiangbf04ef32019-05-21 08:15:42 -070082 "failed to initialize trigger eventfd notifier");
Eric Auger38559972015-06-08 09:25:26 -060083 return NULL;
84 }
Eric Augera5b39cd2015-10-05 12:30:12 -060085 if (vfio_irq_is_automasked(intp)) {
86 /* Get an eventfd for resample/unmask */
Markus Armbrusterb21e2382022-03-15 15:41:56 +010087 intp->unmask = g_new0(EventNotifier, 1);
Eric Augera5b39cd2015-10-05 12:30:12 -060088 ret = event_notifier_init(intp->unmask, 0);
89 if (ret) {
90 g_free(intp->interrupt);
91 g_free(intp->unmask);
92 g_free(intp);
Eric Auger5ff74192016-10-17 10:58:00 -060093 error_setg_errno(errp, -ret,
Li Qiangbf04ef32019-05-21 08:15:42 -070094 "failed to initialize resample eventfd notifier");
Eric Augera5b39cd2015-10-05 12:30:12 -060095 return NULL;
96 }
Eric Augerfb5f8162015-07-06 12:15:14 -060097 }
Eric Auger38559972015-06-08 09:25:26 -060098
99 QLIST_INSERT_HEAD(&vdev->intp_list, intp, next);
100 return intp;
101}
102
103/**
104 * vfio_set_trigger_eventfd - set VFIO eventfd handling
105 *
106 * @intp: IRQ struct handle
107 * @handler: handler to be called on eventfd signaling
108 *
109 * Setup VFIO signaling and attach an optional user-side handler
110 * to the eventfd
111 */
112static int vfio_set_trigger_eventfd(VFIOINTp *intp,
113 eventfd_user_side_handler_t handler)
114{
115 VFIODevice *vbasedev = &intp->vdev->vbasedev;
Eric Auger201a7332019-06-13 09:57:37 -0600116 int32_t fd = event_notifier_get_fd(intp->interrupt);
117 Error *err = NULL;
Eric Auger38559972015-06-08 09:25:26 -0600118
Eric Auger201a7332019-06-13 09:57:37 -0600119 qemu_set_fd_handler(fd, (IOHandler *)handler, NULL, intp);
120
Zhenzhong Duan84e37d02024-05-22 12:39:59 +0800121 if (!vfio_set_irq_signaling(vbasedev, intp->pin, 0,
122 VFIO_IRQ_SET_ACTION_TRIGGER, fd, &err)) {
Eric Auger201a7332019-06-13 09:57:37 -0600123 error_reportf_err(err, VFIO_MSG_PREFIX, vbasedev->name);
124 qemu_set_fd_handler(fd, NULL, NULL, NULL);
Zhenzhong Duan84e37d02024-05-22 12:39:59 +0800125 return -EINVAL;
Eric Auger38559972015-06-08 09:25:26 -0600126 }
Eric Auger201a7332019-06-13 09:57:37 -0600127
Zhenzhong Duan84e37d02024-05-22 12:39:59 +0800128 return 0;
Eric Auger38559972015-06-08 09:25:26 -0600129}
130
131/*
132 * Functions only used when eventfds are handled on user-side
133 * ie. without irqfd
134 */
135
136/**
137 * vfio_mmap_set_enabled - enable/disable the fast path mode
138 * @vdev: the VFIO platform device
139 * @enabled: the target mmap state
140 *
141 * enabled = true ~ fast path = MMIO region is mmaped (no KVM TRAP);
142 * enabled = false ~ slow path = MMIO region is trapped and region callbacks
143 * are called; slow path enables to trap the device IRQ status register reset
144*/
145
146static void vfio_mmap_set_enabled(VFIOPlatformDevice *vdev, bool enabled)
147{
148 int i;
149
Eric Auger38559972015-06-08 09:25:26 -0600150 for (i = 0; i < vdev->vbasedev.num_regions; i++) {
Alex Williamsondb0da022016-03-10 09:39:07 -0700151 vfio_region_mmaps_set_enabled(vdev->regions[i], enabled);
Eric Auger38559972015-06-08 09:25:26 -0600152 }
153}
154
155/**
156 * vfio_intp_mmap_enable - timer function, restores the fast path
157 * if there is no more active IRQ
158 * @opaque: actually points to the VFIO platform device
159 *
Cai Huoqing631ba5a2021-07-30 09:26:13 +0800160 * Called on mmap timer timeout, this function checks whether the
Eric Auger38559972015-06-08 09:25:26 -0600161 * IRQ is still active and if not, restores the fast path.
162 * by construction a single eventfd is handled at a time.
163 * if the IRQ is still active, the timer is re-programmed.
164 */
165static void vfio_intp_mmap_enable(void *opaque)
166{
167 VFIOINTp *tmp;
168 VFIOPlatformDevice *vdev = (VFIOPlatformDevice *)opaque;
169
Amey Narkhede88eef592020-10-23 18:13:42 +0530170 QEMU_LOCK_GUARD(&vdev->intp_mutex);
Eric Auger38559972015-06-08 09:25:26 -0600171 QLIST_FOREACH(tmp, &vdev->intp_list, next) {
172 if (tmp->state == VFIO_IRQ_ACTIVE) {
173 trace_vfio_platform_intp_mmap_enable(tmp->pin);
174 /* re-program the timer to check active status later */
175 timer_mod(vdev->mmap_timer,
176 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL) +
177 vdev->mmap_timeout);
Eric Auger38559972015-06-08 09:25:26 -0600178 return;
179 }
180 }
181 vfio_mmap_set_enabled(vdev, true);
Eric Auger38559972015-06-08 09:25:26 -0600182}
183
184/**
185 * vfio_intp_inject_pending_lockheld - Injects a pending IRQ
186 * @opaque: opaque pointer, in practice the VFIOINTp handle
187 *
188 * The function is called on a previous IRQ completion, from
189 * vfio_platform_eoi, while the intp_mutex is locked.
190 * Also in such situation, the slow path already is set and
191 * the mmap timer was already programmed.
192 */
193static void vfio_intp_inject_pending_lockheld(VFIOINTp *intp)
194{
195 trace_vfio_platform_intp_inject_pending_lockheld(intp->pin,
Eric Augera22313d2015-10-05 12:30:12 -0600196 event_notifier_get_fd(intp->interrupt));
Eric Auger38559972015-06-08 09:25:26 -0600197
198 intp->state = VFIO_IRQ_ACTIVE;
199
200 /* trigger the virtual IRQ */
201 qemu_set_irq(intp->qemuirq, 1);
202}
203
204/**
205 * vfio_intp_interrupt - The user-side eventfd handler
206 * @opaque: opaque pointer which in practice is the VFIOINTp handle
207 *
208 * the function is entered in event handler context:
209 * the vIRQ is injected into the guest if there is no other active
210 * or pending IRQ.
211 */
212static void vfio_intp_interrupt(VFIOINTp *intp)
213{
214 int ret;
215 VFIOINTp *tmp;
216 VFIOPlatformDevice *vdev = intp->vdev;
217 bool delay_handling = false;
218
Daniel Brodsky6e8a3552020-04-03 21:21:08 -0700219 QEMU_LOCK_GUARD(&vdev->intp_mutex);
Eric Auger38559972015-06-08 09:25:26 -0600220 if (intp->state == VFIO_IRQ_INACTIVE) {
221 QLIST_FOREACH(tmp, &vdev->intp_list, next) {
222 if (tmp->state == VFIO_IRQ_ACTIVE ||
223 tmp->state == VFIO_IRQ_PENDING) {
224 delay_handling = true;
225 break;
226 }
227 }
228 }
229 if (delay_handling) {
230 /*
231 * the new IRQ gets a pending status and is pushed in
232 * the pending queue
233 */
234 intp->state = VFIO_IRQ_PENDING;
235 trace_vfio_intp_interrupt_set_pending(intp->pin);
236 QSIMPLEQ_INSERT_TAIL(&vdev->pending_intp_queue,
237 intp, pqnext);
Chen Qun9b83b002020-08-27 19:03:08 +0800238 event_notifier_test_and_clear(intp->interrupt);
Eric Auger38559972015-06-08 09:25:26 -0600239 return;
240 }
241
242 trace_vfio_platform_intp_interrupt(intp->pin,
Eric Augera22313d2015-10-05 12:30:12 -0600243 event_notifier_get_fd(intp->interrupt));
Eric Auger38559972015-06-08 09:25:26 -0600244
Eric Augera22313d2015-10-05 12:30:12 -0600245 ret = event_notifier_test_and_clear(intp->interrupt);
Eric Auger38559972015-06-08 09:25:26 -0600246 if (!ret) {
John Snow594fd212015-06-29 16:56:26 -0400247 error_report("Error when clearing fd=%d (ret = %d)",
Eric Augera22313d2015-10-05 12:30:12 -0600248 event_notifier_get_fd(intp->interrupt), ret);
Eric Auger38559972015-06-08 09:25:26 -0600249 }
250
251 intp->state = VFIO_IRQ_ACTIVE;
252
253 /* sets slow path */
254 vfio_mmap_set_enabled(vdev, false);
255
256 /* trigger the virtual IRQ */
257 qemu_set_irq(intp->qemuirq, 1);
258
259 /*
260 * Schedule the mmap timer which will restore fastpath when no IRQ
261 * is active anymore
262 */
263 if (vdev->mmap_timeout) {
264 timer_mod(vdev->mmap_timer,
265 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL) +
266 vdev->mmap_timeout);
267 }
Eric Auger38559972015-06-08 09:25:26 -0600268}
269
270/**
271 * vfio_platform_eoi - IRQ completion routine
272 * @vbasedev: the VFIO device handle
273 *
274 * De-asserts the active virtual IRQ and unmasks the physical IRQ
275 * (effective for level sensitive IRQ auto-masked by the VFIO driver).
276 * Then it handles next pending IRQ if any.
277 * eoi function is called on the first access to any MMIO region
278 * after an IRQ was triggered, trapped since slow path was set.
279 * It is assumed this access corresponds to the IRQ status
280 * register reset. With such a mechanism, a single IRQ can be
281 * handled at a time since there is no way to know which IRQ
282 * was completed by the guest (we would need additional details
283 * about the IRQ status register mask).
284 */
285static void vfio_platform_eoi(VFIODevice *vbasedev)
286{
287 VFIOINTp *intp;
288 VFIOPlatformDevice *vdev =
289 container_of(vbasedev, VFIOPlatformDevice, vbasedev);
290
Amey Narkhede88eef592020-10-23 18:13:42 +0530291 QEMU_LOCK_GUARD(&vdev->intp_mutex);
Eric Auger38559972015-06-08 09:25:26 -0600292 QLIST_FOREACH(intp, &vdev->intp_list, next) {
293 if (intp->state == VFIO_IRQ_ACTIVE) {
294 trace_vfio_platform_eoi(intp->pin,
Eric Augera22313d2015-10-05 12:30:12 -0600295 event_notifier_get_fd(intp->interrupt));
Eric Auger38559972015-06-08 09:25:26 -0600296 intp->state = VFIO_IRQ_INACTIVE;
297
298 /* deassert the virtual IRQ */
299 qemu_set_irq(intp->qemuirq, 0);
300
Eric Augera5b39cd2015-10-05 12:30:12 -0600301 if (vfio_irq_is_automasked(intp)) {
Eric Auger38559972015-06-08 09:25:26 -0600302 /* unmasks the physical level-sensitive IRQ */
303 vfio_unmask_single_irqindex(vbasedev, intp->pin);
304 }
305
306 /* a single IRQ can be active at a time */
307 break;
308 }
309 }
310 /* in case there are pending IRQs, handle the first one */
311 if (!QSIMPLEQ_EMPTY(&vdev->pending_intp_queue)) {
312 intp = QSIMPLEQ_FIRST(&vdev->pending_intp_queue);
313 vfio_intp_inject_pending_lockheld(intp);
314 QSIMPLEQ_REMOVE_HEAD(&vdev->pending_intp_queue, pqnext);
315 }
Eric Auger38559972015-06-08 09:25:26 -0600316}
317
318/**
319 * vfio_start_eventfd_injection - starts the virtual IRQ injection using
320 * user-side handled eventfds
Eric Auger58892b42015-10-05 12:30:12 -0600321 * @sbdev: the sysbus device handle
322 * @irq: the qemu irq handle
Eric Auger38559972015-06-08 09:25:26 -0600323 */
324
Eric Auger58892b42015-10-05 12:30:12 -0600325static void vfio_start_eventfd_injection(SysBusDevice *sbdev, qemu_irq irq)
Eric Auger38559972015-06-08 09:25:26 -0600326{
Eric Auger58892b42015-10-05 12:30:12 -0600327 VFIOPlatformDevice *vdev = VFIO_PLATFORM_DEVICE(sbdev);
328 VFIOINTp *intp;
329
330 QLIST_FOREACH(intp, &vdev->intp_list, next) {
331 if (intp->qemuirq == irq) {
332 break;
333 }
334 }
335 assert(intp);
Eric Auger38559972015-06-08 09:25:26 -0600336
Eric Auger201a7332019-06-13 09:57:37 -0600337 if (vfio_set_trigger_eventfd(intp, vfio_intp_interrupt)) {
Eric Auger58892b42015-10-05 12:30:12 -0600338 abort();
Eric Auger38559972015-06-08 09:25:26 -0600339 }
Eric Auger38559972015-06-08 09:25:26 -0600340}
341
Eric Augerfb5f8162015-07-06 12:15:14 -0600342/*
343 * Functions used for irqfd
344 */
345
346/**
347 * vfio_set_resample_eventfd - sets the resamplefd for an IRQ
348 * @intp: the IRQ struct handle
349 * programs the VFIO driver to unmask this IRQ when the
350 * intp->unmask eventfd is triggered
351 */
352static int vfio_set_resample_eventfd(VFIOINTp *intp)
353{
Eric Auger201a7332019-06-13 09:57:37 -0600354 int32_t fd = event_notifier_get_fd(intp->unmask);
Eric Augerfb5f8162015-07-06 12:15:14 -0600355 VFIODevice *vbasedev = &intp->vdev->vbasedev;
Eric Auger201a7332019-06-13 09:57:37 -0600356 Error *err = NULL;
Eric Augerfb5f8162015-07-06 12:15:14 -0600357
Eric Auger201a7332019-06-13 09:57:37 -0600358 qemu_set_fd_handler(fd, NULL, NULL, NULL);
Zhenzhong Duan84e37d02024-05-22 12:39:59 +0800359 if (!vfio_set_irq_signaling(vbasedev, intp->pin, 0,
360 VFIO_IRQ_SET_ACTION_UNMASK, fd, &err)) {
Eric Auger201a7332019-06-13 09:57:37 -0600361 error_reportf_err(err, VFIO_MSG_PREFIX, vbasedev->name);
Zhenzhong Duan84e37d02024-05-22 12:39:59 +0800362 return -EINVAL;
Eric Augerfb5f8162015-07-06 12:15:14 -0600363 }
Zhenzhong Duan84e37d02024-05-22 12:39:59 +0800364 return 0;
Eric Augerfb5f8162015-07-06 12:15:14 -0600365}
366
Eric Auger58892b42015-10-05 12:30:12 -0600367/**
368 * vfio_start_irqfd_injection - starts the virtual IRQ injection using
369 * irqfd
370 *
371 * @sbdev: the sysbus device handle
372 * @irq: the qemu irq handle
373 *
374 * In case the irqfd setup fails, we fallback to userspace handled eventfd
375 */
Eric Augerfb5f8162015-07-06 12:15:14 -0600376static void vfio_start_irqfd_injection(SysBusDevice *sbdev, qemu_irq irq)
377{
378 VFIOPlatformDevice *vdev = VFIO_PLATFORM_DEVICE(sbdev);
379 VFIOINTp *intp;
380
381 if (!kvm_irqfds_enabled() || !kvm_resamplefds_enabled() ||
382 !vdev->irqfd_allowed) {
Eric Auger58892b42015-10-05 12:30:12 -0600383 goto fail_irqfd;
Eric Augerfb5f8162015-07-06 12:15:14 -0600384 }
385
386 QLIST_FOREACH(intp, &vdev->intp_list, next) {
387 if (intp->qemuirq == irq) {
388 break;
389 }
390 }
391 assert(intp);
392
Eric Augera22313d2015-10-05 12:30:12 -0600393 if (kvm_irqchip_add_irqfd_notifier(kvm_state, intp->interrupt,
394 intp->unmask, irq) < 0) {
Eric Augerfb5f8162015-07-06 12:15:14 -0600395 goto fail_irqfd;
396 }
397
398 if (vfio_set_trigger_eventfd(intp, NULL) < 0) {
399 goto fail_vfio;
400 }
Eric Augera5b39cd2015-10-05 12:30:12 -0600401 if (vfio_irq_is_automasked(intp)) {
402 if (vfio_set_resample_eventfd(intp) < 0) {
403 goto fail_vfio;
404 }
405 trace_vfio_platform_start_level_irqfd_injection(intp->pin,
406 event_notifier_get_fd(intp->interrupt),
407 event_notifier_get_fd(intp->unmask));
408 } else {
409 trace_vfio_platform_start_edge_irqfd_injection(intp->pin,
410 event_notifier_get_fd(intp->interrupt));
Eric Augerfb5f8162015-07-06 12:15:14 -0600411 }
412
Eric Augerfb5f8162015-07-06 12:15:14 -0600413 intp->kvm_accel = true;
414
Eric Augerfb5f8162015-07-06 12:15:14 -0600415 return;
416fail_vfio:
Eric Augera22313d2015-10-05 12:30:12 -0600417 kvm_irqchip_remove_irqfd_notifier(kvm_state, intp->interrupt, irq);
Eric Auger58892b42015-10-05 12:30:12 -0600418 abort();
Eric Augerfb5f8162015-07-06 12:15:14 -0600419fail_irqfd:
Eric Auger58892b42015-10-05 12:30:12 -0600420 vfio_start_eventfd_injection(sbdev, irq);
Eric Augerfb5f8162015-07-06 12:15:14 -0600421 return;
422}
423
Eric Auger0ea27302015-06-08 09:25:25 -0600424/* VFIO skeleton */
425
426static void vfio_platform_compute_needs_reset(VFIODevice *vbasedev)
427{
428 vbasedev->needs_reset = true;
429}
430
431/* not implemented yet */
432static int vfio_platform_hot_reset_multi(VFIODevice *vbasedev)
433{
434 return -1;
435}
436
437/**
438 * vfio_populate_device - Allocate and populate MMIO region
Eric Auger38559972015-06-08 09:25:26 -0600439 * and IRQ structs according to driver returned information
Eric Auger0ea27302015-06-08 09:25:25 -0600440 * @vbasedev: the VFIO device handle
Eric Auger5ff74192016-10-17 10:58:00 -0600441 * @errp: error object
Eric Auger0ea27302015-06-08 09:25:25 -0600442 *
443 */
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800444static bool vfio_populate_device(VFIODevice *vbasedev, Error **errp)
Eric Auger0ea27302015-06-08 09:25:25 -0600445{
Eric Auger38559972015-06-08 09:25:26 -0600446 VFIOINTp *intp, *tmp;
Eric Auger0ea27302015-06-08 09:25:25 -0600447 int i, ret = -1;
448 VFIOPlatformDevice *vdev =
449 container_of(vbasedev, VFIOPlatformDevice, vbasedev);
450
451 if (!(vbasedev->flags & VFIO_DEVICE_FLAGS_PLATFORM)) {
Eric Auger5ff74192016-10-17 10:58:00 -0600452 error_setg(errp, "this isn't a platform device");
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800453 return false;
Eric Auger0ea27302015-06-08 09:25:25 -0600454 }
455
Eric Auger0b707432015-06-11 09:44:40 +0100456 vdev->regions = g_new0(VFIORegion *, vbasedev->num_regions);
Eric Auger0ea27302015-06-08 09:25:25 -0600457
458 for (i = 0; i < vbasedev->num_regions; i++) {
Alex Williamsondb0da022016-03-10 09:39:07 -0700459 char *name = g_strdup_printf("VFIO %s region %d\n", vbasedev->name, i);
Eric Auger0ea27302015-06-08 09:25:25 -0600460
Markus Armbrusterbdd81ad2015-11-10 12:11:08 -0700461 vdev->regions[i] = g_new0(VFIORegion, 1);
Alex Williamsondb0da022016-03-10 09:39:07 -0700462 ret = vfio_region_setup(OBJECT(vdev), vbasedev,
463 vdev->regions[i], i, name);
464 g_free(name);
Eric Auger0ea27302015-06-08 09:25:25 -0600465 if (ret) {
Eric Auger5ff74192016-10-17 10:58:00 -0600466 error_setg_errno(errp, -ret, "failed to get region %d info", i);
Eric Auger0ea27302015-06-08 09:25:25 -0600467 goto reg_error;
468 }
Eric Auger0ea27302015-06-08 09:25:25 -0600469 }
470
Eric Auger38559972015-06-08 09:25:26 -0600471 vdev->mmap_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL,
472 vfio_intp_mmap_enable, vdev);
473
474 QSIMPLEQ_INIT(&vdev->pending_intp_queue);
475
476 for (i = 0; i < vbasedev->num_irqs; i++) {
477 struct vfio_irq_info irq = { .argsz = sizeof(irq) };
478
479 irq.index = i;
480 ret = ioctl(vbasedev->fd, VFIO_DEVICE_GET_IRQ_INFO, &irq);
481 if (ret) {
Eric Auger5ff74192016-10-17 10:58:00 -0600482 error_setg_errno(errp, -ret, "failed to get device irq info");
Eric Auger38559972015-06-08 09:25:26 -0600483 goto irq_err;
484 } else {
485 trace_vfio_platform_populate_interrupts(irq.index,
486 irq.count,
487 irq.flags);
Eric Auger5ff74192016-10-17 10:58:00 -0600488 intp = vfio_init_intp(vbasedev, irq, errp);
Eric Auger38559972015-06-08 09:25:26 -0600489 if (!intp) {
Eric Auger38559972015-06-08 09:25:26 -0600490 goto irq_err;
491 }
492 }
493 }
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800494 return true;
Eric Auger38559972015-06-08 09:25:26 -0600495irq_err:
496 timer_del(vdev->mmap_timer);
497 QLIST_FOREACH_SAFE(intp, &vdev->intp_list, next, tmp) {
498 QLIST_REMOVE(intp, next);
499 g_free(intp);
500 }
Eric Auger0ea27302015-06-08 09:25:25 -0600501reg_error:
502 for (i = 0; i < vbasedev->num_regions; i++) {
Alex Williamsondb0da022016-03-10 09:39:07 -0700503 if (vdev->regions[i]) {
504 vfio_region_finalize(vdev->regions[i]);
505 }
Eric Auger0ea27302015-06-08 09:25:25 -0600506 g_free(vdev->regions[i]);
507 }
508 g_free(vdev->regions);
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800509 return false;
Eric Auger0ea27302015-06-08 09:25:25 -0600510}
511
512/* specialized functions for VFIO Platform devices */
513static VFIODeviceOps vfio_platform_ops = {
514 .vfio_compute_needs_reset = vfio_platform_compute_needs_reset,
515 .vfio_hot_reset_multi = vfio_platform_hot_reset_multi,
Eric Auger38559972015-06-08 09:25:26 -0600516 .vfio_eoi = vfio_platform_eoi,
Eric Auger0ea27302015-06-08 09:25:25 -0600517};
518
519/**
520 * vfio_base_device_init - perform preliminary VFIO setup
521 * @vbasedev: the VFIO device handle
Eric Auger9bdbfbd2016-10-17 10:58:01 -0600522 * @errp: error object
Eric Auger0ea27302015-06-08 09:25:25 -0600523 *
524 * Implement the VFIO command sequence that allows to discover
525 * assigned device resources: group extraction, device
526 * fd retrieval, resource query.
527 * Precondition: the device name must be initialized
528 */
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800529static bool vfio_base_device_init(VFIODevice *vbasedev, Error **errp)
Eric Auger0ea27302015-06-08 09:25:25 -0600530{
Zhenzhong Duan3016e602023-11-21 16:44:12 +0800531 /* @fd takes precedence over @sysfsdev which takes precedence over @host */
532 if (vbasedev->fd < 0 && vbasedev->sysfsdev) {
Alex Williamson7df93812016-03-10 09:39:07 -0700533 g_free(vbasedev->name);
Julia Suvorova3e015d82018-03-01 10:08:06 +0300534 vbasedev->name = g_path_get_basename(vbasedev->sysfsdev);
Zhenzhong Duan3016e602023-11-21 16:44:12 +0800535 } else if (vbasedev->fd < 0) {
Alex Williamson7df93812016-03-10 09:39:07 -0700536 if (!vbasedev->name || strchr(vbasedev->name, '/')) {
Eric Auger9bdbfbd2016-10-17 10:58:01 -0600537 error_setg(errp, "wrong host device name");
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800538 return false;
Alex Williamson7df93812016-03-10 09:39:07 -0700539 }
540
541 vbasedev->sysfsdev = g_strdup_printf("/sys/bus/platform/devices/%s",
542 vbasedev->name);
Eric Auger0ea27302015-06-08 09:25:25 -0600543 }
544
Zhenzhong Duanc6c6cf92024-05-22 12:40:00 +0800545 if (!vfio_device_get_name(vbasedev, errp)) {
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800546 return false;
Eric Auger0ea27302015-06-08 09:25:25 -0600547 }
548
Zhenzhong Duanb7754832024-05-07 14:42:44 +0800549 if (!vfio_attach_device(vbasedev->name, vbasedev,
550 &address_space_memory, errp)) {
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800551 return false;
Eric Auger0ea27302015-06-08 09:25:25 -0600552 }
553
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800554 if (vfio_populate_device(vbasedev, errp)) {
555 return true;
Eric Auger0ea27302015-06-08 09:25:25 -0600556 }
557
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800558 vfio_detach_device(vbasedev);
559 return false;
Eric Auger0ea27302015-06-08 09:25:25 -0600560}
561
562/**
Eric Auger0ea27302015-06-08 09:25:25 -0600563 * vfio_platform_realize - the device realize function
564 * @dev: device state pointer
565 * @errp: error
566 *
567 * initialize the device, its memory regions and IRQ structures
568 * IRQ are started separately
569 */
570static void vfio_platform_realize(DeviceState *dev, Error **errp)
571{
Zhao Liu498696e2024-03-11 11:38:17 +0800572 ERRP_GUARD();
Eric Auger0ea27302015-06-08 09:25:25 -0600573 VFIOPlatformDevice *vdev = VFIO_PLATFORM_DEVICE(dev);
574 SysBusDevice *sbdev = SYS_BUS_DEVICE(dev);
575 VFIODevice *vbasedev = &vdev->vbasedev;
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800576 int i;
Eric Auger0ea27302015-06-08 09:25:25 -0600577
Eric Auger89202c62018-02-06 11:08:26 -0700578 qemu_mutex_init(&vdev->intp_mutex);
579
Alex Williamson7df93812016-03-10 09:39:07 -0700580 trace_vfio_platform_realize(vbasedev->sysfsdev ?
581 vbasedev->sysfsdev : vbasedev->name,
582 vdev->compat);
Eric Auger0ea27302015-06-08 09:25:25 -0600583
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800584 if (!vfio_base_device_init(vbasedev, errp)) {
585 goto init_err;
Eric Auger0ea27302015-06-08 09:25:25 -0600586 }
587
Eric Augera49531e2018-10-15 10:52:09 -0600588 if (!vdev->compat) {
589 GError *gerr = NULL;
590 gchar *contents;
591 gsize length;
592 char *path;
593
594 path = g_strdup_printf("%s/of_node/compatible", vbasedev->sysfsdev);
595 if (!g_file_get_contents(path, &contents, &length, &gerr)) {
596 error_setg(errp, "%s", gerr->message);
597 g_error_free(gerr);
598 g_free(path);
599 return;
600 }
601 g_free(path);
602 vdev->compat = contents;
603 for (vdev->num_compat = 0; length; vdev->num_compat++) {
604 size_t skip = strlen(contents) + 1;
605 contents += skip;
606 length -= skip;
607 }
608 }
609
Eric Auger0ea27302015-06-08 09:25:25 -0600610 for (i = 0; i < vbasedev->num_regions; i++) {
Alex Williamsondb0da022016-03-10 09:39:07 -0700611 if (vfio_region_mmap(vdev->regions[i])) {
Markus Armbrustere1eb2922018-10-17 10:26:29 +0200612 warn_report("%s mmap unsupported, performance may be slow",
613 memory_region_name(vdev->regions[i]->mem));
Alex Williamsondb0da022016-03-10 09:39:07 -0700614 }
615 sysbus_init_mmio(sbdev, vdev->regions[i]->mem);
Eric Auger0ea27302015-06-08 09:25:25 -0600616 }
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800617 return;
Eric Auger9bdbfbd2016-10-17 10:58:01 -0600618
Zhenzhong Duan958609c2024-05-22 12:40:01 +0800619init_err:
Eric Auger9bdbfbd2016-10-17 10:58:01 -0600620 if (vdev->vbasedev.name) {
Markus Armbrusterc3b8e3e2018-10-17 10:26:30 +0200621 error_prepend(errp, VFIO_MSG_PREFIX, vdev->vbasedev.name);
Eric Auger9bdbfbd2016-10-17 10:58:01 -0600622 } else {
623 error_prepend(errp, "vfio error: ");
624 }
Eric Auger0ea27302015-06-08 09:25:25 -0600625}
626
627static const VMStateDescription vfio_platform_vmstate = {
Li Qiangda56e332019-05-21 08:15:41 -0700628 .name = "vfio-platform",
Eric Auger0ea27302015-06-08 09:25:25 -0600629 .unmigratable = 1,
630};
631
632static Property vfio_platform_dev_properties[] = {
633 DEFINE_PROP_STRING("host", VFIOPlatformDevice, vbasedev.name),
Alex Williamson7df93812016-03-10 09:39:07 -0700634 DEFINE_PROP_STRING("sysfsdev", VFIOPlatformDevice, vbasedev.sysfsdev),
Alex Williamson5e15d792015-09-23 13:04:44 -0600635 DEFINE_PROP_BOOL("x-no-mmap", VFIOPlatformDevice, vbasedev.no_mmap, false),
Eric Auger38559972015-06-08 09:25:26 -0600636 DEFINE_PROP_UINT32("mmap-timeout-ms", VFIOPlatformDevice,
637 mmap_timeout, 1100),
Eric Augerfb5f8162015-07-06 12:15:14 -0600638 DEFINE_PROP_BOOL("x-irqfd", VFIOPlatformDevice, irqfd_allowed, true),
Zhenzhong Duana6c50e12023-11-21 16:44:11 +0800639#ifdef CONFIG_IOMMUFD
640 DEFINE_PROP_LINK("iommufd", VFIOPlatformDevice, vbasedev.iommufd,
641 TYPE_IOMMUFD_BACKEND, IOMMUFDBackend *),
642#endif
Eric Auger0ea27302015-06-08 09:25:25 -0600643 DEFINE_PROP_END_OF_LIST(),
644};
645
Zhenzhong Duan3016e602023-11-21 16:44:12 +0800646static void vfio_platform_instance_init(Object *obj)
647{
648 VFIOPlatformDevice *vdev = VFIO_PLATFORM_DEVICE(obj);
Zhenzhong Duana0cf44c2023-11-21 16:44:22 +0800649 VFIODevice *vbasedev = &vdev->vbasedev;
Zhenzhong Duan3016e602023-11-21 16:44:12 +0800650
Zhenzhong Duan6106a322023-11-21 16:44:25 +0800651 vfio_device_init(vbasedev, VFIO_DEVICE_TYPE_PLATFORM, &vfio_platform_ops,
652 DEVICE(vdev), false);
Zhenzhong Duan3016e602023-11-21 16:44:12 +0800653}
654
#ifdef CONFIG_IOMMUFD
/* Setter of the "fd" property: forwards @str to vfio_device_set_fd(). */
static void vfio_platform_set_fd(Object *obj, const char *str, Error **errp)
{
    VFIOPlatformDevice *vdev = VFIO_PLATFORM_DEVICE(obj);

    vfio_device_set_fd(&vdev->vbasedev, str, errp);
}
#endif
661
Eric Auger0ea27302015-06-08 09:25:25 -0600662static void vfio_platform_class_init(ObjectClass *klass, void *data)
663{
664 DeviceClass *dc = DEVICE_CLASS(klass);
Eric Augerfb5f8162015-07-06 12:15:14 -0600665 SysBusDeviceClass *sbc = SYS_BUS_DEVICE_CLASS(klass);
Eric Auger0ea27302015-06-08 09:25:25 -0600666
667 dc->realize = vfio_platform_realize;
Marc-André Lureau4f67d302020-01-10 19:30:32 +0400668 device_class_set_props(dc, vfio_platform_dev_properties);
Zhenzhong Duan3016e602023-11-21 16:44:12 +0800669#ifdef CONFIG_IOMMUFD
670 object_class_property_add_str(klass, "fd", NULL, vfio_platform_set_fd);
671#endif
Eric Auger0ea27302015-06-08 09:25:25 -0600672 dc->vmsd = &vfio_platform_vmstate;
673 dc->desc = "VFIO-based platform device assignment";
Eric Augerfb5f8162015-07-06 12:15:14 -0600674 sbc->connect_irq_notifier = vfio_start_irqfd_injection;
Eric Auger0ea27302015-06-08 09:25:25 -0600675 set_bit(DEVICE_CATEGORY_MISC, dc->categories);
Eric Augera49531e2018-10-15 10:52:09 -0600676 /* Supported by TYPE_VIRT_MACHINE */
677 dc->user_creatable = true;
Eric Auger0ea27302015-06-08 09:25:25 -0600678}
679
680static const TypeInfo vfio_platform_dev_info = {
681 .name = TYPE_VFIO_PLATFORM,
682 .parent = TYPE_SYS_BUS_DEVICE,
683 .instance_size = sizeof(VFIOPlatformDevice),
Zhenzhong Duan3016e602023-11-21 16:44:12 +0800684 .instance_init = vfio_platform_instance_init,
Eric Auger0ea27302015-06-08 09:25:25 -0600685 .class_init = vfio_platform_class_init,
686 .class_size = sizeof(VFIOPlatformDeviceClass),
Eric Auger0ea27302015-06-08 09:25:25 -0600687};
688
689static void register_vfio_platform_dev_type(void)
690{
691 type_register_static(&vfio_platform_dev_info);
692}
693
694type_init(register_vfio_platform_dev_type)