blob: 001aeda4c154d4a9ff5b2e9f73cebdc743c2c29b [file] [log] [blame]
/*
 * kvm eventfd support - use eventfd objects to signal various KVM events
 *
 * Copyright 2009 Novell. All Rights Reserved.
 * Copyright 2010 Red Hat, Inc. and/or its affiliates.
 *
 * Author:
 *	Gregory Haskins <ghaskins@novell.com>
 *
 * This file is free software; you can redistribute it and/or modify
 * it under the terms of version 2 of the GNU General Public License
 * as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA.
 */
23
24#include <linux/kvm_host.h>
Gregory Haskinsd34e6b12009-07-07 17:08:49 -040025#include <linux/kvm.h>
Eric Auger166c9772015-09-18 22:29:42 +080026#include <linux/kvm_irqfd.h>
Gregory Haskins721eecbf2009-05-20 10:30:49 -040027#include <linux/workqueue.h>
28#include <linux/syscalls.h>
29#include <linux/wait.h>
30#include <linux/poll.h>
31#include <linux/file.h>
32#include <linux/list.h>
33#include <linux/eventfd.h>
Gregory Haskinsd34e6b12009-07-07 17:08:49 -040034#include <linux/kernel.h>
Christian Borntraeger719d93c2014-01-16 13:44:20 +010035#include <linux/srcu.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090036#include <linux/slab.h>
Paul Mackerras56f89f362014-06-30 20:51:09 +100037#include <linux/seqlock.h>
Eric Auger9016cfb2015-09-18 22:29:44 +080038#include <linux/irqbypass.h>
Paul Mackerrase4d57e12014-06-30 20:51:12 +100039#include <trace/events/kvm.h>
Gregory Haskinsd34e6b12009-07-07 17:08:49 -040040
Andre Przywaraaf669ac2015-03-26 14:39:29 +000041#include <kvm/iodev.h>
Gregory Haskins721eecbf2009-05-20 10:30:49 -040042
Paul Mackerras297e2102014-06-30 20:51:13 +100043#ifdef CONFIG_HAVE_KVM_IRQFD
Gregory Haskins721eecbf2009-05-20 10:30:49 -040044
/*
 * Workqueue that carries the irqfd ->shutdown work items.  It is allocated
 * in kvm_irqfd_init(), fed by irqfd_deactivate(), flushed by the deassign
 * and release paths, and destroyed in kvm_irqfd_exit().
 */
static struct workqueue_struct *irqfd_cleanup_wq;
Gregory Haskins721eecbf2009-05-20 10:30:49 -040046
47static void
48irqfd_inject(struct work_struct *work)
49{
Eric Auger166c9772015-09-18 22:29:42 +080050 struct kvm_kernel_irqfd *irqfd =
51 container_of(work, struct kvm_kernel_irqfd, inject);
Gregory Haskins721eecbf2009-05-20 10:30:49 -040052 struct kvm *kvm = irqfd->kvm;
53
Alex Williamson7a844282012-09-21 11:58:03 -060054 if (!irqfd->resampler) {
Yang Zhangaa2fbe62013-04-11 19:21:40 +080055 kvm_set_irq(kvm, KVM_USERSPACE_IRQ_SOURCE_ID, irqfd->gsi, 1,
56 false);
57 kvm_set_irq(kvm, KVM_USERSPACE_IRQ_SOURCE_ID, irqfd->gsi, 0,
58 false);
Alex Williamson7a844282012-09-21 11:58:03 -060059 } else
60 kvm_set_irq(kvm, KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID,
Yang Zhangaa2fbe62013-04-11 19:21:40 +080061 irqfd->gsi, 1, false);
Alex Williamson7a844282012-09-21 11:58:03 -060062}
63
64/*
65 * Since resampler irqfds share an IRQ source ID, we de-assert once
66 * then notify all of the resampler irqfds using this GSI. We can't
67 * do multiple de-asserts or we risk racing with incoming re-asserts.
68 */
69static void
70irqfd_resampler_ack(struct kvm_irq_ack_notifier *kian)
71{
Eric Auger166c9772015-09-18 22:29:42 +080072 struct kvm_kernel_irqfd_resampler *resampler;
Christian Borntraeger719d93c2014-01-16 13:44:20 +010073 struct kvm *kvm;
Eric Auger166c9772015-09-18 22:29:42 +080074 struct kvm_kernel_irqfd *irqfd;
Christian Borntraeger719d93c2014-01-16 13:44:20 +010075 int idx;
Alex Williamson7a844282012-09-21 11:58:03 -060076
Eric Auger166c9772015-09-18 22:29:42 +080077 resampler = container_of(kian,
78 struct kvm_kernel_irqfd_resampler, notifier);
Christian Borntraeger719d93c2014-01-16 13:44:20 +010079 kvm = resampler->kvm;
Alex Williamson7a844282012-09-21 11:58:03 -060080
Christian Borntraeger719d93c2014-01-16 13:44:20 +010081 kvm_set_irq(kvm, KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID,
Yang Zhangaa2fbe62013-04-11 19:21:40 +080082 resampler->notifier.gsi, 0, false);
Alex Williamson7a844282012-09-21 11:58:03 -060083
Christian Borntraeger719d93c2014-01-16 13:44:20 +010084 idx = srcu_read_lock(&kvm->irq_srcu);
Alex Williamson7a844282012-09-21 11:58:03 -060085
86 list_for_each_entry_rcu(irqfd, &resampler->list, resampler_link)
87 eventfd_signal(irqfd->resamplefd, 1);
88
Christian Borntraeger719d93c2014-01-16 13:44:20 +010089 srcu_read_unlock(&kvm->irq_srcu, idx);
Alex Williamson7a844282012-09-21 11:58:03 -060090}
91
92static void
Eric Auger166c9772015-09-18 22:29:42 +080093irqfd_resampler_shutdown(struct kvm_kernel_irqfd *irqfd)
Alex Williamson7a844282012-09-21 11:58:03 -060094{
Eric Auger166c9772015-09-18 22:29:42 +080095 struct kvm_kernel_irqfd_resampler *resampler = irqfd->resampler;
Alex Williamson7a844282012-09-21 11:58:03 -060096 struct kvm *kvm = resampler->kvm;
97
98 mutex_lock(&kvm->irqfds.resampler_lock);
99
100 list_del_rcu(&irqfd->resampler_link);
Christian Borntraeger719d93c2014-01-16 13:44:20 +0100101 synchronize_srcu(&kvm->irq_srcu);
Alex Williamson7a844282012-09-21 11:58:03 -0600102
103 if (list_empty(&resampler->list)) {
104 list_del(&resampler->link);
105 kvm_unregister_irq_ack_notifier(kvm, &resampler->notifier);
106 kvm_set_irq(kvm, KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID,
Yang Zhangaa2fbe62013-04-11 19:21:40 +0800107 resampler->notifier.gsi, 0, false);
Alex Williamson7a844282012-09-21 11:58:03 -0600108 kfree(resampler);
109 }
110
111 mutex_unlock(&kvm->irqfds.resampler_lock);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400112}
113
114/*
115 * Race-free decouple logic (ordering is critical)
116 */
117static void
118irqfd_shutdown(struct work_struct *work)
119{
Eric Auger166c9772015-09-18 22:29:42 +0800120 struct kvm_kernel_irqfd *irqfd =
121 container_of(work, struct kvm_kernel_irqfd, shutdown);
Lan Tianyub5020a82017-12-21 21:10:36 -0500122 struct kvm *kvm = irqfd->kvm;
Michael S. Tsirkinb6a114d2010-01-13 19:12:30 +0200123 u64 cnt;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400124
Lan Tianyub5020a82017-12-21 21:10:36 -0500125 /* Make sure irqfd has been initalized in assign path. */
126 synchronize_srcu(&kvm->irq_srcu);
127
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400128 /*
129 * Synchronize with the wait-queue and unhook ourselves to prevent
130 * further events.
131 */
Michael S. Tsirkinb6a114d2010-01-13 19:12:30 +0200132 eventfd_ctx_remove_wait_queue(irqfd->eventfd, &irqfd->wait, &cnt);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400133
134 /*
135 * We know no new events will be scheduled at this point, so block
136 * until all previously outstanding events have completed
137 */
Tejun Heo43829732012-08-20 14:51:24 -0700138 flush_work(&irqfd->inject);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400139
Alex Williamson7a844282012-09-21 11:58:03 -0600140 if (irqfd->resampler) {
141 irqfd_resampler_shutdown(irqfd);
142 eventfd_ctx_put(irqfd->resamplefd);
143 }
144
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400145 /*
146 * It is now safe to release the object's resources
147 */
Eric Auger9016cfb2015-09-18 22:29:44 +0800148#ifdef CONFIG_HAVE_KVM_IRQ_BYPASS
149 irq_bypass_unregister_consumer(&irqfd->consumer);
150#endif
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400151 eventfd_ctx_put(irqfd->eventfd);
152 kfree(irqfd);
153}
154
155
156/* assumes kvm->irqfds.lock is held */
157static bool
Eric Auger166c9772015-09-18 22:29:42 +0800158irqfd_is_active(struct kvm_kernel_irqfd *irqfd)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400159{
160 return list_empty(&irqfd->list) ? false : true;
161}
162
163/*
164 * Mark the irqfd as inactive and schedule it for removal
165 *
166 * assumes kvm->irqfds.lock is held
167 */
168static void
Eric Auger166c9772015-09-18 22:29:42 +0800169irqfd_deactivate(struct kvm_kernel_irqfd *irqfd)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400170{
171 BUG_ON(!irqfd_is_active(irqfd));
172
173 list_del_init(&irqfd->list);
174
Paolo Bonzini36343f62016-10-26 13:35:56 +0200175 queue_work(irqfd_cleanup_wq, &irqfd->shutdown);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400176}
177
/*
 * Weak default for injecting an interrupt from atomic context.
 *
 * This fallback never injects anything; it always returns -EWOULDBLOCK,
 * which makes irqfd_wakeup() defer the injection to the ->inject work item.
 */
int __attribute__((weak))
kvm_arch_set_irq_inatomic(struct kvm_kernel_irq_routing_entry *irq,
			  struct kvm *kvm, int irq_source_id, int level,
			  bool line_status)
{
	return -EWOULDBLOCK;
}
186
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400187/*
188 * Called with wqh->lock held and interrupts disabled
189 */
190static int
Ingo Molnarac6424b2017-06-20 12:06:13 +0200191irqfd_wakeup(wait_queue_entry_t *wait, unsigned mode, int sync, void *key)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400192{
Eric Auger166c9772015-09-18 22:29:42 +0800193 struct kvm_kernel_irqfd *irqfd =
194 container_of(wait, struct kvm_kernel_irqfd, wait);
Al Viro3ad6f932017-07-03 20:14:56 -0400195 __poll_t flags = key_to_poll(key);
Paul Mackerras56f89f362014-06-30 20:51:09 +1000196 struct kvm_kernel_irq_routing_entry irq;
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200197 struct kvm *kvm = irqfd->kvm;
Paul Mackerras56f89f362014-06-30 20:51:09 +1000198 unsigned seq;
Christian Borntraeger719d93c2014-01-16 13:44:20 +0100199 int idx;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400200
Linus Torvaldsa9a08842018-02-11 14:34:03 -0800201 if (flags & EPOLLIN) {
Christian Borntraeger719d93c2014-01-16 13:44:20 +0100202 idx = srcu_read_lock(&kvm->irq_srcu);
Paul Mackerras56f89f362014-06-30 20:51:09 +1000203 do {
204 seq = read_seqcount_begin(&irqfd->irq_entry_sc);
205 irq = irqfd->irq_entry;
206 } while (read_seqcount_retry(&irqfd->irq_entry_sc, seq));
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400207 /* An event has been signaled, inject an interrupt */
Paolo Bonzinib97e6de2015-10-28 19:16:47 +0100208 if (kvm_arch_set_irq_inatomic(&irq, kvm,
209 KVM_USERSPACE_IRQ_SOURCE_ID, 1,
210 false) == -EWOULDBLOCK)
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200211 schedule_work(&irqfd->inject);
Christian Borntraeger719d93c2014-01-16 13:44:20 +0100212 srcu_read_unlock(&kvm->irq_srcu, idx);
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200213 }
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400214
Linus Torvaldsa9a08842018-02-11 14:34:03 -0800215 if (flags & EPOLLHUP) {
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400216 /* The eventfd is closing, detach from KVM */
Sebastian Andrzej Siewiorca0488a2019-03-15 18:58:15 +0100217 unsigned long iflags;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400218
Sebastian Andrzej Siewiorca0488a2019-03-15 18:58:15 +0100219 spin_lock_irqsave(&kvm->irqfds.lock, iflags);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400220
221 /*
222 * We must check if someone deactivated the irqfd before
223 * we could acquire the irqfds.lock since the item is
224 * deactivated from the KVM side before it is unhooked from
225 * the wait-queue. If it is already deactivated, we can
226 * simply return knowing the other side will cleanup for us.
227 * We cannot race against the irqfd going away since the
228 * other side is required to acquire wqh->lock, which we hold
229 */
230 if (irqfd_is_active(irqfd))
231 irqfd_deactivate(irqfd);
232
Sebastian Andrzej Siewiorca0488a2019-03-15 18:58:15 +0100233 spin_unlock_irqrestore(&kvm->irqfds.lock, iflags);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400234 }
235
236 return 0;
237}
238
239static void
240irqfd_ptable_queue_proc(struct file *file, wait_queue_head_t *wqh,
241 poll_table *pt)
242{
Eric Auger166c9772015-09-18 22:29:42 +0800243 struct kvm_kernel_irqfd *irqfd =
244 container_of(pt, struct kvm_kernel_irqfd, pt);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400245 add_wait_queue(wqh, &irqfd->wait);
246}
247
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200248/* Must be called under irqfds.lock */
Eric Auger166c9772015-09-18 22:29:42 +0800249static void irqfd_update(struct kvm *kvm, struct kvm_kernel_irqfd *irqfd)
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200250{
251 struct kvm_kernel_irq_routing_entry *e;
Paul Mackerras8ba918d2014-06-30 20:51:10 +1000252 struct kvm_kernel_irq_routing_entry entries[KVM_NR_IRQCHIPS];
Andrey Smetanin351dc6472015-10-16 10:07:45 +0300253 int n_entries;
Paul Mackerras8ba918d2014-06-30 20:51:10 +1000254
Paul Mackerras9957c862014-06-30 20:51:11 +1000255 n_entries = kvm_irq_map_gsi(kvm, entries, irqfd->gsi);
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200256
Paul Mackerras56f89f362014-06-30 20:51:09 +1000257 write_seqcount_begin(&irqfd->irq_entry_sc);
258
Paul Mackerras8ba918d2014-06-30 20:51:10 +1000259 e = entries;
Andrey Smetanin351dc6472015-10-16 10:07:45 +0300260 if (n_entries == 1)
261 irqfd->irq_entry = *e;
262 else
263 irqfd->irq_entry.type = 0;
Paul Mackerras56f89f362014-06-30 20:51:09 +1000264
Paul Mackerras56f89f362014-06-30 20:51:09 +1000265 write_seqcount_end(&irqfd->irq_entry_sc);
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200266}
267
Eric Auger1a02b272015-09-18 22:29:43 +0800268#ifdef CONFIG_HAVE_KVM_IRQ_BYPASS
/* Weak default for the irq-bypass consumer ->stop hook: does nothing. */
void __attribute__((weak))
kvm_arch_irq_bypass_stop(struct irq_bypass_consumer *cons)
{
}
273
/* Weak default for the irq-bypass consumer ->start hook: does nothing. */
void __attribute__((weak))
kvm_arch_irq_bypass_start(struct irq_bypass_consumer *cons)
{
}
Feng Wuf70c20a2015-09-18 22:29:53 +0800278
/*
 * Weak default for the arch hook invoked from kvm_irq_routing_update() for
 * irqfds that have a bypass producer.  This fallback does nothing and
 * reports success (0).
 */
int __attribute__((weak))
kvm_arch_update_irqfd_routing(struct kvm *kvm, unsigned int host_irq,
			      uint32_t guest_irq, bool set)
{
	return 0;
}
Eric Auger1a02b272015-09-18 22:29:43 +0800285#endif
286
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400287static int
Alex Williamsond4db2932012-06-29 09:56:08 -0600288kvm_irqfd_assign(struct kvm *kvm, struct kvm_irqfd *args)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400289{
Eric Auger166c9772015-09-18 22:29:42 +0800290 struct kvm_kernel_irqfd *irqfd, *tmp;
Al Virocffe78d2013-08-30 15:47:17 -0400291 struct fd f;
Alex Williamson7a844282012-09-21 11:58:03 -0600292 struct eventfd_ctx *eventfd = NULL, *resamplefd = NULL;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400293 int ret;
Al Viroe6c8adc2017-07-03 22:25:56 -0400294 __poll_t events;
Paul Mackerras9957c862014-06-30 20:51:11 +1000295 int idx;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400296
Eric Auger01c94e62015-03-04 11:14:33 +0100297 if (!kvm_arch_intc_initialized(kvm))
298 return -EAGAIN;
299
Ben Gardonb12ce362019-02-11 11:02:49 -0800300 irqfd = kzalloc(sizeof(*irqfd), GFP_KERNEL_ACCOUNT);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400301 if (!irqfd)
302 return -ENOMEM;
303
304 irqfd->kvm = kvm;
Alex Williamsond4db2932012-06-29 09:56:08 -0600305 irqfd->gsi = args->gsi;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400306 INIT_LIST_HEAD(&irqfd->list);
307 INIT_WORK(&irqfd->inject, irqfd_inject);
308 INIT_WORK(&irqfd->shutdown, irqfd_shutdown);
Paul Mackerras56f89f362014-06-30 20:51:09 +1000309 seqcount_init(&irqfd->irq_entry_sc);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400310
Al Virocffe78d2013-08-30 15:47:17 -0400311 f = fdget(args->fd);
312 if (!f.file) {
313 ret = -EBADF;
314 goto out;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400315 }
316
Al Virocffe78d2013-08-30 15:47:17 -0400317 eventfd = eventfd_ctx_fileget(f.file);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400318 if (IS_ERR(eventfd)) {
319 ret = PTR_ERR(eventfd);
320 goto fail;
321 }
322
323 irqfd->eventfd = eventfd;
324
Alex Williamson7a844282012-09-21 11:58:03 -0600325 if (args->flags & KVM_IRQFD_FLAG_RESAMPLE) {
Eric Auger166c9772015-09-18 22:29:42 +0800326 struct kvm_kernel_irqfd_resampler *resampler;
Alex Williamson7a844282012-09-21 11:58:03 -0600327
328 resamplefd = eventfd_ctx_fdget(args->resamplefd);
329 if (IS_ERR(resamplefd)) {
330 ret = PTR_ERR(resamplefd);
331 goto fail;
332 }
333
334 irqfd->resamplefd = resamplefd;
335 INIT_LIST_HEAD(&irqfd->resampler_link);
336
337 mutex_lock(&kvm->irqfds.resampler_lock);
338
339 list_for_each_entry(resampler,
Alex Williamson49f8a1a2012-12-06 14:44:59 -0700340 &kvm->irqfds.resampler_list, link) {
Alex Williamson7a844282012-09-21 11:58:03 -0600341 if (resampler->notifier.gsi == irqfd->gsi) {
342 irqfd->resampler = resampler;
343 break;
344 }
345 }
346
347 if (!irqfd->resampler) {
Ben Gardonb12ce362019-02-11 11:02:49 -0800348 resampler = kzalloc(sizeof(*resampler),
349 GFP_KERNEL_ACCOUNT);
Alex Williamson7a844282012-09-21 11:58:03 -0600350 if (!resampler) {
351 ret = -ENOMEM;
352 mutex_unlock(&kvm->irqfds.resampler_lock);
353 goto fail;
354 }
355
356 resampler->kvm = kvm;
357 INIT_LIST_HEAD(&resampler->list);
358 resampler->notifier.gsi = irqfd->gsi;
359 resampler->notifier.irq_acked = irqfd_resampler_ack;
360 INIT_LIST_HEAD(&resampler->link);
361
362 list_add(&resampler->link, &kvm->irqfds.resampler_list);
363 kvm_register_irq_ack_notifier(kvm,
364 &resampler->notifier);
365 irqfd->resampler = resampler;
366 }
367
368 list_add_rcu(&irqfd->resampler_link, &irqfd->resampler->list);
Christian Borntraeger719d93c2014-01-16 13:44:20 +0100369 synchronize_srcu(&kvm->irq_srcu);
Alex Williamson7a844282012-09-21 11:58:03 -0600370
371 mutex_unlock(&kvm->irqfds.resampler_lock);
372 }
373
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400374 /*
375 * Install our own custom wake-up handling so we are notified via
376 * a callback whenever someone signals the underlying eventfd
377 */
378 init_waitqueue_func_entry(&irqfd->wait, irqfd_wakeup);
379 init_poll_funcptr(&irqfd->pt, irqfd_ptable_queue_proc);
380
Michael S. Tsirkinf1d1c302010-01-13 18:58:09 +0200381 spin_lock_irq(&kvm->irqfds.lock);
382
383 ret = 0;
384 list_for_each_entry(tmp, &kvm->irqfds.items, list) {
385 if (irqfd->eventfd != tmp->eventfd)
386 continue;
387 /* This fd is used for another irq already. */
388 ret = -EBUSY;
389 spin_unlock_irq(&kvm->irqfds.lock);
390 goto fail;
391 }
392
Paul Mackerras9957c862014-06-30 20:51:11 +1000393 idx = srcu_read_lock(&kvm->irq_srcu);
394 irqfd_update(kvm, irqfd);
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200395
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400396 list_add_tail(&irqfd->list, &kvm->irqfds.items);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400397
Cornelia Huck684a0b72014-03-17 19:11:35 +0100398 spin_unlock_irq(&kvm->irqfds.lock);
399
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400400 /*
401 * Check if there was an event already pending on the eventfd
402 * before we registered, and trigger it as if we didn't miss it.
403 */
Christoph Hellwig9965ed172018-03-05 07:26:05 -0800404 events = vfs_poll(f.file, &irqfd->pt);
Cornelia Huck684a0b72014-03-17 19:11:35 +0100405
Linus Torvaldsa9a08842018-02-11 14:34:03 -0800406 if (events & EPOLLIN)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400407 schedule_work(&irqfd->inject);
408
Eric Auger9016cfb2015-09-18 22:29:44 +0800409#ifdef CONFIG_HAVE_KVM_IRQ_BYPASS
Alex Williamson14717e22016-05-05 11:58:35 -0600410 if (kvm_arch_has_irq_bypass()) {
411 irqfd->consumer.token = (void *)irqfd->eventfd;
412 irqfd->consumer.add_producer = kvm_arch_irq_bypass_add_producer;
413 irqfd->consumer.del_producer = kvm_arch_irq_bypass_del_producer;
414 irqfd->consumer.stop = kvm_arch_irq_bypass_stop;
415 irqfd->consumer.start = kvm_arch_irq_bypass_start;
416 ret = irq_bypass_register_consumer(&irqfd->consumer);
417 if (ret)
418 pr_info("irq bypass consumer (token %p) registration fails: %d\n",
Eric Auger9016cfb2015-09-18 22:29:44 +0800419 irqfd->consumer.token, ret);
Alex Williamson14717e22016-05-05 11:58:35 -0600420 }
Eric Auger9016cfb2015-09-18 22:29:44 +0800421#endif
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400422
Lan Tianyub5020a82017-12-21 21:10:36 -0500423 srcu_read_unlock(&kvm->irq_srcu, idx);
Paolo Bonzini9432a312018-05-28 13:31:13 +0200424
425 /*
426 * do not drop the file until the irqfd is fully initialized, otherwise
427 * we might race against the EPOLLHUP
428 */
429 fdput(f);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400430 return 0;
431
432fail:
Alex Williamson7a844282012-09-21 11:58:03 -0600433 if (irqfd->resampler)
434 irqfd_resampler_shutdown(irqfd);
435
436 if (resamplefd && !IS_ERR(resamplefd))
437 eventfd_ctx_put(resamplefd);
438
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400439 if (eventfd && !IS_ERR(eventfd))
440 eventfd_ctx_put(eventfd);
441
Al Virocffe78d2013-08-30 15:47:17 -0400442 fdput(f);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400443
Al Virocffe78d2013-08-30 15:47:17 -0400444out:
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400445 kfree(irqfd);
446 return ret;
447}
Paolo Bonzinic77dcac2014-08-06 14:24:45 +0200448
449bool kvm_irq_has_notifier(struct kvm *kvm, unsigned irqchip, unsigned pin)
450{
451 struct kvm_irq_ack_notifier *kian;
452 int gsi, idx;
453
454 idx = srcu_read_lock(&kvm->irq_srcu);
455 gsi = kvm_irq_map_chip_pin(kvm, irqchip, pin);
456 if (gsi != -1)
457 hlist_for_each_entry_rcu(kian, &kvm->irq_ack_notifier_list,
458 link)
459 if (kian->gsi == gsi) {
460 srcu_read_unlock(&kvm->irq_srcu, idx);
461 return true;
462 }
463
464 srcu_read_unlock(&kvm->irq_srcu, idx);
465
466 return false;
467}
468EXPORT_SYMBOL_GPL(kvm_irq_has_notifier);
469
Andrey Smetaninba1aefc2015-10-16 10:07:46 +0300470void kvm_notify_acked_gsi(struct kvm *kvm, int gsi)
Paolo Bonzinic77dcac2014-08-06 14:24:45 +0200471{
472 struct kvm_irq_ack_notifier *kian;
Andrey Smetaninba1aefc2015-10-16 10:07:46 +0300473
474 hlist_for_each_entry_rcu(kian, &kvm->irq_ack_notifier_list,
475 link)
476 if (kian->gsi == gsi)
477 kian->irq_acked(kian);
478}
479
480void kvm_notify_acked_irq(struct kvm *kvm, unsigned irqchip, unsigned pin)
481{
Paolo Bonzinic77dcac2014-08-06 14:24:45 +0200482 int gsi, idx;
483
484 trace_kvm_ack_irq(irqchip, pin);
485
486 idx = srcu_read_lock(&kvm->irq_srcu);
487 gsi = kvm_irq_map_chip_pin(kvm, irqchip, pin);
488 if (gsi != -1)
Andrey Smetaninba1aefc2015-10-16 10:07:46 +0300489 kvm_notify_acked_gsi(kvm, gsi);
Paolo Bonzinic77dcac2014-08-06 14:24:45 +0200490 srcu_read_unlock(&kvm->irq_srcu, idx);
491}
492
493void kvm_register_irq_ack_notifier(struct kvm *kvm,
494 struct kvm_irq_ack_notifier *kian)
495{
496 mutex_lock(&kvm->irq_lock);
497 hlist_add_head_rcu(&kian->link, &kvm->irq_ack_notifier_list);
498 mutex_unlock(&kvm->irq_lock);
David Hildenbrand993225a2017-04-07 10:50:33 +0200499 kvm_arch_post_irq_ack_notifier_list_update(kvm);
Paolo Bonzinic77dcac2014-08-06 14:24:45 +0200500}
501
502void kvm_unregister_irq_ack_notifier(struct kvm *kvm,
503 struct kvm_irq_ack_notifier *kian)
504{
505 mutex_lock(&kvm->irq_lock);
506 hlist_del_init_rcu(&kian->link);
507 mutex_unlock(&kvm->irq_lock);
508 synchronize_srcu(&kvm->irq_srcu);
David Hildenbrand993225a2017-04-07 10:50:33 +0200509 kvm_arch_post_irq_ack_notifier_list_update(kvm);
Paolo Bonzinic77dcac2014-08-06 14:24:45 +0200510}
Alexander Graf914daba2012-10-09 00:22:59 +0200511#endif
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400512
513void
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400514kvm_eventfd_init(struct kvm *kvm)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400515{
Paul Mackerras297e2102014-06-30 20:51:13 +1000516#ifdef CONFIG_HAVE_KVM_IRQFD
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400517 spin_lock_init(&kvm->irqfds.lock);
518 INIT_LIST_HEAD(&kvm->irqfds.items);
Alex Williamson7a844282012-09-21 11:58:03 -0600519 INIT_LIST_HEAD(&kvm->irqfds.resampler_list);
520 mutex_init(&kvm->irqfds.resampler_lock);
Alexander Graf914daba2012-10-09 00:22:59 +0200521#endif
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400522 INIT_LIST_HEAD(&kvm->ioeventfds);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400523}
524
Paul Mackerras297e2102014-06-30 20:51:13 +1000525#ifdef CONFIG_HAVE_KVM_IRQFD
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400526/*
527 * shutdown any irqfd's that match fd+gsi
528 */
529static int
Alex Williamsond4db2932012-06-29 09:56:08 -0600530kvm_irqfd_deassign(struct kvm *kvm, struct kvm_irqfd *args)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400531{
Eric Auger166c9772015-09-18 22:29:42 +0800532 struct kvm_kernel_irqfd *irqfd, *tmp;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400533 struct eventfd_ctx *eventfd;
534
Alex Williamsond4db2932012-06-29 09:56:08 -0600535 eventfd = eventfd_ctx_fdget(args->fd);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400536 if (IS_ERR(eventfd))
537 return PTR_ERR(eventfd);
538
539 spin_lock_irq(&kvm->irqfds.lock);
540
541 list_for_each_entry_safe(irqfd, tmp, &kvm->irqfds.items, list) {
Alex Williamsond4db2932012-06-29 09:56:08 -0600542 if (irqfd->eventfd == eventfd && irqfd->gsi == args->gsi) {
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200543 /*
Paul Mackerras56f89f362014-06-30 20:51:09 +1000544 * This clearing of irq_entry.type is needed for when
Michael S. Tsirkinc8ce0572011-03-06 13:03:26 +0200545 * another thread calls kvm_irq_routing_update before
546 * we flush workqueue below (we synchronize with
547 * kvm_irq_routing_update using irqfds.lock).
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200548 */
Paul Mackerras56f89f362014-06-30 20:51:09 +1000549 write_seqcount_begin(&irqfd->irq_entry_sc);
550 irqfd->irq_entry.type = 0;
551 write_seqcount_end(&irqfd->irq_entry_sc);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400552 irqfd_deactivate(irqfd);
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200553 }
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400554 }
555
556 spin_unlock_irq(&kvm->irqfds.lock);
557 eventfd_ctx_put(eventfd);
558
559 /*
560 * Block until we know all outstanding shutdown jobs have completed
561 * so that we guarantee there will not be any more interrupts on this
562 * gsi once this deassign function returns.
563 */
Paolo Bonzini36343f62016-10-26 13:35:56 +0200564 flush_workqueue(irqfd_cleanup_wq);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400565
566 return 0;
567}
568
569int
Alex Williamsond4db2932012-06-29 09:56:08 -0600570kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400571{
Alex Williamson7a844282012-09-21 11:58:03 -0600572 if (args->flags & ~(KVM_IRQFD_FLAG_DEASSIGN | KVM_IRQFD_FLAG_RESAMPLE))
Alex Williamson326cf032012-06-29 09:56:24 -0600573 return -EINVAL;
574
Alex Williamsond4db2932012-06-29 09:56:08 -0600575 if (args->flags & KVM_IRQFD_FLAG_DEASSIGN)
576 return kvm_irqfd_deassign(kvm, args);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400577
Alex Williamsond4db2932012-06-29 09:56:08 -0600578 return kvm_irqfd_assign(kvm, args);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400579}
580
581/*
582 * This function is called as the kvm VM fd is being released. Shutdown all
583 * irqfds that still remain open
584 */
585void
586kvm_irqfd_release(struct kvm *kvm)
587{
Eric Auger166c9772015-09-18 22:29:42 +0800588 struct kvm_kernel_irqfd *irqfd, *tmp;
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400589
590 spin_lock_irq(&kvm->irqfds.lock);
591
592 list_for_each_entry_safe(irqfd, tmp, &kvm->irqfds.items, list)
593 irqfd_deactivate(irqfd);
594
595 spin_unlock_irq(&kvm->irqfds.lock);
596
597 /*
598 * Block until we know all outstanding shutdown jobs have completed
599 * since we do not take a kvm* reference.
600 */
Paolo Bonzini36343f62016-10-26 13:35:56 +0200601 flush_workqueue(irqfd_cleanup_wq);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400602
603}
604
605/*
Paul Mackerras9957c862014-06-30 20:51:11 +1000606 * Take note of a change in irq routing.
Christian Borntraeger719d93c2014-01-16 13:44:20 +0100607 * Caller must invoke synchronize_srcu(&kvm->irq_srcu) afterwards.
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200608 */
Paul Mackerras9957c862014-06-30 20:51:11 +1000609void kvm_irq_routing_update(struct kvm *kvm)
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200610{
Eric Auger166c9772015-09-18 22:29:42 +0800611 struct kvm_kernel_irqfd *irqfd;
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200612
613 spin_lock_irq(&kvm->irqfds.lock);
614
Feng Wuf70c20a2015-09-18 22:29:53 +0800615 list_for_each_entry(irqfd, &kvm->irqfds.items, list) {
Paul Mackerras9957c862014-06-30 20:51:11 +1000616 irqfd_update(kvm, irqfd);
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200617
Feng Wuf70c20a2015-09-18 22:29:53 +0800618#ifdef CONFIG_HAVE_KVM_IRQ_BYPASS
619 if (irqfd->producer) {
620 int ret = kvm_arch_update_irqfd_routing(
621 irqfd->kvm, irqfd->producer->irq,
622 irqfd->gsi, 1);
623 WARN_ON(ret);
624 }
625#endif
626 }
627
Michael S. Tsirkinbd2b53b2010-11-18 19:09:08 +0200628 spin_unlock_irq(&kvm->irqfds.lock);
629}
630
Paolo Bonzini36343f62016-10-26 13:35:56 +0200631/*
632 * create a host-wide workqueue for issuing deferred shutdown requests
633 * aggregated from all vm* instances. We need our own isolated
634 * queue to ease flushing work items when a VM exits.
635 */
636int kvm_irqfd_init(void)
637{
638 irqfd_cleanup_wq = alloc_workqueue("kvm-irqfd-cleanup", 0, 0);
639 if (!irqfd_cleanup_wq)
640 return -ENOMEM;
641
642 return 0;
643}
644
Cornelia Hucka0f155e2013-02-28 12:33:18 +0100645void kvm_irqfd_exit(void)
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400646{
Paolo Bonzini36343f62016-10-26 13:35:56 +0200647 destroy_workqueue(irqfd_cleanup_wq);
Gregory Haskins721eecbf2009-05-20 10:30:49 -0400648}
Alexander Graf914daba2012-10-09 00:22:59 +0200649#endif
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400650
/*
 * --------------------------------------------------------------------
 * ioeventfd: translate a PIO/MMIO memory write to an eventfd signal.
 *
 * userspace can register a PIO/MMIO address with an eventfd for receiving
 * notification when the memory has been touched.
 * --------------------------------------------------------------------
 */
659
660struct _ioeventfd {
661 struct list_head list;
662 u64 addr;
663 int length;
664 struct eventfd_ctx *eventfd;
665 u64 datamatch;
666 struct kvm_io_device dev;
Michael S. Tsirkin05e07f92013-04-04 13:27:21 +0300667 u8 bus_idx;
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400668 bool wildcard;
669};
670
671static inline struct _ioeventfd *
672to_ioeventfd(struct kvm_io_device *dev)
673{
674 return container_of(dev, struct _ioeventfd, dev);
675}
676
677static void
678ioeventfd_release(struct _ioeventfd *p)
679{
680 eventfd_ctx_put(p->eventfd);
681 list_del(&p->list);
682 kfree(p);
683}
684
685static bool
686ioeventfd_in_range(struct _ioeventfd *p, gpa_t addr, int len, const void *val)
687{
688 u64 _val;
689
Michael S. Tsirkinf848a5a2014-03-31 21:50:38 +0300690 if (addr != p->addr)
691 /* address must be precise for a hit */
692 return false;
693
694 if (!p->length)
695 /* length = 0 means only look at the address, so always a hit */
696 return true;
697
698 if (len != p->length)
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400699 /* address-range must be precise for a hit */
700 return false;
701
702 if (p->wildcard)
703 /* all else equal, wildcard is always a hit */
704 return true;
705
706 /* otherwise, we have to actually compare the data */
707
708 BUG_ON(!IS_ALIGNED((unsigned long)val, len));
709
710 switch (len) {
711 case 1:
712 _val = *(u8 *)val;
713 break;
714 case 2:
715 _val = *(u16 *)val;
716 break;
717 case 4:
718 _val = *(u32 *)val;
719 break;
720 case 8:
721 _val = *(u64 *)val;
722 break;
723 default:
724 return false;
725 }
726
727 return _val == p->datamatch ? true : false;
728}
729
730/* MMIO/PIO writes trigger an event if the addr/val match */
731static int
Nikolay Nikolaeve32edf42015-03-26 14:39:28 +0000732ioeventfd_write(struct kvm_vcpu *vcpu, struct kvm_io_device *this, gpa_t addr,
733 int len, const void *val)
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400734{
735 struct _ioeventfd *p = to_ioeventfd(this);
736
737 if (!ioeventfd_in_range(p, addr, len, val))
738 return -EOPNOTSUPP;
739
740 eventfd_signal(p->eventfd, 1);
741 return 0;
742}
743
/*
 * ->destructor handler.  This function is called as KVM is completely
 * shutting down.  We do not need to worry about locking; just nuke anything
 * we have as quickly as possible.
 */
static void
ioeventfd_destructor(struct kvm_io_device *this)
{
	ioeventfd_release(to_ioeventfd(this));
}
755
756static const struct kvm_io_device_ops ioeventfd_ops = {
757 .write = ioeventfd_write,
758 .destructor = ioeventfd_destructor,
759};
760
761/* assumes kvm->slots_lock held */
762static bool
763ioeventfd_check_collision(struct kvm *kvm, struct _ioeventfd *p)
764{
765 struct _ioeventfd *_p;
766
767 list_for_each_entry(_p, &kvm->ioeventfds, list)
Michael S. Tsirkin05e07f92013-04-04 13:27:21 +0300768 if (_p->bus_idx == p->bus_idx &&
Michael S. Tsirkinf848a5a2014-03-31 21:50:38 +0300769 _p->addr == p->addr &&
770 (!_p->length || !p->length ||
771 (_p->length == p->length &&
772 (_p->wildcard || p->wildcard ||
773 _p->datamatch == p->datamatch))))
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400774 return true;
775
776 return false;
777}
778
Cornelia Huck2b834512013-02-28 12:33:20 +0100779static enum kvm_bus ioeventfd_bus_from_flags(__u32 flags)
780{
781 if (flags & KVM_IOEVENTFD_FLAG_PIO)
782 return KVM_PIO_BUS;
783 if (flags & KVM_IOEVENTFD_FLAG_VIRTIO_CCW_NOTIFY)
784 return KVM_VIRTIO_CCW_NOTIFY_BUS;
785 return KVM_MMIO_BUS;
786}
787
Jason Wang85da11c2015-09-15 14:41:55 +0800788static int kvm_assign_ioeventfd_idx(struct kvm *kvm,
789 enum kvm_bus bus_idx,
790 struct kvm_ioeventfd *args)
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400791{
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400792
Jason Wang85da11c2015-09-15 14:41:55 +0800793 struct eventfd_ctx *eventfd;
794 struct _ioeventfd *p;
795 int ret;
Michael S. Tsirkinf848a5a2014-03-31 21:50:38 +0300796
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400797 eventfd = eventfd_ctx_fdget(args->fd);
798 if (IS_ERR(eventfd))
799 return PTR_ERR(eventfd);
800
Ben Gardonb12ce362019-02-11 11:02:49 -0800801 p = kzalloc(sizeof(*p), GFP_KERNEL_ACCOUNT);
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400802 if (!p) {
803 ret = -ENOMEM;
804 goto fail;
805 }
806
807 INIT_LIST_HEAD(&p->list);
808 p->addr = args->addr;
Michael S. Tsirkin05e07f92013-04-04 13:27:21 +0300809 p->bus_idx = bus_idx;
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400810 p->length = args->len;
811 p->eventfd = eventfd;
812
813 /* The datamatch feature is optional, otherwise this is a wildcard */
814 if (args->flags & KVM_IOEVENTFD_FLAG_DATAMATCH)
815 p->datamatch = args->datamatch;
816 else
817 p->wildcard = true;
818
Marcelo Tosatti79fac952009-12-23 14:35:26 -0200819 mutex_lock(&kvm->slots_lock);
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400820
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300821 /* Verify that there isn't a match already */
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400822 if (ioeventfd_check_collision(kvm, p)) {
823 ret = -EEXIST;
824 goto unlock_fail;
825 }
826
827 kvm_iodevice_init(&p->dev, &ioeventfd_ops);
828
Sasha Levin743eeb02011-07-27 16:00:48 +0300829 ret = kvm_io_bus_register_dev(kvm, bus_idx, p->addr, p->length,
830 &p->dev);
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400831 if (ret < 0)
832 goto unlock_fail;
833
Christian Borntraeger4a12f952017-07-07 10:51:38 +0200834 kvm_get_bus(kvm, bus_idx)->ioeventfd_count++;
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400835 list_add_tail(&p->list, &kvm->ioeventfds);
836
Marcelo Tosatti79fac952009-12-23 14:35:26 -0200837 mutex_unlock(&kvm->slots_lock);
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400838
839 return 0;
840
841unlock_fail:
Marcelo Tosatti79fac952009-12-23 14:35:26 -0200842 mutex_unlock(&kvm->slots_lock);
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400843
844fail:
845 kfree(p);
846 eventfd_ctx_put(eventfd);
847
848 return ret;
849}
850
851static int
Jason Wang85da11c2015-09-15 14:41:55 +0800852kvm_deassign_ioeventfd_idx(struct kvm *kvm, enum kvm_bus bus_idx,
853 struct kvm_ioeventfd *args)
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400854{
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400855 struct _ioeventfd *p, *tmp;
856 struct eventfd_ctx *eventfd;
Christian Borntraeger4a12f952017-07-07 10:51:38 +0200857 struct kvm_io_bus *bus;
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400858 int ret = -ENOENT;
859
860 eventfd = eventfd_ctx_fdget(args->fd);
861 if (IS_ERR(eventfd))
862 return PTR_ERR(eventfd);
863
Marcelo Tosatti79fac952009-12-23 14:35:26 -0200864 mutex_lock(&kvm->slots_lock);
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400865
866 list_for_each_entry_safe(p, tmp, &kvm->ioeventfds, list) {
867 bool wildcard = !(args->flags & KVM_IOEVENTFD_FLAG_DATAMATCH);
868
Michael S. Tsirkin05e07f92013-04-04 13:27:21 +0300869 if (p->bus_idx != bus_idx ||
870 p->eventfd != eventfd ||
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400871 p->addr != args->addr ||
872 p->length != args->len ||
873 p->wildcard != wildcard)
874 continue;
875
876 if (!p->wildcard && p->datamatch != args->datamatch)
877 continue;
878
Marcelo Tosattie93f8a02009-12-23 14:35:24 -0200879 kvm_io_bus_unregister_dev(kvm, bus_idx, &p->dev);
Christian Borntraeger4a12f952017-07-07 10:51:38 +0200880 bus = kvm_get_bus(kvm, bus_idx);
881 if (bus)
882 bus->ioeventfd_count--;
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400883 ioeventfd_release(p);
884 ret = 0;
885 break;
886 }
887
Marcelo Tosatti79fac952009-12-23 14:35:26 -0200888 mutex_unlock(&kvm->slots_lock);
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400889
890 eventfd_ctx_put(eventfd);
891
892 return ret;
893}
894
Jason Wang85da11c2015-09-15 14:41:55 +0800895static int kvm_deassign_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args)
896{
897 enum kvm_bus bus_idx = ioeventfd_bus_from_flags(args->flags);
Jason Wangeefd6b02015-09-15 14:41:56 +0800898 int ret = kvm_deassign_ioeventfd_idx(kvm, bus_idx, args);
Jason Wang85da11c2015-09-15 14:41:55 +0800899
Jason Wangeefd6b02015-09-15 14:41:56 +0800900 if (!args->len && bus_idx == KVM_MMIO_BUS)
901 kvm_deassign_ioeventfd_idx(kvm, KVM_FAST_MMIO_BUS, args);
902
903 return ret;
Jason Wang85da11c2015-09-15 14:41:55 +0800904}
905
906static int
907kvm_assign_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args)
908{
909 enum kvm_bus bus_idx;
Jason Wangeefd6b02015-09-15 14:41:56 +0800910 int ret;
Jason Wang85da11c2015-09-15 14:41:55 +0800911
912 bus_idx = ioeventfd_bus_from_flags(args->flags);
913 /* must be natural-word sized, or 0 to ignore length */
914 switch (args->len) {
915 case 0:
916 case 1:
917 case 2:
918 case 4:
919 case 8:
920 break;
921 default:
922 return -EINVAL;
923 }
924
925 /* check for range overflow */
926 if (args->addr + args->len < args->addr)
927 return -EINVAL;
928
929 /* check for extra flags that we don't understand */
930 if (args->flags & ~KVM_IOEVENTFD_VALID_FLAG_MASK)
931 return -EINVAL;
932
933 /* ioeventfd with no length can't be combined with DATAMATCH */
Jason Wange9ea5062015-09-15 14:41:59 +0800934 if (!args->len && (args->flags & KVM_IOEVENTFD_FLAG_DATAMATCH))
Jason Wang85da11c2015-09-15 14:41:55 +0800935 return -EINVAL;
936
Jason Wangeefd6b02015-09-15 14:41:56 +0800937 ret = kvm_assign_ioeventfd_idx(kvm, bus_idx, args);
938 if (ret)
939 goto fail;
940
941 /* When length is ignored, MMIO is also put on a separate bus, for
942 * faster lookups.
943 */
944 if (!args->len && bus_idx == KVM_MMIO_BUS) {
945 ret = kvm_assign_ioeventfd_idx(kvm, KVM_FAST_MMIO_BUS, args);
946 if (ret < 0)
947 goto fast_fail;
948 }
949
950 return 0;
951
952fast_fail:
953 kvm_deassign_ioeventfd_idx(kvm, bus_idx, args);
954fail:
955 return ret;
Jason Wang85da11c2015-09-15 14:41:55 +0800956}
957
Gregory Haskinsd34e6b12009-07-07 17:08:49 -0400958int
959kvm_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args)
960{
961 if (args->flags & KVM_IOEVENTFD_FLAG_DEASSIGN)
962 return kvm_deassign_ioeventfd(kvm, args);
963
964 return kvm_assign_ioeventfd(kvm, args);
965}