1 /******************************************************************************
2 * xen_intr.c
3 *
4 * Xen event and interrupt services for x86 HVM guests.
5 *
6 * Copyright (c) 2002-2005, K A Fraser
7 * Copyright (c) 2005, Intel Corporation <[email protected]>
8 * Copyright (c) 2012, Spectra Logic Corporation
9 *
10 * This file may be distributed separately from the Linux kernel, or
11 * incorporated into other software packages, subject to the following license:
12 *
13 * Permission is hereby granted, free of charge, to any person obtaining a copy
14 * of this source file (the "Software"), to deal in the Software without
15 * restriction, including without limitation the rights to use, copy, modify,
16 * merge, publish, distribute, sublicense, and/or sell copies of the Software,
17 * and to permit persons to whom the Software is furnished to do so, subject to
18 * the following conditions:
19 *
20 * The above copyright notice and this permission notice shall be included in
21 * all copies or substantial portions of the Software.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
24 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
25 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
26 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
27 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
28 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
29 * IN THE SOFTWARE.
30 */
31
32 #include <sys/cdefs.h>
33 __FBSDID("$FreeBSD$");
34
35 #include "opt_ddb.h"
36
37 #include <sys/param.h>
38 #include <sys/systm.h>
39 #include <sys/bus.h>
40 #include <sys/malloc.h>
41 #include <sys/kernel.h>
42 #include <sys/limits.h>
43 #include <sys/lock.h>
44 #include <sys/mutex.h>
45 #include <sys/interrupt.h>
46 #include <sys/pcpu.h>
47 #include <sys/smp.h>
48 #include <sys/refcount.h>
49
50 #include <vm/vm.h>
51 #include <vm/pmap.h>
52
53 #include <machine/intr_machdep.h>
54 #include <x86/apicvar.h>
55 #include <x86/apicreg.h>
56 #include <machine/smp.h>
57 #include <machine/stdarg.h>
58
59 #include <machine/xen/synch_bitops.h>
60 #include <machine/xen/xen-os.h>
61
62 #include <xen/xen-os.h>
63 #include <xen/hypervisor.h>
64 #include <xen/xen_intr.h>
65 #include <xen/evtchn/evtchnvar.h>
66
67 #include <dev/xen/xenpci/xenpcivar.h>
68 #include <dev/pci/pcivar.h>
69
70 #ifdef DDB
71 #include <ddb/ddb.h>
72 #endif
73
74 static MALLOC_DEFINE(M_XENINTR, "xen_intr", "Xen Interrupt Services");
75
76 static u_int first_evtchn_irq;
77
78 /**
79 * Per-cpu event channel processing state.
80 */
81 struct xen_intr_pcpu_data {
82 /**
83 * The last event channel bitmap section (level one bit) processed.
84 * This is used to ensure we scan all ports before
85 * servicing an already servied port again.
86 */
87 u_int last_processed_l1i;
88
89 /**
90 * The last event channel processed within the event channel
91 * bitmap being scanned.
92 */
93 u_int last_processed_l2i;
94
95 /** Pointer to this CPU's interrupt statistic counter. */
96 u_long *evtchn_intrcnt;
97
98 /**
99 * A bitmap of ports that can be serviced from this CPU.
100 * A set bit means interrupt handling is enabled.
101 */
102 u_long evtchn_enabled[sizeof(u_long) * 8];
103 };
104
105 /*
106 * Start the scan at port 0 by initializing the last scanned
107 * location as the highest numbered event channel port.
108 */
109 DPCPU_DEFINE_STATIC(struct xen_intr_pcpu_data, xen_intr_pcpu) = {
110 .last_processed_l1i = LONG_BIT - 1,
111 .last_processed_l2i = LONG_BIT - 1
112 };
113
114 DPCPU_DECLARE(struct vcpu_info *, vcpu_info);
115
116 #define XEN_EEXIST 17 /* Xen "already exists" error */
117 #define XEN_ALLOCATE_VECTOR 0 /* Allocate a vector for this event channel */
118 #define XEN_INVALID_EVTCHN 0 /* Invalid event channel */
119
120 #define is_valid_evtchn(x) ((x) != XEN_INVALID_EVTCHN)
121
122 struct xenisrc {
123 struct intsrc xi_intsrc;
124 enum evtchn_type xi_type;
125 int xi_cpu; /* VCPU for delivery. */
126 int xi_vector; /* Global isrc vector number. */
127 evtchn_port_t xi_port;
128 int xi_pirq;
129 int xi_virq;
130 void *xi_cookie;
131 u_int xi_close:1; /* close on unbind? */
132 u_int xi_activehi:1;
133 u_int xi_edgetrigger:1;
134 u_int xi_masked:1;
135 volatile u_int xi_refcount;
136 };
137
138 static void xen_intr_suspend(struct pic *);
139 static void xen_intr_resume(struct pic *, bool suspend_cancelled);
140 static void xen_intr_enable_source(struct intsrc *isrc);
141 static void xen_intr_disable_source(struct intsrc *isrc, int eoi);
142 static void xen_intr_eoi_source(struct intsrc *isrc);
143 static void xen_intr_enable_intr(struct intsrc *isrc);
144 static void xen_intr_disable_intr(struct intsrc *isrc);
145 static int xen_intr_vector(struct intsrc *isrc);
146 static int xen_intr_source_pending(struct intsrc *isrc);
147 static int xen_intr_config_intr(struct intsrc *isrc,
148 enum intr_trigger trig, enum intr_polarity pol);
149 static int xen_intr_assign_cpu(struct intsrc *isrc, u_int apic_id);
150
151 static void xen_intr_pirq_enable_source(struct intsrc *isrc);
152 static void xen_intr_pirq_disable_source(struct intsrc *isrc, int eoi);
153 static void xen_intr_pirq_eoi_source(struct intsrc *isrc);
154 static void xen_intr_pirq_enable_intr(struct intsrc *isrc);
155 static void xen_intr_pirq_disable_intr(struct intsrc *isrc);
156 static int xen_intr_pirq_config_intr(struct intsrc *isrc,
157 enum intr_trigger trig, enum intr_polarity pol);
158
159 /**
160 * PIC interface for all event channel port types except physical IRQs.
161 */
162 struct pic xen_intr_pic = {
163 .pic_enable_source = xen_intr_enable_source,
164 .pic_disable_source = xen_intr_disable_source,
165 .pic_eoi_source = xen_intr_eoi_source,
166 .pic_enable_intr = xen_intr_enable_intr,
167 .pic_disable_intr = xen_intr_disable_intr,
168 .pic_vector = xen_intr_vector,
169 .pic_source_pending = xen_intr_source_pending,
170 .pic_suspend = xen_intr_suspend,
171 .pic_resume = xen_intr_resume,
172 .pic_config_intr = xen_intr_config_intr,
173 .pic_assign_cpu = xen_intr_assign_cpu
174 };
175
176 /**
177 * PIC interface for all event channel representing
178 * physical interrupt sources.
179 */
180 struct pic xen_intr_pirq_pic = {
181 #ifdef __amd64__
182 .pic_register_sources = xenpv_register_pirqs,
183 #endif
184 .pic_enable_source = xen_intr_pirq_enable_source,
185 .pic_disable_source = xen_intr_pirq_disable_source,
186 .pic_eoi_source = xen_intr_pirq_eoi_source,
187 .pic_enable_intr = xen_intr_pirq_enable_intr,
188 .pic_disable_intr = xen_intr_pirq_disable_intr,
189 .pic_vector = xen_intr_vector,
190 .pic_source_pending = xen_intr_source_pending,
191 .pic_config_intr = xen_intr_pirq_config_intr,
192 .pic_assign_cpu = xen_intr_assign_cpu
193 };
194
195 static struct mtx xen_intr_isrc_lock;
196 static u_int xen_intr_auto_vector_count;
197 static struct xenisrc *xen_intr_port_to_isrc[NR_EVENT_CHANNELS];
198 static u_long *xen_intr_pirq_eoi_map;
199 static boolean_t xen_intr_pirq_eoi_map_enabled;
200
201 /*------------------------- Private Functions --------------------------------*/
202 /**
203 * Disable signal delivery for an event channel port on the
204 * specified CPU.
205 *
206 * \param port The event channel port to mask.
207 *
208 * This API is used to manage the port<=>CPU binding of event
209 * channel handlers.
210 *
211 * \note This operation does not preclude reception of an event
212 * for this event channel on another CPU. To mask the
213 * event channel globally, use evtchn_mask().
214 */
215 static inline void
evtchn_cpu_mask_port(u_int cpu,evtchn_port_t port)216 evtchn_cpu_mask_port(u_int cpu, evtchn_port_t port)
217 {
218 struct xen_intr_pcpu_data *pcpu;
219
220 pcpu = DPCPU_ID_PTR(cpu, xen_intr_pcpu);
221 xen_clear_bit(port, pcpu->evtchn_enabled);
222 }
223
224 /**
225 * Enable signal delivery for an event channel port on the
226 * specified CPU.
227 *
228 * \param port The event channel port to unmask.
229 *
230 * This API is used to manage the port<=>CPU binding of event
231 * channel handlers.
232 *
233 * \note This operation does not guarantee that event delivery
234 * is enabled for this event channel port. The port must
235 * also be globally enabled. See evtchn_unmask().
236 */
237 static inline void
evtchn_cpu_unmask_port(u_int cpu,evtchn_port_t port)238 evtchn_cpu_unmask_port(u_int cpu, evtchn_port_t port)
239 {
240 struct xen_intr_pcpu_data *pcpu;
241
242 pcpu = DPCPU_ID_PTR(cpu, xen_intr_pcpu);
243 xen_set_bit(port, pcpu->evtchn_enabled);
244 }
245
246 /**
247 * Allocate and register a per-cpu Xen upcall interrupt counter.
248 *
249 * \param cpu The cpu for which to register this interrupt count.
250 */
251 static void
xen_intr_intrcnt_add(u_int cpu)252 xen_intr_intrcnt_add(u_int cpu)
253 {
254 char buf[MAXCOMLEN + 1];
255 struct xen_intr_pcpu_data *pcpu;
256
257 pcpu = DPCPU_ID_PTR(cpu, xen_intr_pcpu);
258 if (pcpu->evtchn_intrcnt != NULL)
259 return;
260
261 snprintf(buf, sizeof(buf), "cpu%d:xen", cpu);
262 intrcnt_add(buf, &pcpu->evtchn_intrcnt);
263 }
264
265 /**
266 * Search for an already allocated but currently unused Xen interrupt
267 * source object.
268 *
269 * \param type Restrict the search to interrupt sources of the given
270 * type.
271 *
272 * \return A pointer to a free Xen interrupt source object or NULL.
273 */
274 static struct xenisrc *
xen_intr_find_unused_isrc(enum evtchn_type type)275 xen_intr_find_unused_isrc(enum evtchn_type type)
276 {
277 int isrc_idx;
278
279 KASSERT(mtx_owned(&xen_intr_isrc_lock), ("Evtchn isrc lock not held"));
280
281 for (isrc_idx = 0; isrc_idx < xen_intr_auto_vector_count; isrc_idx ++) {
282 struct xenisrc *isrc;
283 u_int vector;
284
285 vector = first_evtchn_irq + isrc_idx;
286 isrc = (struct xenisrc *)intr_lookup_source(vector);
287 if (isrc != NULL
288 && isrc->xi_type == EVTCHN_TYPE_UNBOUND) {
289 KASSERT(isrc->xi_intsrc.is_handlers == 0,
290 ("Free evtchn still has handlers"));
291 isrc->xi_type = type;
292 return (isrc);
293 }
294 }
295 return (NULL);
296 }
297
298 /**
299 * Allocate a Xen interrupt source object.
300 *
301 * \param type The type of interrupt source to create.
302 *
303 * \return A pointer to a newly allocated Xen interrupt source
304 * object or NULL.
305 */
306 static struct xenisrc *
xen_intr_alloc_isrc(enum evtchn_type type,int vector)307 xen_intr_alloc_isrc(enum evtchn_type type, int vector)
308 {
309 static int warned;
310 struct xenisrc *isrc;
311
312 KASSERT(mtx_owned(&xen_intr_isrc_lock), ("Evtchn alloc lock not held"));
313
314 if (xen_intr_auto_vector_count > NR_EVENT_CHANNELS) {
315 if (!warned) {
316 warned = 1;
317 printf("xen_intr_alloc: Event channels exhausted.\n");
318 }
319 return (NULL);
320 }
321
322 if (type != EVTCHN_TYPE_PIRQ) {
323 vector = first_evtchn_irq + xen_intr_auto_vector_count;
324 xen_intr_auto_vector_count++;
325 }
326
327 KASSERT((intr_lookup_source(vector) == NULL),
328 ("Trying to use an already allocated vector"));
329
330 mtx_unlock(&xen_intr_isrc_lock);
331 isrc = malloc(sizeof(*isrc), M_XENINTR, M_WAITOK | M_ZERO);
332 isrc->xi_intsrc.is_pic =
333 (type == EVTCHN_TYPE_PIRQ) ? &xen_intr_pirq_pic : &xen_intr_pic;
334 isrc->xi_vector = vector;
335 isrc->xi_type = type;
336 intr_register_source(&isrc->xi_intsrc);
337 mtx_lock(&xen_intr_isrc_lock);
338
339 return (isrc);
340 }
341
342 /**
343 * Attempt to free an active Xen interrupt source object.
344 *
345 * \param isrc The interrupt source object to release.
346 *
347 * \returns EBUSY if the source is still in use, otherwise 0.
348 */
349 static int
xen_intr_release_isrc(struct xenisrc * isrc)350 xen_intr_release_isrc(struct xenisrc *isrc)
351 {
352
353 mtx_lock(&xen_intr_isrc_lock);
354 KASSERT(isrc->xi_intsrc.is_handlers == 0,
355 ("Release called, but xenisrc still in use"));
356 evtchn_mask_port(isrc->xi_port);
357 evtchn_clear_port(isrc->xi_port);
358
359 /* Rebind port to CPU 0. */
360 evtchn_cpu_mask_port(isrc->xi_cpu, isrc->xi_port);
361 evtchn_cpu_unmask_port(0, isrc->xi_port);
362
363 if (isrc->xi_close != 0 && is_valid_evtchn(isrc->xi_port)) {
364 struct evtchn_close close = { .port = isrc->xi_port };
365 if (HYPERVISOR_event_channel_op(EVTCHNOP_close, &close))
366 panic("EVTCHNOP_close failed");
367 }
368
369 xen_intr_port_to_isrc[isrc->xi_port] = NULL;
370 isrc->xi_cpu = 0;
371 isrc->xi_type = EVTCHN_TYPE_UNBOUND;
372 isrc->xi_port = 0;
373 isrc->xi_cookie = NULL;
374 mtx_unlock(&xen_intr_isrc_lock);
375 return (0);
376 }
377
378 /**
379 * Associate an interrupt handler with an already allocated local Xen
380 * event channel port.
381 *
382 * \param isrcp The returned Xen interrupt object associated with
383 * the specified local port.
384 * \param local_port The event channel to bind.
385 * \param type The event channel type of local_port.
386 * \param intr_owner The device making this bind request.
387 * \param filter An interrupt filter handler. Specify NULL
388 * to always dispatch to the ithread handler.
389 * \param handler An interrupt ithread handler. Optional (can
390 * specify NULL) if all necessary event actions
391 * are performed by filter.
392 * \param arg Argument to present to both filter and handler.
393 * \param irqflags Interrupt handler flags. See sys/bus.h.
394 * \param handlep Pointer to an opaque handle used to manage this
395 * registration.
396 *
397 * \returns 0 on success, otherwise an errno.
398 */
399 static int
xen_intr_bind_isrc(struct xenisrc ** isrcp,evtchn_port_t local_port,enum evtchn_type type,const char * intr_owner,driver_filter_t filter,driver_intr_t handler,void * arg,enum intr_type flags,xen_intr_handle_t * port_handlep)400 xen_intr_bind_isrc(struct xenisrc **isrcp, evtchn_port_t local_port,
401 enum evtchn_type type, const char *intr_owner, driver_filter_t filter,
402 driver_intr_t handler, void *arg, enum intr_type flags,
403 xen_intr_handle_t *port_handlep)
404 {
405 struct xenisrc *isrc;
406 int error;
407
408 *isrcp = NULL;
409 if (port_handlep == NULL) {
410 printf("%s: xen_intr_bind_isrc: Bad event handle\n",
411 intr_owner);
412 return (EINVAL);
413 }
414
415 mtx_lock(&xen_intr_isrc_lock);
416 isrc = xen_intr_find_unused_isrc(type);
417 if (isrc == NULL) {
418 isrc = xen_intr_alloc_isrc(type, XEN_ALLOCATE_VECTOR);
419 if (isrc == NULL) {
420 mtx_unlock(&xen_intr_isrc_lock);
421 return (ENOSPC);
422 }
423 }
424 isrc->xi_port = local_port;
425 xen_intr_port_to_isrc[local_port] = isrc;
426 refcount_init(&isrc->xi_refcount, 1);
427 mtx_unlock(&xen_intr_isrc_lock);
428
429 /* Assign the opaque handler (the event channel port) */
430 *port_handlep = &isrc->xi_vector;
431
432 #ifdef SMP
433 if (type == EVTCHN_TYPE_PORT) {
434 /*
435 * By default all interrupts are assigned to vCPU#0
436 * unless specified otherwise, so shuffle them to balance
437 * the interrupt load.
438 */
439 xen_intr_assign_cpu(&isrc->xi_intsrc, intr_next_cpu(0));
440 }
441 #endif
442
443 if (filter == NULL && handler == NULL) {
444 /*
445 * No filter/handler provided, leave the event channel
446 * masked and without a valid handler, the caller is
447 * in charge of setting that up.
448 */
449 *isrcp = isrc;
450 return (0);
451 }
452
453 error = xen_intr_add_handler(intr_owner, filter, handler, arg, flags,
454 *port_handlep);
455 if (error != 0) {
456 xen_intr_release_isrc(isrc);
457 return (error);
458 }
459 *isrcp = isrc;
460 return (0);
461 }
462
463 /**
464 * Lookup a Xen interrupt source object given an interrupt binding handle.
465 *
466 * \param handle A handle initialized by a previous call to
467 * xen_intr_bind_isrc().
468 *
469 * \returns A pointer to the Xen interrupt source object associated
470 * with the given interrupt handle. NULL if no association
471 * currently exists.
472 */
473 static struct xenisrc *
xen_intr_isrc(xen_intr_handle_t handle)474 xen_intr_isrc(xen_intr_handle_t handle)
475 {
476 int vector;
477
478 if (handle == NULL)
479 return (NULL);
480
481 vector = *(int *)handle;
482 KASSERT(vector >= first_evtchn_irq &&
483 vector < (first_evtchn_irq + xen_intr_auto_vector_count),
484 ("Xen interrupt vector is out of range"));
485
486 return ((struct xenisrc *)intr_lookup_source(vector));
487 }
488
489 /**
490 * Determine the event channel ports at the given section of the
491 * event port bitmap which have pending events for the given cpu.
492 *
493 * \param pcpu The Xen interrupt pcpu data for the cpu being querried.
494 * \param sh The Xen shared info area.
495 * \param idx The index of the section of the event channel bitmap to
496 * inspect.
497 *
498 * \returns A u_long with bits set for every event channel with pending
499 * events.
500 */
501 static inline u_long
xen_intr_active_ports(struct xen_intr_pcpu_data * pcpu,shared_info_t * sh,u_int idx)502 xen_intr_active_ports(struct xen_intr_pcpu_data *pcpu, shared_info_t *sh,
503 u_int idx)
504 {
505
506 CTASSERT(sizeof(sh->evtchn_mask[0]) == sizeof(sh->evtchn_pending[0]));
507 CTASSERT(sizeof(sh->evtchn_mask[0]) == sizeof(pcpu->evtchn_enabled[0]));
508 CTASSERT(sizeof(sh->evtchn_mask) == sizeof(sh->evtchn_pending));
509 CTASSERT(sizeof(sh->evtchn_mask) == sizeof(pcpu->evtchn_enabled));
510 return (sh->evtchn_pending[idx]
511 & ~sh->evtchn_mask[idx]
512 & pcpu->evtchn_enabled[idx]);
513 }
514
515 /**
516 * Interrupt handler for processing all Xen event channel events.
517 *
518 * \param trap_frame The trap frame context for the current interrupt.
519 */
520 void
xen_intr_handle_upcall(struct trapframe * trap_frame)521 xen_intr_handle_upcall(struct trapframe *trap_frame)
522 {
523 u_int l1i, l2i, port, cpu;
524 u_long masked_l1, masked_l2;
525 struct xenisrc *isrc;
526 shared_info_t *s;
527 vcpu_info_t *v;
528 struct xen_intr_pcpu_data *pc;
529 u_long l1, l2;
530
531 /*
532 * Disable preemption in order to always check and fire events
533 * on the right vCPU
534 */
535 critical_enter();
536
537 cpu = PCPU_GET(cpuid);
538 pc = DPCPU_PTR(xen_intr_pcpu);
539 s = HYPERVISOR_shared_info;
540 v = DPCPU_GET(vcpu_info);
541
542 if (xen_hvm_domain() && !xen_vector_callback_enabled) {
543 KASSERT((cpu == 0), ("Fired PCI event callback on wrong CPU"));
544 }
545
546 v->evtchn_upcall_pending = 0;
547
548 #if 0
549 #ifndef CONFIG_X86 /* No need for a barrier -- XCHG is a barrier on x86. */
550 /* Clear master flag /before/ clearing selector flag. */
551 wmb();
552 #endif
553 #endif
554
555 l1 = atomic_readandclear_long(&v->evtchn_pending_sel);
556
557 l1i = pc->last_processed_l1i;
558 l2i = pc->last_processed_l2i;
559 (*pc->evtchn_intrcnt)++;
560
561 while (l1 != 0) {
562
563 l1i = (l1i + 1) % LONG_BIT;
564 masked_l1 = l1 & ((~0UL) << l1i);
565
566 if (masked_l1 == 0) {
567 /*
568 * if we masked out all events, wrap around
569 * to the beginning.
570 */
571 l1i = LONG_BIT - 1;
572 l2i = LONG_BIT - 1;
573 continue;
574 }
575 l1i = ffsl(masked_l1) - 1;
576
577 do {
578 l2 = xen_intr_active_ports(pc, s, l1i);
579
580 l2i = (l2i + 1) % LONG_BIT;
581 masked_l2 = l2 & ((~0UL) << l2i);
582
583 if (masked_l2 == 0) {
584 /* if we masked out all events, move on */
585 l2i = LONG_BIT - 1;
586 break;
587 }
588 l2i = ffsl(masked_l2) - 1;
589
590 /* process port */
591 port = (l1i * LONG_BIT) + l2i;
592 synch_clear_bit(port, &s->evtchn_pending[0]);
593
594 isrc = xen_intr_port_to_isrc[port];
595 if (__predict_false(isrc == NULL))
596 continue;
597
598 /* Make sure we are firing on the right vCPU */
599 KASSERT((isrc->xi_cpu == PCPU_GET(cpuid)),
600 ("Received unexpected event on vCPU#%d, event bound to vCPU#%d",
601 PCPU_GET(cpuid), isrc->xi_cpu));
602
603 intr_execute_handlers(&isrc->xi_intsrc, trap_frame);
604
605 /*
606 * If this is the final port processed,
607 * we'll pick up here+1 next time.
608 */
609 pc->last_processed_l1i = l1i;
610 pc->last_processed_l2i = l2i;
611
612 } while (l2i != LONG_BIT - 1);
613
614 l2 = xen_intr_active_ports(pc, s, l1i);
615 if (l2 == 0) {
616 /*
617 * We handled all ports, so we can clear the
618 * selector bit.
619 */
620 l1 &= ~(1UL << l1i);
621 }
622 }
623 critical_exit();
624 }
625
626 static int
xen_intr_init(void * dummy __unused)627 xen_intr_init(void *dummy __unused)
628 {
629 shared_info_t *s = HYPERVISOR_shared_info;
630 struct xen_intr_pcpu_data *pcpu;
631 struct physdev_pirq_eoi_gmfn eoi_gmfn;
632 int i, rc;
633
634 if (!xen_domain())
635 return (0);
636
637 mtx_init(&xen_intr_isrc_lock, "xen-irq-lock", NULL, MTX_DEF);
638
639 /*
640 * Set the per-cpu mask of CPU#0 to enable all, since by default all
641 * event channels are bound to CPU#0.
642 */
643 CPU_FOREACH(i) {
644 pcpu = DPCPU_ID_PTR(i, xen_intr_pcpu);
645 memset(pcpu->evtchn_enabled, i == 0 ? ~0 : 0,
646 sizeof(pcpu->evtchn_enabled));
647 }
648
649 for (i = 0; i < nitems(s->evtchn_mask); i++)
650 atomic_store_rel_long(&s->evtchn_mask[i], ~0);
651
652 /* Try to register PIRQ EOI map */
653 xen_intr_pirq_eoi_map = malloc(PAGE_SIZE, M_XENINTR, M_WAITOK | M_ZERO);
654 eoi_gmfn.gmfn = atop(vtophys(xen_intr_pirq_eoi_map));
655 rc = HYPERVISOR_physdev_op(PHYSDEVOP_pirq_eoi_gmfn_v2, &eoi_gmfn);
656 if (rc != 0 && bootverbose)
657 printf("Xen interrupts: unable to register PIRQ EOI map\n");
658 else
659 xen_intr_pirq_eoi_map_enabled = true;
660
661 intr_register_pic(&xen_intr_pic);
662 if (xen_pv_domain() && xen_initial_domain())
663 intr_register_pic(&xen_intr_pirq_pic);
664
665 if (bootverbose)
666 printf("Xen interrupt system initialized\n");
667
668 return (0);
669 }
670 SYSINIT(xen_intr_init, SI_SUB_INTR, SI_ORDER_SECOND, xen_intr_init, NULL);
671
672 static void
xen_intrcnt_init(void * dummy __unused)673 xen_intrcnt_init(void *dummy __unused)
674 {
675 unsigned int i;
676
677 if (!xen_domain())
678 return;
679
680 /*
681 * Register interrupt count manually as we aren't guaranteed to see a
682 * call to xen_intr_assign_cpu() before our first interrupt.
683 */
684 CPU_FOREACH(i)
685 xen_intr_intrcnt_add(i);
686 }
687 SYSINIT(xen_intrcnt_init, SI_SUB_INTR, SI_ORDER_MIDDLE, xen_intrcnt_init, NULL);
688
689 void
xen_intr_alloc_irqs(void)690 xen_intr_alloc_irqs(void)
691 {
692
693 if (num_io_irqs > UINT_MAX - NR_EVENT_CHANNELS)
694 panic("IRQ allocation overflow (num_msi_irqs too high?)");
695 first_evtchn_irq = num_io_irqs;
696 num_io_irqs += NR_EVENT_CHANNELS;
697 }
698
699 /*--------------------------- Common PIC Functions ---------------------------*/
700 /**
701 * Prepare this PIC for system suspension.
702 */
703 static void
xen_intr_suspend(struct pic * unused)704 xen_intr_suspend(struct pic *unused)
705 {
706 }
707
708 static void
xen_rebind_ipi(struct xenisrc * isrc)709 xen_rebind_ipi(struct xenisrc *isrc)
710 {
711 #ifdef SMP
712 int cpu = isrc->xi_cpu;
713 int vcpu_id = pcpu_find(cpu)->pc_vcpu_id;
714 int error;
715 struct evtchn_bind_ipi bind_ipi = { .vcpu = vcpu_id };
716
717 error = HYPERVISOR_event_channel_op(EVTCHNOP_bind_ipi,
718 &bind_ipi);
719 if (error != 0)
720 panic("unable to rebind xen IPI: %d", error);
721
722 isrc->xi_port = bind_ipi.port;
723 isrc->xi_cpu = 0;
724 xen_intr_port_to_isrc[bind_ipi.port] = isrc;
725
726 error = xen_intr_assign_cpu(&isrc->xi_intsrc,
727 cpu_apic_ids[cpu]);
728 if (error)
729 panic("unable to bind xen IPI to CPU#%d: %d",
730 cpu, error);
731
732 evtchn_unmask_port(bind_ipi.port);
733 #else
734 panic("Resume IPI event channel on UP");
735 #endif
736 }
737
738 static void
xen_rebind_virq(struct xenisrc * isrc)739 xen_rebind_virq(struct xenisrc *isrc)
740 {
741 int cpu = isrc->xi_cpu;
742 int vcpu_id = pcpu_find(cpu)->pc_vcpu_id;
743 int error;
744 struct evtchn_bind_virq bind_virq = { .virq = isrc->xi_virq,
745 .vcpu = vcpu_id };
746
747 error = HYPERVISOR_event_channel_op(EVTCHNOP_bind_virq,
748 &bind_virq);
749 if (error != 0)
750 panic("unable to rebind xen VIRQ#%d: %d", isrc->xi_virq, error);
751
752 isrc->xi_port = bind_virq.port;
753 isrc->xi_cpu = 0;
754 xen_intr_port_to_isrc[bind_virq.port] = isrc;
755
756 #ifdef SMP
757 error = xen_intr_assign_cpu(&isrc->xi_intsrc,
758 cpu_apic_ids[cpu]);
759 if (error)
760 panic("unable to bind xen VIRQ#%d to CPU#%d: %d",
761 isrc->xi_virq, cpu, error);
762 #endif
763
764 evtchn_unmask_port(bind_virq.port);
765 }
766
767 /**
768 * Return this PIC to service after being suspended.
769 */
770 static void
xen_intr_resume(struct pic * unused,bool suspend_cancelled)771 xen_intr_resume(struct pic *unused, bool suspend_cancelled)
772 {
773 shared_info_t *s = HYPERVISOR_shared_info;
774 struct xenisrc *isrc;
775 u_int isrc_idx;
776 int i;
777
778 if (suspend_cancelled)
779 return;
780
781 /* Reset the per-CPU masks */
782 CPU_FOREACH(i) {
783 struct xen_intr_pcpu_data *pcpu;
784
785 pcpu = DPCPU_ID_PTR(i, xen_intr_pcpu);
786 memset(pcpu->evtchn_enabled, i == 0 ? ~0 : 0,
787 sizeof(pcpu->evtchn_enabled));
788 }
789
790 /* Mask all event channels. */
791 for (i = 0; i < nitems(s->evtchn_mask); i++)
792 atomic_store_rel_long(&s->evtchn_mask[i], ~0);
793
794 /* Remove port -> isrc mappings */
795 memset(xen_intr_port_to_isrc, 0, sizeof(xen_intr_port_to_isrc));
796
797 /* Free unused isrcs and rebind VIRQs and IPIs */
798 for (isrc_idx = 0; isrc_idx < xen_intr_auto_vector_count; isrc_idx++) {
799 u_int vector;
800
801 vector = first_evtchn_irq + isrc_idx;
802 isrc = (struct xenisrc *)intr_lookup_source(vector);
803 if (isrc != NULL) {
804 isrc->xi_port = 0;
805 switch (isrc->xi_type) {
806 case EVTCHN_TYPE_IPI:
807 xen_rebind_ipi(isrc);
808 break;
809 case EVTCHN_TYPE_VIRQ:
810 xen_rebind_virq(isrc);
811 break;
812 default:
813 break;
814 }
815 }
816 }
817 }
818
819 /**
820 * Disable a Xen interrupt source.
821 *
822 * \param isrc The interrupt source to disable.
823 */
824 static void
xen_intr_disable_intr(struct intsrc * base_isrc)825 xen_intr_disable_intr(struct intsrc *base_isrc)
826 {
827 struct xenisrc *isrc = (struct xenisrc *)base_isrc;
828
829 evtchn_mask_port(isrc->xi_port);
830 }
831
832 /**
833 * Determine the global interrupt vector number for
834 * a Xen interrupt source.
835 *
836 * \param isrc The interrupt source to query.
837 *
838 * \return The vector number corresponding to the given interrupt source.
839 */
840 static int
xen_intr_vector(struct intsrc * base_isrc)841 xen_intr_vector(struct intsrc *base_isrc)
842 {
843 struct xenisrc *isrc = (struct xenisrc *)base_isrc;
844
845 return (isrc->xi_vector);
846 }
847
848 /**
849 * Determine whether or not interrupt events are pending on the
850 * the given interrupt source.
851 *
852 * \param isrc The interrupt source to query.
853 *
854 * \returns 0 if no events are pending, otherwise non-zero.
855 */
856 static int
xen_intr_source_pending(struct intsrc * isrc)857 xen_intr_source_pending(struct intsrc *isrc)
858 {
859 /*
860 * EventChannels are edge triggered and never masked.
861 * There can be no pending events.
862 */
863 return (0);
864 }
865
866 /**
867 * Perform configuration of an interrupt source.
868 *
869 * \param isrc The interrupt source to configure.
870 * \param trig Edge or level.
871 * \param pol Active high or low.
872 *
873 * \returns 0 if no events are pending, otherwise non-zero.
874 */
875 static int
xen_intr_config_intr(struct intsrc * isrc,enum intr_trigger trig,enum intr_polarity pol)876 xen_intr_config_intr(struct intsrc *isrc, enum intr_trigger trig,
877 enum intr_polarity pol)
878 {
879 /* Configuration is only possible via the evtchn apis. */
880 return (ENODEV);
881 }
882
883 /**
884 * Configure CPU affinity for interrupt source event delivery.
885 *
886 * \param isrc The interrupt source to configure.
887 * \param apic_id The apic id of the CPU for handling future events.
888 *
889 * \returns 0 if successful, otherwise an errno.
890 */
891 static int
xen_intr_assign_cpu(struct intsrc * base_isrc,u_int apic_id)892 xen_intr_assign_cpu(struct intsrc *base_isrc, u_int apic_id)
893 {
894 #ifdef SMP
895 struct evtchn_bind_vcpu bind_vcpu;
896 struct xenisrc *isrc;
897 u_int to_cpu, vcpu_id;
898 int error, masked;
899
900 if (xen_vector_callback_enabled == 0)
901 return (EOPNOTSUPP);
902
903 to_cpu = apic_cpuid(apic_id);
904 vcpu_id = pcpu_find(to_cpu)->pc_vcpu_id;
905
906 mtx_lock(&xen_intr_isrc_lock);
907 isrc = (struct xenisrc *)base_isrc;
908 if (!is_valid_evtchn(isrc->xi_port)) {
909 mtx_unlock(&xen_intr_isrc_lock);
910 return (EINVAL);
911 }
912
913 /*
914 * Mask the event channel while binding it to prevent interrupt
915 * delivery with an inconsistent state in isrc->xi_cpu.
916 */
917 masked = evtchn_test_and_set_mask(isrc->xi_port);
918 if ((isrc->xi_type == EVTCHN_TYPE_VIRQ) ||
919 (isrc->xi_type == EVTCHN_TYPE_IPI)) {
920 /*
921 * Virtual IRQs are associated with a cpu by
922 * the Hypervisor at evtchn_bind_virq time, so
923 * all we need to do is update the per-CPU masks.
924 */
925 evtchn_cpu_mask_port(isrc->xi_cpu, isrc->xi_port);
926 isrc->xi_cpu = to_cpu;
927 evtchn_cpu_unmask_port(isrc->xi_cpu, isrc->xi_port);
928 goto out;
929 }
930
931 bind_vcpu.port = isrc->xi_port;
932 bind_vcpu.vcpu = vcpu_id;
933
934 error = HYPERVISOR_event_channel_op(EVTCHNOP_bind_vcpu, &bind_vcpu);
935 if (isrc->xi_cpu != to_cpu) {
936 if (error == 0) {
937 /* Commit to new binding by removing the old one. */
938 evtchn_cpu_mask_port(isrc->xi_cpu, isrc->xi_port);
939 isrc->xi_cpu = to_cpu;
940 evtchn_cpu_unmask_port(isrc->xi_cpu, isrc->xi_port);
941 }
942 }
943
944 out:
945 if (masked == 0)
946 evtchn_unmask_port(isrc->xi_port);
947 mtx_unlock(&xen_intr_isrc_lock);
948 return (0);
949 #else
950 return (EOPNOTSUPP);
951 #endif
952 }
953
954 /*------------------- Virtual Interrupt Source PIC Functions -----------------*/
955 /*
956 * Mask a level triggered interrupt source.
957 *
958 * \param isrc The interrupt source to mask (if necessary).
959 * \param eoi If non-zero, perform any necessary end-of-interrupt
960 * acknowledgements.
961 */
962 static void
xen_intr_disable_source(struct intsrc * base_isrc,int eoi)963 xen_intr_disable_source(struct intsrc *base_isrc, int eoi)
964 {
965 struct xenisrc *isrc;
966
967 isrc = (struct xenisrc *)base_isrc;
968
969 /*
970 * NB: checking if the event channel is already masked is
971 * needed because the event channel user-space device
972 * masks event channels on its filter as part of its
973 * normal operation, and those shouldn't be automatically
974 * unmasked by the generic interrupt code. The event channel
975 * device will unmask them when needed.
976 */
977 isrc->xi_masked = !!evtchn_test_and_set_mask(isrc->xi_port);
978 }
979
980 /*
981 * Unmask a level triggered interrupt source.
982 *
983 * \param isrc The interrupt source to unmask (if necessary).
984 */
985 static void
xen_intr_enable_source(struct intsrc * base_isrc)986 xen_intr_enable_source(struct intsrc *base_isrc)
987 {
988 struct xenisrc *isrc;
989
990 isrc = (struct xenisrc *)base_isrc;
991
992 if (isrc->xi_masked == 0)
993 evtchn_unmask_port(isrc->xi_port);
994 }
995
996 /*
997 * Perform any necessary end-of-interrupt acknowledgements.
998 *
999 * \param isrc The interrupt source to EOI.
1000 */
1001 static void
xen_intr_eoi_source(struct intsrc * base_isrc)1002 xen_intr_eoi_source(struct intsrc *base_isrc)
1003 {
1004 }
1005
1006 /*
1007 * Enable and unmask the interrupt source.
1008 *
1009 * \param isrc The interrupt source to enable.
1010 */
1011 static void
xen_intr_enable_intr(struct intsrc * base_isrc)1012 xen_intr_enable_intr(struct intsrc *base_isrc)
1013 {
1014 struct xenisrc *isrc = (struct xenisrc *)base_isrc;
1015
1016 evtchn_unmask_port(isrc->xi_port);
1017 }
1018
1019 /*------------------ Physical Interrupt Source PIC Functions -----------------*/
1020 /*
1021 * Mask a level triggered interrupt source.
1022 *
1023 * \param isrc The interrupt source to mask (if necessary).
1024 * \param eoi If non-zero, perform any necessary end-of-interrupt
1025 * acknowledgements.
1026 */
1027 static void
xen_intr_pirq_disable_source(struct intsrc * base_isrc,int eoi)1028 xen_intr_pirq_disable_source(struct intsrc *base_isrc, int eoi)
1029 {
1030 struct xenisrc *isrc;
1031
1032 isrc = (struct xenisrc *)base_isrc;
1033
1034 if (isrc->xi_edgetrigger == 0)
1035 evtchn_mask_port(isrc->xi_port);
1036 if (eoi == PIC_EOI)
1037 xen_intr_pirq_eoi_source(base_isrc);
1038 }
1039
1040 /*
1041 * Unmask a level triggered interrupt source.
1042 *
1043 * \param isrc The interrupt source to unmask (if necessary).
1044 */
1045 static void
xen_intr_pirq_enable_source(struct intsrc * base_isrc)1046 xen_intr_pirq_enable_source(struct intsrc *base_isrc)
1047 {
1048 struct xenisrc *isrc;
1049
1050 isrc = (struct xenisrc *)base_isrc;
1051
1052 if (isrc->xi_edgetrigger == 0)
1053 evtchn_unmask_port(isrc->xi_port);
1054 }
1055
1056 /*
1057 * Perform any necessary end-of-interrupt acknowledgements.
1058 *
1059 * \param isrc The interrupt source to EOI.
1060 */
1061 static void
xen_intr_pirq_eoi_source(struct intsrc * base_isrc)1062 xen_intr_pirq_eoi_source(struct intsrc *base_isrc)
1063 {
1064 struct xenisrc *isrc;
1065 int error;
1066
1067 isrc = (struct xenisrc *)base_isrc;
1068
1069 if (xen_test_bit(isrc->xi_pirq, xen_intr_pirq_eoi_map)) {
1070 struct physdev_eoi eoi = { .irq = isrc->xi_pirq };
1071
1072 error = HYPERVISOR_physdev_op(PHYSDEVOP_eoi, &eoi);
1073 if (error != 0)
1074 panic("Unable to EOI PIRQ#%d: %d\n",
1075 isrc->xi_pirq, error);
1076 }
1077 }
1078
1079 /*
1080 * Enable and unmask the interrupt source.
1081 *
1082 * \param isrc The interrupt source to enable.
1083 */
1084 static void
xen_intr_pirq_enable_intr(struct intsrc * base_isrc)1085 xen_intr_pirq_enable_intr(struct intsrc *base_isrc)
1086 {
1087 struct xenisrc *isrc;
1088 struct evtchn_bind_pirq bind_pirq;
1089 struct physdev_irq_status_query irq_status;
1090 int error;
1091
1092 isrc = (struct xenisrc *)base_isrc;
1093
1094 if (!xen_intr_pirq_eoi_map_enabled) {
1095 irq_status.irq = isrc->xi_pirq;
1096 error = HYPERVISOR_physdev_op(PHYSDEVOP_irq_status_query,
1097 &irq_status);
1098 if (error)
1099 panic("unable to get status of IRQ#%d", isrc->xi_pirq);
1100
1101 if (irq_status.flags & XENIRQSTAT_needs_eoi) {
1102 /*
1103 * Since the dynamic PIRQ EOI map is not available
1104 * mark the PIRQ as needing EOI unconditionally.
1105 */
1106 xen_set_bit(isrc->xi_pirq, xen_intr_pirq_eoi_map);
1107 }
1108 }
1109
1110 bind_pirq.pirq = isrc->xi_pirq;
1111 bind_pirq.flags = isrc->xi_edgetrigger ? 0 : BIND_PIRQ__WILL_SHARE;
1112 error = HYPERVISOR_event_channel_op(EVTCHNOP_bind_pirq, &bind_pirq);
1113 if (error)
1114 panic("unable to bind IRQ#%d", isrc->xi_pirq);
1115
1116 isrc->xi_port = bind_pirq.port;
1117
1118 mtx_lock(&xen_intr_isrc_lock);
1119 KASSERT((xen_intr_port_to_isrc[bind_pirq.port] == NULL),
1120 ("trying to override an already setup event channel port"));
1121 xen_intr_port_to_isrc[bind_pirq.port] = isrc;
1122 mtx_unlock(&xen_intr_isrc_lock);
1123
1124 evtchn_unmask_port(isrc->xi_port);
1125 }
1126
1127 /*
1128 * Disable an interrupt source.
1129 *
1130 * \param isrc The interrupt source to disable.
1131 */
1132 static void
xen_intr_pirq_disable_intr(struct intsrc * base_isrc)1133 xen_intr_pirq_disable_intr(struct intsrc *base_isrc)
1134 {
1135 struct xenisrc *isrc;
1136 struct evtchn_close close;
1137 int error;
1138
1139 isrc = (struct xenisrc *)base_isrc;
1140
1141 evtchn_mask_port(isrc->xi_port);
1142
1143 close.port = isrc->xi_port;
1144 error = HYPERVISOR_event_channel_op(EVTCHNOP_close, &close);
1145 if (error)
1146 panic("unable to close event channel %d IRQ#%d",
1147 isrc->xi_port, isrc->xi_pirq);
1148
1149 mtx_lock(&xen_intr_isrc_lock);
1150 xen_intr_port_to_isrc[isrc->xi_port] = NULL;
1151 mtx_unlock(&xen_intr_isrc_lock);
1152
1153 isrc->xi_port = 0;
1154 }
1155
1156 /**
1157 * Perform configuration of an interrupt source.
1158 *
1159 * \param isrc The interrupt source to configure.
1160 * \param trig Edge or level.
1161 * \param pol Active high or low.
1162 *
1163 * \returns 0 if no events are pending, otherwise non-zero.
1164 */
1165 static int
xen_intr_pirq_config_intr(struct intsrc * base_isrc,enum intr_trigger trig,enum intr_polarity pol)1166 xen_intr_pirq_config_intr(struct intsrc *base_isrc, enum intr_trigger trig,
1167 enum intr_polarity pol)
1168 {
1169 struct xenisrc *isrc = (struct xenisrc *)base_isrc;
1170 struct physdev_setup_gsi setup_gsi;
1171 int error;
1172
1173 KASSERT(!(trig == INTR_TRIGGER_CONFORM || pol == INTR_POLARITY_CONFORM),
1174 ("%s: Conforming trigger or polarity\n", __func__));
1175
1176 setup_gsi.gsi = isrc->xi_pirq;
1177 setup_gsi.triggering = trig == INTR_TRIGGER_EDGE ? 0 : 1;
1178 setup_gsi.polarity = pol == INTR_POLARITY_HIGH ? 0 : 1;
1179
1180 error = HYPERVISOR_physdev_op(PHYSDEVOP_setup_gsi, &setup_gsi);
1181 if (error == -XEN_EEXIST) {
1182 if ((isrc->xi_edgetrigger && (trig != INTR_TRIGGER_EDGE)) ||
1183 (isrc->xi_activehi && (pol != INTR_POLARITY_HIGH)))
1184 panic("unable to reconfigure interrupt IRQ#%d",
1185 isrc->xi_pirq);
1186 error = 0;
1187 }
1188 if (error)
1189 panic("unable to configure IRQ#%d\n", isrc->xi_pirq);
1190
1191 isrc->xi_activehi = pol == INTR_POLARITY_HIGH ? 1 : 0;
1192 isrc->xi_edgetrigger = trig == INTR_TRIGGER_EDGE ? 1 : 0;
1193
1194 return (0);
1195 }
1196
1197 /*--------------------------- Public Functions -------------------------------*/
1198 /*------- API comments for these methods can be found in xen/xenintr.h -------*/
1199 int
xen_intr_bind_local_port(device_t dev,evtchn_port_t local_port,driver_filter_t filter,driver_intr_t handler,void * arg,enum intr_type flags,xen_intr_handle_t * port_handlep)1200 xen_intr_bind_local_port(device_t dev, evtchn_port_t local_port,
1201 driver_filter_t filter, driver_intr_t handler, void *arg,
1202 enum intr_type flags, xen_intr_handle_t *port_handlep)
1203 {
1204 struct xenisrc *isrc;
1205 int error;
1206
1207 error = xen_intr_bind_isrc(&isrc, local_port, EVTCHN_TYPE_PORT,
1208 device_get_nameunit(dev), filter, handler, arg, flags,
1209 port_handlep);
1210 if (error != 0)
1211 return (error);
1212
1213 /*
1214 * The Event Channel API didn't open this port, so it is not
1215 * responsible for closing it automatically on unbind.
1216 */
1217 isrc->xi_close = 0;
1218 return (0);
1219 }
1220
1221 int
xen_intr_alloc_and_bind_local_port(device_t dev,u_int remote_domain,driver_filter_t filter,driver_intr_t handler,void * arg,enum intr_type flags,xen_intr_handle_t * port_handlep)1222 xen_intr_alloc_and_bind_local_port(device_t dev, u_int remote_domain,
1223 driver_filter_t filter, driver_intr_t handler, void *arg,
1224 enum intr_type flags, xen_intr_handle_t *port_handlep)
1225 {
1226 struct xenisrc *isrc;
1227 struct evtchn_alloc_unbound alloc_unbound;
1228 int error;
1229
1230 alloc_unbound.dom = DOMID_SELF;
1231 alloc_unbound.remote_dom = remote_domain;
1232 error = HYPERVISOR_event_channel_op(EVTCHNOP_alloc_unbound,
1233 &alloc_unbound);
1234 if (error != 0) {
1235 /*
1236 * XXX Trap Hypercall error code Linuxisms in
1237 * the HYPERCALL layer.
1238 */
1239 return (-error);
1240 }
1241
1242 error = xen_intr_bind_isrc(&isrc, alloc_unbound.port, EVTCHN_TYPE_PORT,
1243 device_get_nameunit(dev), filter, handler, arg, flags,
1244 port_handlep);
1245 if (error != 0) {
1246 evtchn_close_t close = { .port = alloc_unbound.port };
1247 if (HYPERVISOR_event_channel_op(EVTCHNOP_close, &close))
1248 panic("EVTCHNOP_close failed");
1249 return (error);
1250 }
1251
1252 isrc->xi_close = 1;
1253 return (0);
1254 }
1255
1256 int
xen_intr_bind_remote_port(device_t dev,u_int remote_domain,u_int remote_port,driver_filter_t filter,driver_intr_t handler,void * arg,enum intr_type flags,xen_intr_handle_t * port_handlep)1257 xen_intr_bind_remote_port(device_t dev, u_int remote_domain,
1258 u_int remote_port, driver_filter_t filter, driver_intr_t handler,
1259 void *arg, enum intr_type flags, xen_intr_handle_t *port_handlep)
1260 {
1261 struct xenisrc *isrc;
1262 struct evtchn_bind_interdomain bind_interdomain;
1263 int error;
1264
1265 bind_interdomain.remote_dom = remote_domain;
1266 bind_interdomain.remote_port = remote_port;
1267 error = HYPERVISOR_event_channel_op(EVTCHNOP_bind_interdomain,
1268 &bind_interdomain);
1269 if (error != 0) {
1270 /*
1271 * XXX Trap Hypercall error code Linuxisms in
1272 * the HYPERCALL layer.
1273 */
1274 return (-error);
1275 }
1276
1277 error = xen_intr_bind_isrc(&isrc, bind_interdomain.local_port,
1278 EVTCHN_TYPE_PORT, device_get_nameunit(dev), filter, handler, arg,
1279 flags, port_handlep);
1280 if (error) {
1281 evtchn_close_t close = { .port = bind_interdomain.local_port };
1282 if (HYPERVISOR_event_channel_op(EVTCHNOP_close, &close))
1283 panic("EVTCHNOP_close failed");
1284 return (error);
1285 }
1286
1287 /*
1288 * The Event Channel API opened this port, so it is
1289 * responsible for closing it automatically on unbind.
1290 */
1291 isrc->xi_close = 1;
1292 return (0);
1293 }
1294
1295 int
xen_intr_bind_virq(device_t dev,u_int virq,u_int cpu,driver_filter_t filter,driver_intr_t handler,void * arg,enum intr_type flags,xen_intr_handle_t * port_handlep)1296 xen_intr_bind_virq(device_t dev, u_int virq, u_int cpu,
1297 driver_filter_t filter, driver_intr_t handler, void *arg,
1298 enum intr_type flags, xen_intr_handle_t *port_handlep)
1299 {
1300 int vcpu_id = pcpu_find(cpu)->pc_vcpu_id;
1301 struct xenisrc *isrc;
1302 struct evtchn_bind_virq bind_virq = { .virq = virq, .vcpu = vcpu_id };
1303 int error;
1304
1305 isrc = NULL;
1306 error = HYPERVISOR_event_channel_op(EVTCHNOP_bind_virq, &bind_virq);
1307 if (error != 0) {
1308 /*
1309 * XXX Trap Hypercall error code Linuxisms in
1310 * the HYPERCALL layer.
1311 */
1312 return (-error);
1313 }
1314
1315 error = xen_intr_bind_isrc(&isrc, bind_virq.port, EVTCHN_TYPE_VIRQ,
1316 device_get_nameunit(dev), filter, handler, arg, flags,
1317 port_handlep);
1318
1319 #ifdef SMP
1320 if (error == 0)
1321 error = intr_event_bind(isrc->xi_intsrc.is_event, cpu);
1322 #endif
1323
1324 if (error != 0) {
1325 evtchn_close_t close = { .port = bind_virq.port };
1326
1327 xen_intr_unbind(*port_handlep);
1328 if (HYPERVISOR_event_channel_op(EVTCHNOP_close, &close))
1329 panic("EVTCHNOP_close failed");
1330 return (error);
1331 }
1332
1333 #ifdef SMP
1334 if (isrc->xi_cpu != cpu) {
1335 /*
1336 * Too early in the boot process for the generic interrupt
1337 * code to perform the binding. Update our event channel
1338 * masks manually so events can't fire on the wrong cpu
1339 * during AP startup.
1340 */
1341 xen_intr_assign_cpu(&isrc->xi_intsrc, cpu_apic_ids[cpu]);
1342 }
1343 #endif
1344
1345 /*
1346 * The Event Channel API opened this port, so it is
1347 * responsible for closing it automatically on unbind.
1348 */
1349 isrc->xi_close = 1;
1350 isrc->xi_virq = virq;
1351
1352 return (0);
1353 }
1354
1355 int
xen_intr_alloc_and_bind_ipi(u_int cpu,driver_filter_t filter,enum intr_type flags,xen_intr_handle_t * port_handlep)1356 xen_intr_alloc_and_bind_ipi(u_int cpu, driver_filter_t filter,
1357 enum intr_type flags, xen_intr_handle_t *port_handlep)
1358 {
1359 #ifdef SMP
1360 int vcpu_id = pcpu_find(cpu)->pc_vcpu_id;
1361 struct xenisrc *isrc;
1362 struct evtchn_bind_ipi bind_ipi = { .vcpu = vcpu_id };
1363 /* Same size as the one used by intr_handler->ih_name. */
1364 char name[MAXCOMLEN + 1];
1365 int error;
1366
1367 isrc = NULL;
1368 error = HYPERVISOR_event_channel_op(EVTCHNOP_bind_ipi, &bind_ipi);
1369 if (error != 0) {
1370 /*
1371 * XXX Trap Hypercall error code Linuxisms in
1372 * the HYPERCALL layer.
1373 */
1374 return (-error);
1375 }
1376
1377 snprintf(name, sizeof(name), "cpu%u", cpu);
1378
1379 error = xen_intr_bind_isrc(&isrc, bind_ipi.port, EVTCHN_TYPE_IPI,
1380 name, filter, NULL, NULL, flags, port_handlep);
1381 if (error != 0) {
1382 evtchn_close_t close = { .port = bind_ipi.port };
1383
1384 xen_intr_unbind(*port_handlep);
1385 if (HYPERVISOR_event_channel_op(EVTCHNOP_close, &close))
1386 panic("EVTCHNOP_close failed");
1387 return (error);
1388 }
1389
1390 if (isrc->xi_cpu != cpu) {
1391 /*
1392 * Too early in the boot process for the generic interrupt
1393 * code to perform the binding. Update our event channel
1394 * masks manually so events can't fire on the wrong cpu
1395 * during AP startup.
1396 */
1397 xen_intr_assign_cpu(&isrc->xi_intsrc, cpu_apic_ids[cpu]);
1398 }
1399
1400 /*
1401 * The Event Channel API opened this port, so it is
1402 * responsible for closing it automatically on unbind.
1403 */
1404 isrc->xi_close = 1;
1405 return (0);
1406 #else
1407 return (EOPNOTSUPP);
1408 #endif
1409 }
1410
1411 int
xen_register_pirq(int vector,enum intr_trigger trig,enum intr_polarity pol)1412 xen_register_pirq(int vector, enum intr_trigger trig, enum intr_polarity pol)
1413 {
1414 struct physdev_map_pirq map_pirq;
1415 struct xenisrc *isrc;
1416 int error;
1417
1418 if (vector == 0)
1419 return (EINVAL);
1420
1421 if (bootverbose)
1422 printf("xen: register IRQ#%d\n", vector);
1423
1424 map_pirq.domid = DOMID_SELF;
1425 map_pirq.type = MAP_PIRQ_TYPE_GSI;
1426 map_pirq.index = vector;
1427 map_pirq.pirq = vector;
1428
1429 error = HYPERVISOR_physdev_op(PHYSDEVOP_map_pirq, &map_pirq);
1430 if (error) {
1431 printf("xen: unable to map IRQ#%d\n", vector);
1432 return (error);
1433 }
1434
1435 mtx_lock(&xen_intr_isrc_lock);
1436 isrc = xen_intr_alloc_isrc(EVTCHN_TYPE_PIRQ, vector);
1437 mtx_unlock(&xen_intr_isrc_lock);
1438 KASSERT((isrc != NULL), ("xen: unable to allocate isrc for interrupt"));
1439 isrc->xi_pirq = vector;
1440 isrc->xi_activehi = pol == INTR_POLARITY_HIGH ? 1 : 0;
1441 isrc->xi_edgetrigger = trig == INTR_TRIGGER_EDGE ? 1 : 0;
1442
1443 return (0);
1444 }
1445
1446 int
xen_register_msi(device_t dev,int vector,int count)1447 xen_register_msi(device_t dev, int vector, int count)
1448 {
1449 struct physdev_map_pirq msi_irq;
1450 struct xenisrc *isrc;
1451 int ret;
1452
1453 memset(&msi_irq, 0, sizeof(msi_irq));
1454 msi_irq.domid = DOMID_SELF;
1455 msi_irq.type = count == 1 ?
1456 MAP_PIRQ_TYPE_MSI_SEG : MAP_PIRQ_TYPE_MULTI_MSI;
1457 msi_irq.index = -1;
1458 msi_irq.pirq = -1;
1459 msi_irq.bus = pci_get_bus(dev) | (pci_get_domain(dev) << 16);
1460 msi_irq.devfn = (pci_get_slot(dev) << 3) | pci_get_function(dev);
1461 msi_irq.entry_nr = count;
1462
1463 ret = HYPERVISOR_physdev_op(PHYSDEVOP_map_pirq, &msi_irq);
1464 if (ret != 0)
1465 return (ret);
1466 if (count != msi_irq.entry_nr) {
1467 panic("unable to setup all requested MSI vectors "
1468 "(expected %d got %d)", count, msi_irq.entry_nr);
1469 }
1470
1471 mtx_lock(&xen_intr_isrc_lock);
1472 for (int i = 0; i < count; i++) {
1473 isrc = xen_intr_alloc_isrc(EVTCHN_TYPE_PIRQ, vector + i);
1474 KASSERT(isrc != NULL,
1475 ("xen: unable to allocate isrc for interrupt"));
1476 isrc->xi_pirq = msi_irq.pirq + i;
1477 /* MSI interrupts are always edge triggered */
1478 isrc->xi_edgetrigger = 1;
1479 }
1480 mtx_unlock(&xen_intr_isrc_lock);
1481
1482 return (0);
1483 }
1484
1485 int
xen_release_msi(int vector)1486 xen_release_msi(int vector)
1487 {
1488 struct physdev_unmap_pirq unmap;
1489 struct xenisrc *isrc;
1490 int ret;
1491
1492 isrc = (struct xenisrc *)intr_lookup_source(vector);
1493 if (isrc == NULL)
1494 return (ENXIO);
1495
1496 unmap.pirq = isrc->xi_pirq;
1497 ret = HYPERVISOR_physdev_op(PHYSDEVOP_unmap_pirq, &unmap);
1498 if (ret != 0)
1499 return (ret);
1500
1501 xen_intr_release_isrc(isrc);
1502
1503 return (0);
1504 }
1505
1506 int
xen_intr_describe(xen_intr_handle_t port_handle,const char * fmt,...)1507 xen_intr_describe(xen_intr_handle_t port_handle, const char *fmt, ...)
1508 {
1509 char descr[MAXCOMLEN + 1];
1510 struct xenisrc *isrc;
1511 va_list ap;
1512
1513 isrc = xen_intr_isrc(port_handle);
1514 if (isrc == NULL)
1515 return (EINVAL);
1516
1517 va_start(ap, fmt);
1518 vsnprintf(descr, sizeof(descr), fmt, ap);
1519 va_end(ap);
1520 return (intr_describe(isrc->xi_vector, isrc->xi_cookie, descr));
1521 }
1522
1523 void
xen_intr_unbind(xen_intr_handle_t * port_handlep)1524 xen_intr_unbind(xen_intr_handle_t *port_handlep)
1525 {
1526 struct xenisrc *isrc;
1527
1528 KASSERT(port_handlep != NULL,
1529 ("NULL xen_intr_handle_t passed to xen_intr_unbind"));
1530
1531 isrc = xen_intr_isrc(*port_handlep);
1532 *port_handlep = NULL;
1533 if (isrc == NULL)
1534 return;
1535
1536 mtx_lock(&xen_intr_isrc_lock);
1537 if (refcount_release(&isrc->xi_refcount) == 0) {
1538 mtx_unlock(&xen_intr_isrc_lock);
1539 return;
1540 }
1541 mtx_unlock(&xen_intr_isrc_lock);
1542
1543 if (isrc->xi_cookie != NULL)
1544 intr_remove_handler(isrc->xi_cookie);
1545 xen_intr_release_isrc(isrc);
1546 }
1547
1548 void
xen_intr_signal(xen_intr_handle_t handle)1549 xen_intr_signal(xen_intr_handle_t handle)
1550 {
1551 struct xenisrc *isrc;
1552
1553 isrc = xen_intr_isrc(handle);
1554 if (isrc != NULL) {
1555 KASSERT(isrc->xi_type == EVTCHN_TYPE_PORT ||
1556 isrc->xi_type == EVTCHN_TYPE_IPI,
1557 ("evtchn_signal on something other than a local port"));
1558 struct evtchn_send send = { .port = isrc->xi_port };
1559 (void)HYPERVISOR_event_channel_op(EVTCHNOP_send, &send);
1560 }
1561 }
1562
1563 evtchn_port_t
xen_intr_port(xen_intr_handle_t handle)1564 xen_intr_port(xen_intr_handle_t handle)
1565 {
1566 struct xenisrc *isrc;
1567
1568 isrc = xen_intr_isrc(handle);
1569 if (isrc == NULL)
1570 return (0);
1571
1572 return (isrc->xi_port);
1573 }
1574
1575 int
xen_intr_add_handler(const char * name,driver_filter_t filter,driver_intr_t handler,void * arg,enum intr_type flags,xen_intr_handle_t handle)1576 xen_intr_add_handler(const char *name, driver_filter_t filter,
1577 driver_intr_t handler, void *arg, enum intr_type flags,
1578 xen_intr_handle_t handle)
1579 {
1580 struct xenisrc *isrc;
1581 int error;
1582
1583 isrc = xen_intr_isrc(handle);
1584 if (isrc == NULL || isrc->xi_cookie != NULL)
1585 return (EINVAL);
1586
1587 error = intr_add_handler(name, isrc->xi_vector,filter, handler, arg,
1588 flags|INTR_EXCL, &isrc->xi_cookie, 0);
1589 if (error != 0) {
1590 printf(
1591 "%s: xen_intr_add_handler: intr_add_handler failed: %d\n",
1592 name, error);
1593 }
1594
1595 return (error);
1596 }
1597
1598 int
xen_intr_get_evtchn_from_port(evtchn_port_t port,xen_intr_handle_t * handlep)1599 xen_intr_get_evtchn_from_port(evtchn_port_t port, xen_intr_handle_t *handlep)
1600 {
1601
1602 if (!is_valid_evtchn(port) || port >= NR_EVENT_CHANNELS)
1603 return (EINVAL);
1604
1605 if (handlep == NULL) {
1606 return (EINVAL);
1607 }
1608
1609 mtx_lock(&xen_intr_isrc_lock);
1610 if (xen_intr_port_to_isrc[port] == NULL) {
1611 mtx_unlock(&xen_intr_isrc_lock);
1612 return (EINVAL);
1613 }
1614 refcount_acquire(&xen_intr_port_to_isrc[port]->xi_refcount);
1615 mtx_unlock(&xen_intr_isrc_lock);
1616
1617 /* Assign the opaque handler (the event channel port) */
1618 *handlep = &xen_intr_port_to_isrc[port]->xi_vector;
1619
1620 return (0);
1621 }
1622
1623 #ifdef DDB
1624 static const char *
xen_intr_print_type(enum evtchn_type type)1625 xen_intr_print_type(enum evtchn_type type)
1626 {
1627 static const char *evtchn_type_to_string[EVTCHN_TYPE_COUNT] = {
1628 [EVTCHN_TYPE_UNBOUND] = "UNBOUND",
1629 [EVTCHN_TYPE_PIRQ] = "PIRQ",
1630 [EVTCHN_TYPE_VIRQ] = "VIRQ",
1631 [EVTCHN_TYPE_IPI] = "IPI",
1632 [EVTCHN_TYPE_PORT] = "PORT",
1633 };
1634
1635 if (type >= EVTCHN_TYPE_COUNT)
1636 return ("UNKNOWN");
1637
1638 return (evtchn_type_to_string[type]);
1639 }
1640
1641 static void
xen_intr_dump_port(struct xenisrc * isrc)1642 xen_intr_dump_port(struct xenisrc *isrc)
1643 {
1644 struct xen_intr_pcpu_data *pcpu;
1645 shared_info_t *s = HYPERVISOR_shared_info;
1646 int i;
1647
1648 db_printf("Port %d Type: %s\n",
1649 isrc->xi_port, xen_intr_print_type(isrc->xi_type));
1650 if (isrc->xi_type == EVTCHN_TYPE_PIRQ) {
1651 db_printf("\tPirq: %d ActiveHi: %d EdgeTrigger: %d "
1652 "NeedsEOI: %d\n",
1653 isrc->xi_pirq, isrc->xi_activehi, isrc->xi_edgetrigger,
1654 !!xen_test_bit(isrc->xi_pirq, xen_intr_pirq_eoi_map));
1655 }
1656 if (isrc->xi_type == EVTCHN_TYPE_VIRQ)
1657 db_printf("\tVirq: %d\n", isrc->xi_virq);
1658
1659 db_printf("\tMasked: %d Pending: %d\n",
1660 !!xen_test_bit(isrc->xi_port, &s->evtchn_mask[0]),
1661 !!xen_test_bit(isrc->xi_port, &s->evtchn_pending[0]));
1662
1663 db_printf("\tPer-CPU Masks: ");
1664 CPU_FOREACH(i) {
1665 pcpu = DPCPU_ID_PTR(i, xen_intr_pcpu);
1666 db_printf("cpu#%d: %d ", i,
1667 !!xen_test_bit(isrc->xi_port, pcpu->evtchn_enabled));
1668 }
1669 db_printf("\n");
1670 }
1671
DB_SHOW_COMMAND(xen_evtchn,db_show_xen_evtchn)1672 DB_SHOW_COMMAND(xen_evtchn, db_show_xen_evtchn)
1673 {
1674 int i;
1675
1676 if (!xen_domain()) {
1677 db_printf("Only available on Xen guests\n");
1678 return;
1679 }
1680
1681 for (i = 0; i < NR_EVENT_CHANNELS; i++) {
1682 struct xenisrc *isrc;
1683
1684 isrc = xen_intr_port_to_isrc[i];
1685 if (isrc == NULL)
1686 continue;
1687
1688 xen_intr_dump_port(isrc);
1689 }
1690 }
1691 #endif /* DDB */
1692