2007-07-17 18:37:05 -07:00
# ifndef _XEN_EVENTS_H
# define _XEN_EVENTS_H
2007-07-17 18:37:06 -07:00
# include <linux/interrupt.h>
2014-02-27 19:15:35 +01:00
# ifdef CONFIG_PCI_MSI
# include <linux/msi.h>
# endif
2007-07-17 18:37:06 -07:00
# include <xen/interface/event_channel.h>
# include <asm/xen/hypercall.h>
2008-04-02 10:53:56 -07:00
# include <asm/xen/events.h>
2007-07-17 18:37:05 -07:00
2013-09-23 21:03:38 +01:00
unsigned xen_evtchn_nr_channels ( void ) ;
2007-07-17 18:37:06 -07:00
int bind_evtchn_to_irq ( unsigned int evtchn ) ;
2007-07-17 18:37:05 -07:00
int bind_evtchn_to_irqhandler ( unsigned int evtchn ,
2007-07-17 18:37:06 -07:00
irq_handler_t handler ,
2007-07-17 18:37:05 -07:00
unsigned long irqflags , const char * devname ,
void * dev_id ) ;
2015-05-19 18:40:49 +01:00
int bind_virq_to_irq ( unsigned int virq , unsigned int cpu , bool percpu ) ;
2007-07-17 18:37:05 -07:00
int bind_virq_to_irqhandler ( unsigned int virq , unsigned int cpu ,
2007-07-17 18:37:06 -07:00
irq_handler_t handler ,
unsigned long irqflags , const char * devname ,
void * dev_id ) ;
int bind_ipi_to_irqhandler ( enum ipi_vector ipi ,
unsigned int cpu ,
irq_handler_t handler ,
unsigned long irqflags ,
const char * devname ,
void * dev_id ) ;
2014-08-28 06:44:09 +02:00
int bind_interdomain_evtchn_to_irq ( unsigned int remote_domain ,
unsigned int remote_port ) ;
2009-02-09 12:05:50 -08:00
int bind_interdomain_evtchn_to_irqhandler ( unsigned int remote_domain ,
unsigned int remote_port ,
irq_handler_t handler ,
unsigned long irqflags ,
const char * devname ,
void * dev_id ) ;
2007-07-17 18:37:05 -07:00
/*
* Common unbind function for all event sources . Takes IRQ to unbind from .
* Automatically closes the underlying event channel ( even for bindings
* made with bind_evtchn_to_irqhandler ( ) ) .
*/
void unbind_from_irqhandler ( unsigned int irq , void * dev_id ) ;
2013-09-23 12:47:26 +01:00
# define XEN_IRQ_PRIORITY_MAX EVTCHN_FIFO_PRIORITY_MAX
# define XEN_IRQ_PRIORITY_DEFAULT EVTCHN_FIFO_PRIORITY_DEFAULT
# define XEN_IRQ_PRIORITY_MIN EVTCHN_FIFO_PRIORITY_MIN
int xen_set_irq_priority ( unsigned irq , unsigned priority ) ;
2011-10-27 17:58:47 -04:00
/*
* Allow extra references to event channels exposed to userspace by evtchn
*/
int evtchn_make_refcounted ( unsigned int evtchn ) ;
int evtchn_get ( unsigned int evtchn ) ;
void evtchn_put ( unsigned int evtchn ) ;
2007-07-17 18:37:06 -07:00
void xen_send_IPI_one ( unsigned int cpu , enum ipi_vector vector ) ;
2008-05-26 23:31:23 +01:00
void rebind_evtchn_irq ( int evtchn , int irq ) ;
xen-evtchn: Bind dyn evtchn:qemu-dm interrupt to next online VCPU
A HVM domian booting generates around 200K (evtchn:qemu-dm xen-dyn)
interrupts,in a short period of time. All these evtchn:qemu-dm are bound
to VCPU 0, until irqbalance sees these IRQ and moves it to a different VCPU.
In one configuration, irqbalance runs every 10 seconds, which means
irqbalance doesn't get to see these burst of interrupts and doesn't
re-balance interrupts most of the time, making all evtchn:qemu-dm to be
processed by VCPU0. This cause VCPU0 to spend most of time processing
hardirq and very little time on softirq. Moreover, if dom0 kernel PREEMPTION
is disabled, VCPU0 never runs watchdog (process context), triggering a
softlockup detection code to panic.
Binding evtchn:qemu-dm to next online VCPU, will spread hardirq
processing evenly across different CPU. Later, irqbalance will try to balance
evtchn:qemu-dm, if required.
Signed-off-by: Anoob Soman <anoob.soman@citrix.com>
Reviewed-by: Boris Ostrovsky <boris.ostrovsky@oracle.com>
Signed-off-by: Juergen Gross <jgross@suse.com>
2017-06-07 12:46:56 +01:00
int xen_rebind_evtchn_to_cpu ( int evtchn , unsigned tcpu ) ;
2007-07-17 18:37:06 -07:00
2007-07-17 18:37:05 -07:00
static inline void notify_remote_via_evtchn ( int port )
{
struct evtchn_send send = { . port = port } ;
( void ) HYPERVISOR_event_channel_op ( EVTCHNOP_send , & send ) ;
}
2011-03-10 16:08:05 +00:00
void notify_remote_via_irq ( int irq ) ;
2008-05-26 23:31:27 +01:00
2011-03-10 16:08:05 +00:00
void xen_irq_resume ( void ) ;
2008-05-26 23:31:27 +01:00
xen: implement Xen-specific spinlocks
The standard ticket spinlocks are very expensive in a virtual
environment, because their performance depends on Xen's scheduler
giving vcpus time in the order that they're supposed to take the
spinlock.
This implements a Xen-specific spinlock, which should be much more
efficient.
The fast-path is essentially the old Linux-x86 locks, using a single
lock byte. The locker decrements the byte; if the result is 0, then
they have the lock. If the lock is negative, then locker must spin
until the lock is positive again.
When there's contention, the locker spin for 2^16[*] iterations waiting
to get the lock. If it fails to get the lock in that time, it adds
itself to the contention count in the lock and blocks on a per-cpu
event channel.
When unlocking the spinlock, the locker looks to see if there's anyone
blocked waiting for the lock by checking for a non-zero waiter count.
If there's a waiter, it traverses the per-cpu "lock_spinners"
variable, which contains which lock each CPU is waiting on. It picks
one CPU waiting on the lock and sends it an event to wake it up.
This allows efficient fast-path spinlock operation, while allowing
spinning vcpus to give up their processor time while waiting for a
contended lock.
[*] 2^16 iterations is threshold at which 98% locks have been taken
according to Thomas Friebel's Xen Summit talk "Preventing Guests from
Spinning Around". Therefore, we'd expect the lock and unlock slow
paths will only be entered 2% of the time.
Signed-off-by: Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>
Cc: Jens Axboe <axboe@kernel.dk>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Christoph Lameter <clameter@linux-foundation.org>
Cc: Petr Tesarik <ptesarik@suse.cz>
Cc: Virtualization <virtualization@lists.linux-foundation.org>
Cc: Xen devel <xen-devel@lists.xensource.com>
Cc: Thomas Friebel <thomas.friebel@amd.com>
Cc: Nick Piggin <nickpiggin@yahoo.com.au>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-07-07 12:07:53 -07:00
/* Clear an irq's pending state, in preparation for polling on it */
void xen_clear_irq_pending ( int irq ) ;
2008-08-20 17:02:18 -07:00
void xen_set_irq_pending ( int irq ) ;
bool xen_test_irq_pending ( int irq ) ;
xen: implement Xen-specific spinlocks
The standard ticket spinlocks are very expensive in a virtual
environment, because their performance depends on Xen's scheduler
giving vcpus time in the order that they're supposed to take the
spinlock.
This implements a Xen-specific spinlock, which should be much more
efficient.
The fast-path is essentially the old Linux-x86 locks, using a single
lock byte. The locker decrements the byte; if the result is 0, then
they have the lock. If the lock is negative, then locker must spin
until the lock is positive again.
When there's contention, the locker spin for 2^16[*] iterations waiting
to get the lock. If it fails to get the lock in that time, it adds
itself to the contention count in the lock and blocks on a per-cpu
event channel.
When unlocking the spinlock, the locker looks to see if there's anyone
blocked waiting for the lock by checking for a non-zero waiter count.
If there's a waiter, it traverses the per-cpu "lock_spinners"
variable, which contains which lock each CPU is waiting on. It picks
one CPU waiting on the lock and sends it an event to wake it up.
This allows efficient fast-path spinlock operation, while allowing
spinning vcpus to give up their processor time while waiting for a
contended lock.
[*] 2^16 iterations is threshold at which 98% locks have been taken
according to Thomas Friebel's Xen Summit talk "Preventing Guests from
Spinning Around". Therefore, we'd expect the lock and unlock slow
paths will only be entered 2% of the time.
Signed-off-by: Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>
Cc: Jens Axboe <axboe@kernel.dk>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Christoph Lameter <clameter@linux-foundation.org>
Cc: Petr Tesarik <ptesarik@suse.cz>
Cc: Virtualization <virtualization@lists.linux-foundation.org>
Cc: Xen devel <xen-devel@lists.xensource.com>
Cc: Thomas Friebel <thomas.friebel@amd.com>
Cc: Nick Piggin <nickpiggin@yahoo.com.au>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-07-07 12:07:53 -07:00
/* Poll waiting for an irq to become pending. In the usual case, the
irq will be disabled so it won ' t deliver an interrupt . */
void xen_poll_irq ( int irq ) ;
2009-11-05 16:33:09 -05:00
/* Poll waiting for an irq to become pending with a timeout. In the usual case,
* the irq will be disabled so it won ' t deliver an interrupt . */
void xen_poll_irq_timeout ( int irq , u64 timeout ) ;
2009-02-06 19:20:31 -08:00
/* Determine the IRQ which is bound to an event channel */
unsigned irq_from_evtchn ( unsigned int evtchn ) ;
2013-03-13 15:29:25 +00:00
int irq_from_virq ( unsigned int cpu , unsigned int virq ) ;
unsigned int evtchn_from_irq ( unsigned irq ) ;
2009-02-06 19:20:31 -08:00
2010-05-14 12:40:51 +01:00
/* Xen HVM evtchn vector callback */
2011-03-10 16:08:05 +00:00
void xen_hvm_callback_vector ( void ) ;
x86, trace: Add irq vector tracepoints
[Purpose of this patch]
As Vaibhav explained in the thread below, tracepoints for irq vectors
are useful.
http://www.spinics.net/lists/mm-commits/msg85707.html
<snip>
The current interrupt traces from irq_handler_entry and irq_handler_exit
provide when an interrupt is handled. They provide good data about when
the system has switched to kernel space and how it affects the currently
running processes.
There are some IRQ vectors which trigger the system into kernel space,
which are not handled in generic IRQ handlers. Tracing such events gives
us the information about IRQ interaction with other system events.
The trace also tells where the system is spending its time. We want to
know which cores are handling interrupts and how they are affecting other
processes in the system. Also, the trace provides information about when
the cores are idle and which interrupts are changing that state.
<snip>
On the other hand, my usecase is tracing just local timer event and
getting a value of instruction pointer.
I suggested to add an argument local timer event to get instruction pointer before.
But there is another way to get it with external module like systemtap.
So, I don't need to add any argument to irq vector tracepoints now.
[Patch Description]
Vaibhav's patch shared a trace point ,irq_vector_entry/irq_vector_exit, in all events.
But there is an above use case to trace specific irq_vector rather than tracing all events.
In this case, we are concerned about overhead due to unwanted events.
So, add following tracepoints instead of introducing irq_vector_entry/exit.
so that we can enable them independently.
- local_timer_vector
- reschedule_vector
- call_function_vector
- call_function_single_vector
- irq_work_entry_vector
- error_apic_vector
- thermal_apic_vector
- threshold_apic_vector
- spurious_apic_vector
- x86_platform_ipi_vector
Also, introduce a logic switching IDT at enabling/disabling time so that a time penalty
makes a zero when tracepoints are disabled. Detailed explanations are as follows.
- Create trace irq handlers with entering_irq()/exiting_irq().
- Create a new IDT, trace_idt_table, at boot time by adding a logic to
_set_gate(). It is just a copy of original idt table.
- Register the new handlers for tracpoints to the new IDT by introducing
macros to alloc_intr_gate() called at registering time of irq_vector handlers.
- Add checking, whether irq vector tracing is on/off, into load_current_idt().
This has to be done below debug checking for these reasons.
- Switching to debug IDT may be kicked while tracing is enabled.
- On the other hands, switching to trace IDT is kicked only when debugging
is disabled.
In addition, the new IDT is created only when CONFIG_TRACING is enabled to avoid being
used for other purposes.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Link: http://lkml.kernel.org/r/51C323ED.5050708@hds.com
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Cc: Steven Rostedt <rostedt@goodmis.org>
2013-06-20 11:46:53 -04:00
# ifdef CONFIG_TRACING
# define trace_xen_hvm_callback_vector xen_hvm_callback_vector
# endif
2010-05-14 12:40:51 +01:00
int xen_set_callback_via ( uint64_t via ) ;
void xen_evtchn_do_upcall ( struct pt_regs * regs ) ;
void xen_hvm_evtchn_do_upcall ( void ) ;
2011-03-10 16:08:07 +00:00
/* Bind a pirq for a physical interrupt to an irq. */
int xen_bind_pirq_gsi_to_irq ( unsigned gsi ,
unsigned pirq , int shareable , char * name ) ;
2010-10-11 15:30:09 +01:00
# ifdef CONFIG_PCI_MSI
2011-03-10 16:08:07 +00:00
/* Allocate a pirq for a MSI style physical interrupt. */
2011-02-18 16:43:32 +00:00
int xen_allocate_pirq_msi ( struct pci_dev * dev , struct msi_desc * msidesc ) ;
2011-03-10 16:08:07 +00:00
/* Bind an PSI pirq to an irq. */
2011-02-18 16:43:32 +00:00
int xen_bind_pirq_msi_to_irq ( struct pci_dev * dev , struct msi_desc * msidesc ,
2014-02-27 19:15:35 +01:00
int pirq , int nvec , const char * name , domid_t domid ) ;
2010-10-11 15:30:09 +01:00
# endif
2010-10-01 12:20:09 -04:00
2010-03-18 16:31:34 -04:00
/* De-allocates the above mentioned physical interrupt. */
int xen_destroy_irq ( int irq ) ;
2010-12-01 14:51:44 +00:00
/* Return irq from pirq */
int xen_irq_from_pirq ( unsigned pirq ) ;
2011-02-24 14:20:12 -05:00
/* Return the pirq allocated to the irq. */
int xen_pirq_from_irq ( unsigned irq ) ;
2012-05-21 16:54:10 +01:00
/* Return the irq allocated to the gsi */
int xen_irq_from_gsi ( unsigned gsi ) ;
2010-11-08 14:26:36 -05:00
/* Determine whether to ignore this IRQ if it is passed to a guest. */
int xen_test_irq_shared ( int irq ) ;
2012-09-14 13:37:32 +00:00
/* initialize Xen IRQ subsystem */
void xen_init_IRQ ( void ) ;
2007-07-17 18:37:05 -07:00
# endif /* _XEN_EVENTS_H */