2014-11-24 14:35:11 +00:00
/*
* Copyright ( C ) 2013 , 2014 ARM Limited , All Rights Reserved .
* Author : Marc Zyngier < marc . zyngier @ arm . com >
*
* This program is free software ; you can redistribute it and / or modify
* it under the terms of the GNU General Public License version 2 as
* published by the Free Software Foundation .
*
* This program is distributed in the hope that it will be useful ,
* but WITHOUT ANY WARRANTY ; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
* GNU General Public License for more details .
*
* You should have received a copy of the GNU General Public License
* along with this program . If not , see < http : //www.gnu.org/licenses/>.
*/
2016-09-12 20:32:25 +02:00
# include <linux/acpi.h>
2014-11-24 14:35:11 +00:00
# include <linux/bitmap.h>
# include <linux/cpu.h>
# include <linux/delay.h>
2016-09-12 17:13:59 +01:00
# include <linux/dma-iommu.h>
2014-11-24 14:35:11 +00:00
# include <linux/interrupt.h>
2016-09-12 20:32:25 +02:00
# include <linux/irqdomain.h>
# include <linux/acpi_iort.h>
2014-11-24 14:35:11 +00:00
# include <linux/log2.h>
# include <linux/mm.h>
# include <linux/msi.h>
# include <linux/of.h>
# include <linux/of_address.h>
# include <linux/of_irq.h>
# include <linux/of_pci.h>
# include <linux/of_platform.h>
# include <linux/percpu.h>
# include <linux/slab.h>
2015-07-07 17:11:46 -04:00
# include <linux/irqchip.h>
2014-11-24 14:35:11 +00:00
# include <linux/irqchip/arm-gic-v3.h>
# include <asm/cputype.h>
# include <asm/exception.h>
2015-09-21 22:58:37 +02:00
# include "irq-gic-common.h"
2015-09-21 22:58:38 +02:00
# define ITS_FLAGS_CMDQ_NEEDS_FLUSHING (1ULL << 0)
# define ITS_FLAGS_WORKAROUND_CAVIUM_22375 (1ULL << 1)
2016-05-25 15:29:20 +02:00
# define ITS_FLAGS_WORKAROUND_CAVIUM_23144 (1ULL << 2)
2014-11-24 14:35:11 +00:00
2014-11-24 14:35:12 +00:00
# define RDIST_FLAGS_PROPBASE_NEEDS_FLUSHING (1 << 0)
2014-11-24 14:35:11 +00:00
/*
* Collection structure - just an ID , and a redistributor address to
* ping . We use one per CPU as a bag of interrupts assigned to this
* CPU .
*/
struct its_collection {
u64 target_address ;
u16 col_id ;
} ;
2016-03-09 22:10:49 -06:00
/*
2016-06-06 18:17:30 -05:00
* The ITS_BASER structure - contains memory information , cached
* value of BASER register configuration and ITS page size .
2016-03-09 22:10:49 -06:00
*/
struct its_baser {
void * base ;
u64 val ;
u32 order ;
2016-06-06 18:17:30 -05:00
u32 psz ;
2016-03-09 22:10:49 -06:00
} ;
2014-11-24 14:35:11 +00:00
/*
* The ITS structure - contains most of the infrastructure , with the
2015-07-28 14:46:20 +01:00
* top - level MSI domain , the command queue , the collections , and the
* list of devices writing to it .
2014-11-24 14:35:11 +00:00
*/
struct its_node {
raw_spinlock_t lock ;
struct list_head entry ;
void __iomem * base ;
2016-09-12 20:32:24 +02:00
phys_addr_t phys_base ;
2014-11-24 14:35:11 +00:00
struct its_cmd_block * cmd_base ;
struct its_cmd_block * cmd_write ;
2016-03-09 22:10:49 -06:00
struct its_baser tables [ GITS_BASER_NR_REGS ] ;
2014-11-24 14:35:11 +00:00
struct its_collection * collections ;
struct list_head its_device_list ;
u64 flags ;
u32 ite_size ;
2016-03-09 22:10:49 -06:00
u32 device_ids ;
2016-05-25 15:29:20 +02:00
int numa_node ;
2014-11-24 14:35:11 +00:00
} ;
# define ITS_ITT_ALIGN SZ_256
2016-02-16 18:00:36 -06:00
/* Convert page order to size in bytes */
# define PAGE_ORDER_TO_SIZE(o) (PAGE_SIZE << (o))
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
struct event_lpi_map {
unsigned long * lpi_map ;
u16 * col_map ;
irq_hw_number_t lpi_base ;
int nr_lpis ;
} ;
2014-11-24 14:35:11 +00:00
/*
* The ITS view of a device - belongs to an ITS , a collection , owns an
* interrupt translation table , and a list of interrupts .
*/
struct its_device {
struct list_head entry ;
struct its_node * its ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
struct event_lpi_map event_map ;
2014-11-24 14:35:11 +00:00
void * itt ;
u32 nr_ites ;
u32 device_id ;
} ;
2014-11-24 14:35:14 +00:00
static LIST_HEAD ( its_nodes ) ;
static DEFINE_SPINLOCK ( its_lock ) ;
static struct rdists * gic_rdists ;
2016-09-12 20:32:24 +02:00
static struct irq_domain * its_parent ;
2014-11-24 14:35:14 +00:00
# define gic_data_rdist() (raw_cpu_ptr(gic_rdists->rdist))
# define gic_data_rdist_rd_base() (gic_data_rdist()->rd_base)
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
static struct its_collection * dev_event_to_col ( struct its_device * its_dev ,
u32 event )
{
struct its_node * its = its_dev - > its ;
return its - > collections + its_dev - > event_map . col_map [ event ] ;
}
2014-11-24 14:35:11 +00:00
/*
* ITS command descriptors - parameters to be encoded in a command
* block .
*/
struct its_cmd_desc {
union {
struct {
struct its_device * dev ;
u32 event_id ;
} its_inv_cmd ;
struct {
struct its_device * dev ;
u32 event_id ;
} its_int_cmd ;
struct {
struct its_device * dev ;
int valid ;
} its_mapd_cmd ;
struct {
struct its_collection * col ;
int valid ;
} its_mapc_cmd ;
struct {
struct its_device * dev ;
u32 phys_id ;
u32 event_id ;
2016-12-20 15:52:26 +00:00
} its_mapti_cmd ;
2014-11-24 14:35:11 +00:00
struct {
struct its_device * dev ;
struct its_collection * col ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
u32 event_id ;
2014-11-24 14:35:11 +00:00
} its_movi_cmd ;
struct {
struct its_device * dev ;
u32 event_id ;
} its_discard_cmd ;
struct {
struct its_collection * col ;
} its_invall_cmd ;
} ;
} ;
/*
* The ITS command block , which is what the ITS actually parses .
*/
struct its_cmd_block {
u64 raw_cmd [ 4 ] ;
} ;
# define ITS_CMD_QUEUE_SZ SZ_64K
# define ITS_CMD_QUEUE_NR_ENTRIES (ITS_CMD_QUEUE_SZ / sizeof(struct its_cmd_block))
typedef struct its_collection * ( * its_cmd_builder_t ) ( struct its_cmd_block * ,
struct its_cmd_desc * ) ;
2016-12-19 17:11:52 +00:00
static void its_mask_encode ( u64 * raw_cmd , u64 val , int h , int l )
{
u64 mask = GENMASK_ULL ( h , l ) ;
* raw_cmd & = ~ mask ;
* raw_cmd | = ( val < < l ) & mask ;
}
2014-11-24 14:35:11 +00:00
static void its_encode_cmd ( struct its_cmd_block * cmd , u8 cmd_nr )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 0 ] , cmd_nr , 7 , 0 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_devid ( struct its_cmd_block * cmd , u32 devid )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 0 ] , devid , 63 , 32 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_event_id ( struct its_cmd_block * cmd , u32 id )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 1 ] , id , 31 , 0 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_phys_id ( struct its_cmd_block * cmd , u32 phys_id )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 1 ] , phys_id , 63 , 32 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_size ( struct its_cmd_block * cmd , u8 size )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 1 ] , size , 4 , 0 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_itt ( struct its_cmd_block * cmd , u64 itt_addr )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 2 ] , itt_addr > > 8 , 50 , 8 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_valid ( struct its_cmd_block * cmd , int valid )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 2 ] , ! ! valid , 63 , 63 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_target ( struct its_cmd_block * cmd , u64 target_addr )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 2 ] , target_addr > > 16 , 50 , 16 ) ;
2014-11-24 14:35:11 +00:00
}
static void its_encode_collection ( struct its_cmd_block * cmd , u16 col )
{
2016-12-19 17:11:52 +00:00
its_mask_encode ( & cmd - > raw_cmd [ 2 ] , col , 15 , 0 ) ;
2014-11-24 14:35:11 +00:00
}
static inline void its_fixup_cmd ( struct its_cmd_block * cmd )
{
/* Let's fixup BE commands */
cmd - > raw_cmd [ 0 ] = cpu_to_le64 ( cmd - > raw_cmd [ 0 ] ) ;
cmd - > raw_cmd [ 1 ] = cpu_to_le64 ( cmd - > raw_cmd [ 1 ] ) ;
cmd - > raw_cmd [ 2 ] = cpu_to_le64 ( cmd - > raw_cmd [ 2 ] ) ;
cmd - > raw_cmd [ 3 ] = cpu_to_le64 ( cmd - > raw_cmd [ 3 ] ) ;
}
static struct its_collection * its_build_mapd_cmd ( struct its_cmd_block * cmd ,
struct its_cmd_desc * desc )
{
unsigned long itt_addr ;
2014-12-12 10:51:24 +00:00
u8 size = ilog2 ( desc - > its_mapd_cmd . dev - > nr_ites ) ;
2014-11-24 14:35:11 +00:00
itt_addr = virt_to_phys ( desc - > its_mapd_cmd . dev - > itt ) ;
itt_addr = ALIGN ( itt_addr , ITS_ITT_ALIGN ) ;
its_encode_cmd ( cmd , GITS_CMD_MAPD ) ;
its_encode_devid ( cmd , desc - > its_mapd_cmd . dev - > device_id ) ;
its_encode_size ( cmd , size - 1 ) ;
its_encode_itt ( cmd , itt_addr ) ;
its_encode_valid ( cmd , desc - > its_mapd_cmd . valid ) ;
its_fixup_cmd ( cmd ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
return NULL ;
2014-11-24 14:35:11 +00:00
}
static struct its_collection * its_build_mapc_cmd ( struct its_cmd_block * cmd ,
struct its_cmd_desc * desc )
{
its_encode_cmd ( cmd , GITS_CMD_MAPC ) ;
its_encode_collection ( cmd , desc - > its_mapc_cmd . col - > col_id ) ;
its_encode_target ( cmd , desc - > its_mapc_cmd . col - > target_address ) ;
its_encode_valid ( cmd , desc - > its_mapc_cmd . valid ) ;
its_fixup_cmd ( cmd ) ;
return desc - > its_mapc_cmd . col ;
}
2016-12-20 15:52:26 +00:00
static struct its_collection * its_build_mapti_cmd ( struct its_cmd_block * cmd ,
2014-11-24 14:35:11 +00:00
struct its_cmd_desc * desc )
{
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
struct its_collection * col ;
2016-12-20 15:52:26 +00:00
col = dev_event_to_col ( desc - > its_mapti_cmd . dev ,
desc - > its_mapti_cmd . event_id ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
2016-12-20 15:52:26 +00:00
its_encode_cmd ( cmd , GITS_CMD_MAPTI ) ;
its_encode_devid ( cmd , desc - > its_mapti_cmd . dev - > device_id ) ;
its_encode_event_id ( cmd , desc - > its_mapti_cmd . event_id ) ;
its_encode_phys_id ( cmd , desc - > its_mapti_cmd . phys_id ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
its_encode_collection ( cmd , col - > col_id ) ;
2014-11-24 14:35:11 +00:00
its_fixup_cmd ( cmd ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
return col ;
2014-11-24 14:35:11 +00:00
}
static struct its_collection * its_build_movi_cmd ( struct its_cmd_block * cmd ,
struct its_cmd_desc * desc )
{
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
struct its_collection * col ;
col = dev_event_to_col ( desc - > its_movi_cmd . dev ,
desc - > its_movi_cmd . event_id ) ;
2014-11-24 14:35:11 +00:00
its_encode_cmd ( cmd , GITS_CMD_MOVI ) ;
its_encode_devid ( cmd , desc - > its_movi_cmd . dev - > device_id ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
its_encode_event_id ( cmd , desc - > its_movi_cmd . event_id ) ;
2014-11-24 14:35:11 +00:00
its_encode_collection ( cmd , desc - > its_movi_cmd . col - > col_id ) ;
its_fixup_cmd ( cmd ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
return col ;
2014-11-24 14:35:11 +00:00
}
static struct its_collection * its_build_discard_cmd ( struct its_cmd_block * cmd ,
struct its_cmd_desc * desc )
{
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
struct its_collection * col ;
col = dev_event_to_col ( desc - > its_discard_cmd . dev ,
desc - > its_discard_cmd . event_id ) ;
2014-11-24 14:35:11 +00:00
its_encode_cmd ( cmd , GITS_CMD_DISCARD ) ;
its_encode_devid ( cmd , desc - > its_discard_cmd . dev - > device_id ) ;
its_encode_event_id ( cmd , desc - > its_discard_cmd . event_id ) ;
its_fixup_cmd ( cmd ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
return col ;
2014-11-24 14:35:11 +00:00
}
static struct its_collection * its_build_inv_cmd ( struct its_cmd_block * cmd ,
struct its_cmd_desc * desc )
{
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
struct its_collection * col ;
col = dev_event_to_col ( desc - > its_inv_cmd . dev ,
desc - > its_inv_cmd . event_id ) ;
2014-11-24 14:35:11 +00:00
its_encode_cmd ( cmd , GITS_CMD_INV ) ;
its_encode_devid ( cmd , desc - > its_inv_cmd . dev - > device_id ) ;
its_encode_event_id ( cmd , desc - > its_inv_cmd . event_id ) ;
its_fixup_cmd ( cmd ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
return col ;
2014-11-24 14:35:11 +00:00
}
static struct its_collection * its_build_invall_cmd ( struct its_cmd_block * cmd ,
struct its_cmd_desc * desc )
{
its_encode_cmd ( cmd , GITS_CMD_INVALL ) ;
its_encode_collection ( cmd , desc - > its_mapc_cmd . col - > col_id ) ;
its_fixup_cmd ( cmd ) ;
return NULL ;
}
static u64 its_cmd_ptr_to_offset ( struct its_node * its ,
struct its_cmd_block * ptr )
{
return ( ptr - its - > cmd_base ) * sizeof ( * ptr ) ;
}
static int its_queue_full ( struct its_node * its )
{
int widx ;
int ridx ;
widx = its - > cmd_write - its - > cmd_base ;
ridx = readl_relaxed ( its - > base + GITS_CREADR ) / sizeof ( struct its_cmd_block ) ;
/* This is incredibly unlikely to happen, unless the ITS locks up. */
if ( ( ( widx + 1 ) % ITS_CMD_QUEUE_NR_ENTRIES ) = = ridx )
return 1 ;
return 0 ;
}
static struct its_cmd_block * its_allocate_entry ( struct its_node * its )
{
struct its_cmd_block * cmd ;
u32 count = 1000000 ; /* 1s! */
while ( its_queue_full ( its ) ) {
count - - ;
if ( ! count ) {
pr_err_ratelimited ( " ITS queue not draining \n " ) ;
return NULL ;
}
cpu_relax ( ) ;
udelay ( 1 ) ;
}
cmd = its - > cmd_write + + ;
/* Handle queue wrapping */
if ( its - > cmd_write = = ( its - > cmd_base + ITS_CMD_QUEUE_NR_ENTRIES ) )
its - > cmd_write = its - > cmd_base ;
2016-12-19 17:16:45 +00:00
/* Clear command */
cmd - > raw_cmd [ 0 ] = 0 ;
cmd - > raw_cmd [ 1 ] = 0 ;
cmd - > raw_cmd [ 2 ] = 0 ;
cmd - > raw_cmd [ 3 ] = 0 ;
2014-11-24 14:35:11 +00:00
return cmd ;
}
static struct its_cmd_block * its_post_commands ( struct its_node * its )
{
u64 wr = its_cmd_ptr_to_offset ( its , its - > cmd_write ) ;
writel_relaxed ( wr , its - > base + GITS_CWRITER ) ;
return its - > cmd_write ;
}
static void its_flush_cmd ( struct its_node * its , struct its_cmd_block * cmd )
{
/*
* Make sure the commands written to memory are observable by
* the ITS .
*/
if ( its - > flags & ITS_FLAGS_CMDQ_NEEDS_FLUSHING )
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( cmd , sizeof ( * cmd ) ) ;
2014-11-24 14:35:11 +00:00
else
dsb ( ishst ) ;
}
static void its_wait_for_range_completion ( struct its_node * its ,
struct its_cmd_block * from ,
struct its_cmd_block * to )
{
u64 rd_idx , from_idx , to_idx ;
u32 count = 1000000 ; /* 1s! */
from_idx = its_cmd_ptr_to_offset ( its , from ) ;
to_idx = its_cmd_ptr_to_offset ( its , to ) ;
while ( 1 ) {
rd_idx = readl_relaxed ( its - > base + GITS_CREADR ) ;
if ( rd_idx > = to_idx | | rd_idx < from_idx )
break ;
count - - ;
if ( ! count ) {
pr_err_ratelimited ( " ITS queue timeout \n " ) ;
return ;
}
cpu_relax ( ) ;
udelay ( 1 ) ;
}
}
static void its_send_single_command ( struct its_node * its ,
its_cmd_builder_t builder ,
struct its_cmd_desc * desc )
{
struct its_cmd_block * cmd , * sync_cmd , * next_cmd ;
struct its_collection * sync_col ;
2015-03-06 16:37:43 +00:00
unsigned long flags ;
2014-11-24 14:35:11 +00:00
2015-03-06 16:37:43 +00:00
raw_spin_lock_irqsave ( & its - > lock , flags ) ;
2014-11-24 14:35:11 +00:00
cmd = its_allocate_entry ( its ) ;
if ( ! cmd ) { /* We're soooooo screewed... */
pr_err_ratelimited ( " ITS can't allocate, dropping command \n " ) ;
2015-03-06 16:37:43 +00:00
raw_spin_unlock_irqrestore ( & its - > lock , flags ) ;
2014-11-24 14:35:11 +00:00
return ;
}
sync_col = builder ( cmd , desc ) ;
its_flush_cmd ( its , cmd ) ;
if ( sync_col ) {
sync_cmd = its_allocate_entry ( its ) ;
if ( ! sync_cmd ) {
pr_err_ratelimited ( " ITS can't SYNC, skipping \n " ) ;
goto post ;
}
its_encode_cmd ( sync_cmd , GITS_CMD_SYNC ) ;
its_encode_target ( sync_cmd , sync_col - > target_address ) ;
its_fixup_cmd ( sync_cmd ) ;
its_flush_cmd ( its , sync_cmd ) ;
}
post :
next_cmd = its_post_commands ( its ) ;
2015-03-06 16:37:43 +00:00
raw_spin_unlock_irqrestore ( & its - > lock , flags ) ;
2014-11-24 14:35:11 +00:00
its_wait_for_range_completion ( its , cmd , next_cmd ) ;
}
static void its_send_inv ( struct its_device * dev , u32 event_id )
{
struct its_cmd_desc desc ;
desc . its_inv_cmd . dev = dev ;
desc . its_inv_cmd . event_id = event_id ;
its_send_single_command ( dev - > its , its_build_inv_cmd , & desc ) ;
}
static void its_send_mapd ( struct its_device * dev , int valid )
{
struct its_cmd_desc desc ;
desc . its_mapd_cmd . dev = dev ;
desc . its_mapd_cmd . valid = ! ! valid ;
its_send_single_command ( dev - > its , its_build_mapd_cmd , & desc ) ;
}
static void its_send_mapc ( struct its_node * its , struct its_collection * col ,
int valid )
{
struct its_cmd_desc desc ;
desc . its_mapc_cmd . col = col ;
desc . its_mapc_cmd . valid = ! ! valid ;
its_send_single_command ( its , its_build_mapc_cmd , & desc ) ;
}
2016-12-20 15:52:26 +00:00
static void its_send_mapti ( struct its_device * dev , u32 irq_id , u32 id )
2014-11-24 14:35:11 +00:00
{
struct its_cmd_desc desc ;
2016-12-20 15:52:26 +00:00
desc . its_mapti_cmd . dev = dev ;
desc . its_mapti_cmd . phys_id = irq_id ;
desc . its_mapti_cmd . event_id = id ;
2014-11-24 14:35:11 +00:00
2016-12-20 15:52:26 +00:00
its_send_single_command ( dev - > its , its_build_mapti_cmd , & desc ) ;
2014-11-24 14:35:11 +00:00
}
static void its_send_movi ( struct its_device * dev ,
struct its_collection * col , u32 id )
{
struct its_cmd_desc desc ;
desc . its_movi_cmd . dev = dev ;
desc . its_movi_cmd . col = col ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
desc . its_movi_cmd . event_id = id ;
2014-11-24 14:35:11 +00:00
its_send_single_command ( dev - > its , its_build_movi_cmd , & desc ) ;
}
static void its_send_discard ( struct its_device * dev , u32 id )
{
struct its_cmd_desc desc ;
desc . its_discard_cmd . dev = dev ;
desc . its_discard_cmd . event_id = id ;
its_send_single_command ( dev - > its , its_build_discard_cmd , & desc ) ;
}
static void its_send_invall ( struct its_node * its , struct its_collection * col )
{
struct its_cmd_desc desc ;
desc . its_invall_cmd . col = col ;
its_send_single_command ( its , its_build_invall_cmd , & desc ) ;
}
2014-11-24 14:35:12 +00:00
/*
* irqchip functions - assumes MSI , mostly .
*/
static inline u32 its_get_event_id ( struct irq_data * d )
{
struct its_device * its_dev = irq_data_get_irq_chip_data ( d ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
return d - > hwirq - its_dev - > event_map . lpi_base ;
2014-11-24 14:35:12 +00:00
}
static void lpi_set_config ( struct irq_data * d , bool enable )
{
struct its_device * its_dev = irq_data_get_irq_chip_data ( d ) ;
irq_hw_number_t hwirq = d - > hwirq ;
u32 id = its_get_event_id ( d ) ;
u8 * cfg = page_address ( gic_rdists - > prop_page ) + hwirq - 8192 ;
if ( enable )
* cfg | = LPI_PROP_ENABLED ;
else
* cfg & = ~ LPI_PROP_ENABLED ;
/*
* Make the above write visible to the redistributors .
* And yes , we ' re flushing exactly : One . Single . Byte .
* Humpf . . .
*/
if ( gic_rdists - > flags & RDIST_FLAGS_PROPBASE_NEEDS_FLUSHING )
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( cfg , sizeof ( * cfg ) ) ;
2014-11-24 14:35:12 +00:00
else
dsb ( ishst ) ;
its_send_inv ( its_dev , id ) ;
}
static void its_mask_irq ( struct irq_data * d )
{
lpi_set_config ( d , false ) ;
}
static void its_unmask_irq ( struct irq_data * d )
{
lpi_set_config ( d , true ) ;
}
static int its_set_affinity ( struct irq_data * d , const struct cpumask * mask_val ,
bool force )
{
2016-05-25 15:29:20 +02:00
unsigned int cpu ;
const struct cpumask * cpu_mask = cpu_online_mask ;
2014-11-24 14:35:12 +00:00
struct its_device * its_dev = irq_data_get_irq_chip_data ( d ) ;
struct its_collection * target_col ;
u32 id = its_get_event_id ( d ) ;
2016-05-25 15:29:20 +02:00
/* lpi cannot be routed to a redistributor that is on a foreign node */
if ( its_dev - > its - > flags & ITS_FLAGS_WORKAROUND_CAVIUM_23144 ) {
if ( its_dev - > its - > numa_node > = 0 ) {
cpu_mask = cpumask_of_node ( its_dev - > its - > numa_node ) ;
if ( ! cpumask_intersects ( mask_val , cpu_mask ) )
return - EINVAL ;
}
}
cpu = cpumask_any_and ( mask_val , cpu_mask ) ;
2014-11-24 14:35:12 +00:00
if ( cpu > = nr_cpu_ids )
return - EINVAL ;
target_col = & its_dev - > its - > collections [ cpu ] ;
its_send_movi ( its_dev , target_col , id ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
its_dev - > event_map . col_map [ id ] = cpu ;
2014-11-24 14:35:12 +00:00
return IRQ_SET_MASK_OK_DONE ;
}
2014-11-24 14:35:16 +00:00
static void its_irq_compose_msi_msg ( struct irq_data * d , struct msi_msg * msg )
{
struct its_device * its_dev = irq_data_get_irq_chip_data ( d ) ;
struct its_node * its ;
u64 addr ;
its = its_dev - > its ;
addr = its - > phys_base + GITS_TRANSLATER ;
2016-11-02 11:54:03 +00:00
msg - > address_lo = lower_32_bits ( addr ) ;
msg - > address_hi = upper_32_bits ( addr ) ;
2014-11-24 14:35:16 +00:00
msg - > data = its_get_event_id ( d ) ;
2016-09-12 17:13:59 +01:00
iommu_dma_map_msi_msg ( d - > irq , msg ) ;
2014-11-24 14:35:16 +00:00
}
2014-11-24 14:35:12 +00:00
static struct irq_chip its_irq_chip = {
. name = " ITS " ,
. irq_mask = its_mask_irq ,
. irq_unmask = its_unmask_irq ,
2016-02-11 05:38:53 -08:00
. irq_eoi = irq_chip_eoi_parent ,
2014-11-24 14:35:12 +00:00
. irq_set_affinity = its_set_affinity ,
2014-11-24 14:35:16 +00:00
. irq_compose_msi_msg = its_irq_compose_msi_msg ,
} ;
2014-11-24 14:35:13 +00:00
/*
* How we allocate LPIs :
*
* The GIC has id_bits bits for interrupt identifiers . From there , we
* must subtract 8192 which are reserved for SGIs / PPIs / SPIs . Then , as
* we allocate LPIs by chunks of 32 , we can shift the whole thing by 5
* bits to the right .
*
* This gives us ( ( ( 1UL < < id_bits ) - 8192 ) > > 5 ) possible allocations .
*/
# define IRQS_PER_CHUNK_SHIFT 5
# define IRQS_PER_CHUNK (1 << IRQS_PER_CHUNK_SHIFT)
static unsigned long * lpi_bitmap ;
static u32 lpi_chunks ;
static DEFINE_SPINLOCK ( lpi_lock ) ;
static int its_lpi_to_chunk ( int lpi )
{
return ( lpi - 8192 ) > > IRQS_PER_CHUNK_SHIFT ;
}
static int its_chunk_to_lpi ( int chunk )
{
return ( chunk < < IRQS_PER_CHUNK_SHIFT ) + 8192 ;
}
2016-01-19 14:11:18 +01:00
static int __init its_lpi_init ( u32 id_bits )
2014-11-24 14:35:13 +00:00
{
lpi_chunks = its_lpi_to_chunk ( 1UL < < id_bits ) ;
lpi_bitmap = kzalloc ( BITS_TO_LONGS ( lpi_chunks ) * sizeof ( long ) ,
GFP_KERNEL ) ;
if ( ! lpi_bitmap ) {
lpi_chunks = 0 ;
return - ENOMEM ;
}
pr_info ( " ITS: Allocated %d chunks for LPIs \n " , ( int ) lpi_chunks ) ;
return 0 ;
}
static unsigned long * its_lpi_alloc_chunks ( int nr_irqs , int * base , int * nr_ids )
{
unsigned long * bitmap = NULL ;
int chunk_id ;
int nr_chunks ;
int i ;
nr_chunks = DIV_ROUND_UP ( nr_irqs , IRQS_PER_CHUNK ) ;
spin_lock ( & lpi_lock ) ;
do {
chunk_id = bitmap_find_next_zero_area ( lpi_bitmap , lpi_chunks ,
0 , nr_chunks , 0 ) ;
if ( chunk_id < lpi_chunks )
break ;
nr_chunks - - ;
} while ( nr_chunks > 0 ) ;
if ( ! nr_chunks )
goto out ;
bitmap = kzalloc ( BITS_TO_LONGS ( nr_chunks * IRQS_PER_CHUNK ) * sizeof ( long ) ,
GFP_ATOMIC ) ;
if ( ! bitmap )
goto out ;
for ( i = 0 ; i < nr_chunks ; i + + )
set_bit ( chunk_id + i , lpi_bitmap ) ;
* base = its_chunk_to_lpi ( chunk_id ) ;
* nr_ids = nr_chunks * IRQS_PER_CHUNK ;
out :
spin_unlock ( & lpi_lock ) ;
2015-10-02 16:44:05 +01:00
if ( ! bitmap )
* base = * nr_ids = 0 ;
2014-11-24 14:35:13 +00:00
return bitmap ;
}
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
static void its_lpi_free ( struct event_lpi_map * map )
2014-11-24 14:35:13 +00:00
{
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
int base = map - > lpi_base ;
int nr_ids = map - > nr_lpis ;
2014-11-24 14:35:13 +00:00
int lpi ;
spin_lock ( & lpi_lock ) ;
for ( lpi = base ; lpi < ( base + nr_ids ) ; lpi + = IRQS_PER_CHUNK ) {
int chunk = its_lpi_to_chunk ( lpi ) ;
BUG_ON ( chunk > lpi_chunks ) ;
if ( test_bit ( chunk , lpi_bitmap ) ) {
clear_bit ( chunk , lpi_bitmap ) ;
} else {
pr_err ( " Bad LPI chunk %d \n " , chunk ) ;
}
}
spin_unlock ( & lpi_lock ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
kfree ( map - > lpi_map ) ;
kfree ( map - > col_map ) ;
2014-11-24 14:35:13 +00:00
}
2014-11-24 14:35:14 +00:00
/*
* We allocate 64 kB for PROPBASE . That gives us at most 64 K LPIs to
* deal with ( one configuration byte per interrupt ) . PENDBASE has to
* be 64 kB aligned ( one bit per LPI , plus 8192 bits for SPI / PPI / SGI ) .
*/
# define LPI_PROPBASE_SZ SZ_64K
# define LPI_PENDBASE_SZ (LPI_PROPBASE_SZ / 8 + SZ_1K)
/*
* This is how many bits of ID we need , including the useless ones .
*/
# define LPI_NRBITS ilog2(LPI_PROPBASE_SZ + SZ_8K)
# define LPI_PROP_DEFAULT_PRIO 0xa0
static int __init its_alloc_lpi_tables ( void )
{
phys_addr_t paddr ;
gic_rdists - > prop_page = alloc_pages ( GFP_NOWAIT ,
get_order ( LPI_PROPBASE_SZ ) ) ;
if ( ! gic_rdists - > prop_page ) {
pr_err ( " Failed to allocate PROPBASE \n " ) ;
return - ENOMEM ;
}
paddr = page_to_phys ( gic_rdists - > prop_page ) ;
pr_info ( " GIC: using LPI property table @%pa \n " , & paddr ) ;
/* Priority 0xa0, Group-1, disabled */
memset ( page_address ( gic_rdists - > prop_page ) ,
LPI_PROP_DEFAULT_PRIO | LPI_PROP_GROUP1 ,
LPI_PROPBASE_SZ ) ;
/* Make sure the GIC will observe the written configuration */
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( page_address ( gic_rdists - > prop_page ) , LPI_PROPBASE_SZ ) ;
2014-11-24 14:35:14 +00:00
return 0 ;
}
static const char * its_base_type_string [ ] = {
[ GITS_BASER_TYPE_DEVICE ] = " Devices " ,
[ GITS_BASER_TYPE_VCPU ] = " Virtual CPUs " ,
2016-12-20 15:50:14 +00:00
[ GITS_BASER_TYPE_RESERVED3 ] = " Reserved (3) " ,
2014-11-24 14:35:14 +00:00
[ GITS_BASER_TYPE_COLLECTION ] = " Interrupt Collections " ,
[ GITS_BASER_TYPE_RESERVED5 ] = " Reserved (5) " ,
[ GITS_BASER_TYPE_RESERVED6 ] = " Reserved (6) " ,
[ GITS_BASER_TYPE_RESERVED7 ] = " Reserved (7) " ,
} ;
2016-06-06 18:17:28 -05:00
static u64 its_read_baser ( struct its_node * its , struct its_baser * baser )
{
u32 idx = baser - its - > tables ;
2016-11-02 11:54:06 +00:00
return gits_read_baser ( its - > base + GITS_BASER + ( idx < < 3 ) ) ;
2016-06-06 18:17:28 -05:00
}
static void its_write_baser ( struct its_node * its , struct its_baser * baser ,
u64 val )
{
u32 idx = baser - its - > tables ;
2016-11-02 11:54:06 +00:00
gits_write_baser ( val , its - > base + GITS_BASER + ( idx < < 3 ) ) ;
2016-06-06 18:17:28 -05:00
baser - > val = its_read_baser ( its , baser ) ;
}
2016-06-06 18:17:30 -05:00
static int its_setup_baser ( struct its_node * its , struct its_baser * baser ,
2016-06-06 18:17:32 -05:00
u64 cache , u64 shr , u32 psz , u32 order ,
bool indirect )
2016-06-06 18:17:30 -05:00
{
u64 val = its_read_baser ( its , baser ) ;
u64 esz = GITS_BASER_ENTRY_SIZE ( val ) ;
u64 type = GITS_BASER_TYPE ( val ) ;
u32 alloc_pages ;
void * base ;
u64 tmp ;
retry_alloc_baser :
alloc_pages = ( PAGE_ORDER_TO_SIZE ( order ) / psz ) ;
if ( alloc_pages > GITS_BASER_PAGES_MAX ) {
pr_warn ( " ITS@%pa: %s too large, reduce ITS pages %u->%u \n " ,
& its - > phys_base , its_base_type_string [ type ] ,
alloc_pages , GITS_BASER_PAGES_MAX ) ;
alloc_pages = GITS_BASER_PAGES_MAX ;
order = get_order ( GITS_BASER_PAGES_MAX * psz ) ;
}
base = ( void * ) __get_free_pages ( GFP_KERNEL | __GFP_ZERO , order ) ;
if ( ! base )
return - ENOMEM ;
retry_baser :
val = ( virt_to_phys ( base ) |
( type < < GITS_BASER_TYPE_SHIFT ) |
( ( esz - 1 ) < < GITS_BASER_ENTRY_SIZE_SHIFT ) |
( ( alloc_pages - 1 ) < < GITS_BASER_PAGES_SHIFT ) |
cache |
shr |
GITS_BASER_VALID ) ;
2016-06-06 18:17:32 -05:00
val | = indirect ? GITS_BASER_INDIRECT : 0x0 ;
2016-06-06 18:17:30 -05:00
switch ( psz ) {
case SZ_4K :
val | = GITS_BASER_PAGE_SIZE_4K ;
break ;
case SZ_16K :
val | = GITS_BASER_PAGE_SIZE_16K ;
break ;
case SZ_64K :
val | = GITS_BASER_PAGE_SIZE_64K ;
break ;
}
its_write_baser ( its , baser , val ) ;
tmp = baser - > val ;
if ( ( val ^ tmp ) & GITS_BASER_SHAREABILITY_MASK ) {
/*
* Shareability didn ' t stick . Just use
* whatever the read reported , which is likely
* to be the only thing this redistributor
* supports . If that ' s zero , make it
* non - cacheable as well .
*/
shr = tmp & GITS_BASER_SHAREABILITY_MASK ;
if ( ! shr ) {
cache = GITS_BASER_nC ;
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( base , PAGE_ORDER_TO_SIZE ( order ) ) ;
2016-06-06 18:17:30 -05:00
}
goto retry_baser ;
}
if ( ( val ^ tmp ) & GITS_BASER_PAGE_SIZE_MASK ) {
/*
* Page size didn ' t stick . Let ' s try a smaller
* size and retry . If we reach 4 K , then
* something is horribly wrong . . .
*/
free_pages ( ( unsigned long ) base , order ) ;
baser - > base = NULL ;
switch ( psz ) {
case SZ_16K :
psz = SZ_4K ;
goto retry_alloc_baser ;
case SZ_64K :
psz = SZ_16K ;
goto retry_alloc_baser ;
}
}
if ( val ! = tmp ) {
2016-11-02 11:54:03 +00:00
pr_err ( " ITS@%pa: %s doesn't stick: %llx %llx \n " ,
2016-06-06 18:17:30 -05:00
& its - > phys_base , its_base_type_string [ type ] ,
2016-11-02 11:54:03 +00:00
val , tmp ) ;
2016-06-06 18:17:30 -05:00
free_pages ( ( unsigned long ) base , order ) ;
return - ENXIO ;
}
baser - > order = order ;
baser - > base = base ;
baser - > psz = psz ;
2016-06-06 18:17:32 -05:00
tmp = indirect ? GITS_LVL1_ENTRY_SIZE : esz ;
2016-06-06 18:17:30 -05:00
2016-06-06 18:17:32 -05:00
pr_info ( " ITS@%pa: allocated %d %s @%lx (%s, esz %d, psz %dK, shr %d) \n " ,
2016-11-02 11:54:04 +00:00
& its - > phys_base , ( int ) ( PAGE_ORDER_TO_SIZE ( order ) / ( int ) tmp ) ,
2016-06-06 18:17:30 -05:00
its_base_type_string [ type ] ,
( unsigned long ) virt_to_phys ( base ) ,
2016-06-06 18:17:32 -05:00
indirect ? " indirect " : " flat " , ( int ) esz ,
2016-06-06 18:17:30 -05:00
psz / SZ_1K , ( int ) shr > > GITS_BASER_SHAREABILITY_SHIFT ) ;
return 0 ;
}
2016-06-06 18:17:32 -05:00
static bool its_parse_baser_device ( struct its_node * its , struct its_baser * baser ,
u32 psz , u32 * order )
2016-06-06 18:17:29 -05:00
{
u64 esz = GITS_BASER_ENTRY_SIZE ( its_read_baser ( its , baser ) ) ;
2017-01-25 21:51:41 -06:00
u64 val = GITS_BASER_InnerShareable | GITS_BASER_RaWaWb ;
2016-06-06 18:17:29 -05:00
u32 ids = its - > device_ids ;
u32 new_order = * order ;
2016-06-06 18:17:32 -05:00
bool indirect = false ;
/* No need to enable Indirection if memory requirement < (psz*2)bytes */
if ( ( esz < < ids ) > ( psz * 2 ) ) {
/*
* Find out whether hw supports a single or two - level table by
* table by reading bit at offset ' 62 ' after writing ' 1 ' to it .
*/
its_write_baser ( its , baser , val | GITS_BASER_INDIRECT ) ;
indirect = ! ! ( baser - > val & GITS_BASER_INDIRECT ) ;
if ( indirect ) {
/*
* The size of the lvl2 table is equal to ITS page size
* which is ' psz ' . For computing lvl1 table size ,
* subtract ID bits that sparse lvl2 table from ' ids '
* which is reported by ITS hardware times lvl1 table
* entry size .
*/
2016-11-02 11:54:04 +00:00
ids - = ilog2 ( psz / ( int ) esz ) ;
2016-06-06 18:17:32 -05:00
esz = GITS_LVL1_ENTRY_SIZE ;
}
}
2016-06-06 18:17:29 -05:00
/*
* Allocate as many entries as required to fit the
* range of device IDs that the ITS can grok . . . The ID
* space being incredibly sparse , this results in a
2016-06-06 18:17:32 -05:00
* massive waste of memory if two - level device table
* feature is not supported by hardware .
2016-06-06 18:17:29 -05:00
*/
new_order = max_t ( u32 , get_order ( esz < < ids ) , new_order ) ;
if ( new_order > = MAX_ORDER ) {
new_order = MAX_ORDER - 1 ;
2016-11-02 11:54:04 +00:00
ids = ilog2 ( PAGE_ORDER_TO_SIZE ( new_order ) / ( int ) esz ) ;
2016-06-06 18:17:29 -05:00
pr_warn ( " ITS@%pa: Device Table too large, reduce ids %u->%u \n " ,
& its - > phys_base , its - > device_ids , ids ) ;
}
* order = new_order ;
2016-06-06 18:17:32 -05:00
return indirect ;
2016-06-06 18:17:29 -05:00
}
2014-11-24 14:35:14 +00:00
static void its_free_tables ( struct its_node * its )
{
int i ;
for ( i = 0 ; i < GITS_BASER_NR_REGS ; i + + ) {
2016-02-01 20:19:44 -06:00
if ( its - > tables [ i ] . base ) {
free_pages ( ( unsigned long ) its - > tables [ i ] . base ,
its - > tables [ i ] . order ) ;
its - > tables [ i ] . base = NULL ;
2014-11-24 14:35:14 +00:00
}
}
}
2016-06-06 18:17:31 -05:00
static int its_alloc_tables ( struct its_node * its )
2014-11-24 14:35:14 +00:00
{
2016-10-14 15:13:07 +01:00
u64 typer = gic_read_typer ( its - > base + GITS_TYPER ) ;
2016-06-06 18:17:30 -05:00
u32 ids = GITS_TYPER_DEVBITS ( typer ) ;
2014-11-24 14:35:14 +00:00
u64 shr = GITS_BASER_InnerShareable ;
2017-01-25 21:51:41 -06:00
u64 cache = GITS_BASER_RaWaWb ;
2016-06-06 18:17:30 -05:00
u32 psz = SZ_64K ;
int err , i ;
2015-09-21 22:58:38 +02:00
if ( its - > flags & ITS_FLAGS_WORKAROUND_CAVIUM_22375 ) {
/*
2016-06-06 18:17:30 -05:00
* erratum 22375 : only alloc 8 MB table size
* erratum 24313 : ignore memory access type
*/
cache = GITS_BASER_nCnB ;
ids = 0x14 ; /* 20 bits, 8MB */
2015-09-21 22:58:38 +02:00
}
2014-11-24 14:35:14 +00:00
2016-03-09 22:10:49 -06:00
its - > device_ids = ids ;
2014-11-24 14:35:14 +00:00
for ( i = 0 ; i < GITS_BASER_NR_REGS ; i + + ) {
2016-06-06 18:17:28 -05:00
struct its_baser * baser = its - > tables + i ;
u64 val = its_read_baser ( its , baser ) ;
2014-11-24 14:35:14 +00:00
u64 type = GITS_BASER_TYPE ( val ) ;
2016-06-06 18:17:30 -05:00
u32 order = get_order ( psz ) ;
2016-06-06 18:17:32 -05:00
bool indirect = false ;
2014-11-24 14:35:14 +00:00
if ( type = = GITS_BASER_TYPE_NONE )
continue ;
2016-06-06 18:17:29 -05:00
if ( type = = GITS_BASER_TYPE_DEVICE )
2016-06-06 18:17:32 -05:00
indirect = its_parse_baser_device ( its , baser , psz , & order ) ;
2015-03-06 16:37:41 +00:00
2016-06-06 18:17:32 -05:00
err = its_setup_baser ( its , baser , cache , shr , psz , order , indirect ) ;
2016-06-06 18:17:30 -05:00
if ( err < 0 ) {
its_free_tables ( its ) ;
return err ;
2014-11-24 14:35:14 +00:00
}
2016-06-06 18:17:30 -05:00
/* Update settings which will be used for next BASERn */
psz = baser - > psz ;
cache = baser - > val & GITS_BASER_CACHEABILITY_MASK ;
shr = baser - > val & GITS_BASER_SHAREABILITY_MASK ;
2014-11-24 14:35:14 +00:00
}
return 0 ;
}
static int its_alloc_collections ( struct its_node * its )
{
its - > collections = kzalloc ( nr_cpu_ids * sizeof ( * its - > collections ) ,
GFP_KERNEL ) ;
if ( ! its - > collections )
return - ENOMEM ;
return 0 ;
}
static void its_cpu_init_lpis ( void )
{
void __iomem * rbase = gic_data_rdist_rd_base ( ) ;
struct page * pend_page ;
u64 val , tmp ;
/* If we didn't allocate the pending table yet, do it now */
pend_page = gic_data_rdist ( ) - > pend_page ;
if ( ! pend_page ) {
phys_addr_t paddr ;
/*
* The pending pages have to be at least 64 kB aligned ,
* hence the ' max ( LPI_PENDBASE_SZ , SZ_64K ) ' below .
*/
pend_page = alloc_pages ( GFP_NOWAIT | __GFP_ZERO ,
get_order ( max ( LPI_PENDBASE_SZ , SZ_64K ) ) ) ;
if ( ! pend_page ) {
pr_err ( " Failed to allocate PENDBASE for CPU%d \n " ,
smp_processor_id ( ) ) ;
return ;
}
/* Make sure the GIC will observe the zero-ed page */
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( page_address ( pend_page ) , LPI_PENDBASE_SZ ) ;
2014-11-24 14:35:14 +00:00
paddr = page_to_phys ( pend_page ) ;
pr_info ( " CPU%d: using LPI pending table @%pa \n " ,
smp_processor_id ( ) , & paddr ) ;
gic_data_rdist ( ) - > pend_page = pend_page ;
}
/* Disable LPIs */
val = readl_relaxed ( rbase + GICR_CTLR ) ;
val & = ~ GICR_CTLR_ENABLE_LPIS ;
writel_relaxed ( val , rbase + GICR_CTLR ) ;
/*
* Make sure any change to the table is observable by the GIC .
*/
dsb ( sy ) ;
/* set PROPBASE */
val = ( page_to_phys ( gic_rdists - > prop_page ) |
GICR_PROPBASER_InnerShareable |
2017-01-25 21:51:41 -06:00
GICR_PROPBASER_RaWaWb |
2014-11-24 14:35:14 +00:00
( ( LPI_NRBITS - 1 ) & GICR_PROPBASER_IDBITS_MASK ) ) ;
2016-11-02 11:54:06 +00:00
gicr_write_propbaser ( val , rbase + GICR_PROPBASER ) ;
tmp = gicr_read_propbaser ( rbase + GICR_PROPBASER ) ;
2014-11-24 14:35:14 +00:00
if ( ( tmp ^ val ) & GICR_PROPBASER_SHAREABILITY_MASK ) {
2015-03-27 14:15:05 +00:00
if ( ! ( tmp & GICR_PROPBASER_SHAREABILITY_MASK ) ) {
/*
* The HW reports non - shareable , we must
* remove the cacheability attributes as
* well .
*/
val & = ~ ( GICR_PROPBASER_SHAREABILITY_MASK |
GICR_PROPBASER_CACHEABILITY_MASK ) ;
val | = GICR_PROPBASER_nC ;
2016-11-02 11:54:06 +00:00
gicr_write_propbaser ( val , rbase + GICR_PROPBASER ) ;
2015-03-27 14:15:05 +00:00
}
2014-11-24 14:35:14 +00:00
pr_info_once ( " GIC: using cache flushing for LPI property table \n " ) ;
gic_rdists - > flags | = RDIST_FLAGS_PROPBASE_NEEDS_FLUSHING ;
}
/* set PENDBASE */
val = ( page_to_phys ( pend_page ) |
2015-03-27 14:15:04 +00:00
GICR_PENDBASER_InnerShareable |
2017-01-25 21:51:41 -06:00
GICR_PENDBASER_RaWaWb ) ;
2014-11-24 14:35:14 +00:00
2016-11-02 11:54:06 +00:00
gicr_write_pendbaser ( val , rbase + GICR_PENDBASER ) ;
tmp = gicr_read_pendbaser ( rbase + GICR_PENDBASER ) ;
2015-03-27 14:15:05 +00:00
if ( ! ( tmp & GICR_PENDBASER_SHAREABILITY_MASK ) ) {
/*
* The HW reports non - shareable , we must remove the
* cacheability attributes as well .
*/
val & = ~ ( GICR_PENDBASER_SHAREABILITY_MASK |
GICR_PENDBASER_CACHEABILITY_MASK ) ;
val | = GICR_PENDBASER_nC ;
2016-11-02 11:54:06 +00:00
gicr_write_pendbaser ( val , rbase + GICR_PENDBASER ) ;
2015-03-27 14:15:05 +00:00
}
2014-11-24 14:35:14 +00:00
/* Enable LPIs */
val = readl_relaxed ( rbase + GICR_CTLR ) ;
val | = GICR_CTLR_ENABLE_LPIS ;
writel_relaxed ( val , rbase + GICR_CTLR ) ;
/* Make sure the GIC has seen the above */
dsb ( sy ) ;
}
static void its_cpu_init_collection ( void )
{
struct its_node * its ;
int cpu ;
spin_lock ( & its_lock ) ;
cpu = smp_processor_id ( ) ;
list_for_each_entry ( its , & its_nodes , entry ) {
u64 target ;
2016-05-25 15:29:20 +02:00
/* avoid cross node collections and its mapping */
if ( its - > flags & ITS_FLAGS_WORKAROUND_CAVIUM_23144 ) {
struct device_node * cpu_node ;
cpu_node = of_get_cpu_node ( cpu , NULL ) ;
if ( its - > numa_node ! = NUMA_NO_NODE & &
its - > numa_node ! = of_node_to_nid ( cpu_node ) )
continue ;
}
2014-11-24 14:35:14 +00:00
/*
* We now have to bind each collection to its target
* redistributor .
*/
2016-10-14 15:13:07 +01:00
if ( gic_read_typer ( its - > base + GITS_TYPER ) & GITS_TYPER_PTA ) {
2014-11-24 14:35:14 +00:00
/*
* This ITS wants the physical address of the
* redistributor .
*/
target = gic_data_rdist ( ) - > phys_base ;
} else {
/*
* This ITS wants a linear CPU number .
*/
2016-10-14 15:13:07 +01:00
target = gic_read_typer ( gic_data_rdist_rd_base ( ) + GICR_TYPER ) ;
2015-03-27 14:15:02 +00:00
target = GICR_TYPER_CPU_NUMBER ( target ) < < 16 ;
2014-11-24 14:35:14 +00:00
}
/* Perform collection mapping */
its - > collections [ cpu ] . target_address = target ;
its - > collections [ cpu ] . col_id = cpu ;
its_send_mapc ( its , & its - > collections [ cpu ] , 1 ) ;
its_send_invall ( its , & its - > collections [ cpu ] ) ;
}
spin_unlock ( & its_lock ) ;
}
2014-11-24 14:35:15 +00:00
static struct its_device * its_find_device ( struct its_node * its , u32 dev_id )
{
struct its_device * its_dev = NULL , * tmp ;
2015-03-06 16:37:43 +00:00
unsigned long flags ;
2014-11-24 14:35:15 +00:00
2015-03-06 16:37:43 +00:00
raw_spin_lock_irqsave ( & its - > lock , flags ) ;
2014-11-24 14:35:15 +00:00
list_for_each_entry ( tmp , & its - > its_device_list , entry ) {
if ( tmp - > device_id = = dev_id ) {
its_dev = tmp ;
break ;
}
}
2015-03-06 16:37:43 +00:00
raw_spin_unlock_irqrestore ( & its - > lock , flags ) ;
2014-11-24 14:35:15 +00:00
return its_dev ;
}
2016-03-09 22:10:49 -06:00
static struct its_baser * its_get_baser ( struct its_node * its , u32 type )
{
int i ;
for ( i = 0 ; i < GITS_BASER_NR_REGS ; i + + ) {
if ( GITS_BASER_TYPE ( its - > tables [ i ] . val ) = = type )
return & its - > tables [ i ] ;
}
return NULL ;
}
2016-06-06 18:17:32 -05:00
static bool its_alloc_device_table ( struct its_node * its , u32 dev_id )
{
struct its_baser * baser ;
struct page * page ;
u32 esz , idx ;
__le64 * table ;
baser = its_get_baser ( its , GITS_BASER_TYPE_DEVICE ) ;
/* Don't allow device id that exceeds ITS hardware limit */
if ( ! baser )
return ( ilog2 ( dev_id ) < its - > device_ids ) ;
/* Don't allow device id that exceeds single, flat table limit */
esz = GITS_BASER_ENTRY_SIZE ( baser - > val ) ;
if ( ! ( baser - > val & GITS_BASER_INDIRECT ) )
return ( dev_id < ( PAGE_ORDER_TO_SIZE ( baser - > order ) / esz ) ) ;
/* Compute 1st level table index & check if that exceeds table limit */
idx = dev_id > > ilog2 ( baser - > psz / esz ) ;
if ( idx > = ( PAGE_ORDER_TO_SIZE ( baser - > order ) / GITS_LVL1_ENTRY_SIZE ) )
return false ;
table = baser - > base ;
/* Allocate memory for 2nd level table */
if ( ! table [ idx ] ) {
page = alloc_pages ( GFP_KERNEL | __GFP_ZERO , get_order ( baser - > psz ) ) ;
if ( ! page )
return false ;
/* Flush Lvl2 table to PoC if hw doesn't support coherency */
if ( ! ( baser - > val & GITS_BASER_SHAREABILITY_MASK ) )
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( page_address ( page ) , baser - > psz ) ;
2016-06-06 18:17:32 -05:00
table [ idx ] = cpu_to_le64 ( page_to_phys ( page ) | GITS_BASER_VALID ) ;
/* Flush Lvl1 entry to PoC if hw doesn't support coherency */
if ( ! ( baser - > val & GITS_BASER_SHAREABILITY_MASK ) )
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( table + idx , GITS_LVL1_ENTRY_SIZE ) ;
2016-06-06 18:17:32 -05:00
/* Ensure updated table contents are visible to ITS hardware */
dsb ( sy ) ;
}
return true ;
}
2014-11-24 14:35:15 +00:00
static struct its_device * its_create_device ( struct its_node * its , u32 dev_id ,
int nvecs )
{
struct its_device * dev ;
unsigned long * lpi_map ;
2015-03-06 16:37:43 +00:00
unsigned long flags ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
u16 * col_map = NULL ;
2014-11-24 14:35:15 +00:00
void * itt ;
int lpi_base ;
int nr_lpis ;
2014-12-12 10:51:24 +00:00
int nr_ites ;
2014-11-24 14:35:15 +00:00
int sz ;
2016-06-06 18:17:32 -05:00
if ( ! its_alloc_device_table ( its , dev_id ) )
2016-03-09 22:10:49 -06:00
return NULL ;
2014-11-24 14:35:15 +00:00
dev = kzalloc ( sizeof ( * dev ) , GFP_KERNEL ) ;
2014-12-12 10:51:24 +00:00
/*
* At least one bit of EventID is being used , hence a minimum
* of two entries . No , the architecture doesn ' t let you
* express an ITT with a single entry .
*/
2014-12-17 14:11:09 +00:00
nr_ites = max ( 2UL , roundup_pow_of_two ( nvecs ) ) ;
2014-12-12 10:51:24 +00:00
sz = nr_ites * its - > ite_size ;
2014-11-24 14:35:15 +00:00
sz = max ( sz , ITS_ITT_ALIGN ) + ITS_ITT_ALIGN - 1 ;
2015-03-06 16:37:46 +00:00
itt = kzalloc ( sz , GFP_KERNEL ) ;
2014-11-24 14:35:15 +00:00
lpi_map = its_lpi_alloc_chunks ( nvecs , & lpi_base , & nr_lpis ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
if ( lpi_map )
col_map = kzalloc ( sizeof ( * col_map ) * nr_lpis , GFP_KERNEL ) ;
2014-11-24 14:35:15 +00:00
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
if ( ! dev | | ! itt | | ! lpi_map | | ! col_map ) {
2014-11-24 14:35:15 +00:00
kfree ( dev ) ;
kfree ( itt ) ;
kfree ( lpi_map ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
kfree ( col_map ) ;
2014-11-24 14:35:15 +00:00
return NULL ;
}
2016-11-02 11:54:05 +00:00
gic_flush_dcache_to_poc ( itt , sz ) ;
2015-09-13 12:14:32 +01:00
2014-11-24 14:35:15 +00:00
dev - > its = its ;
dev - > itt = itt ;
2014-12-12 10:51:24 +00:00
dev - > nr_ites = nr_ites ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
dev - > event_map . lpi_map = lpi_map ;
dev - > event_map . col_map = col_map ;
dev - > event_map . lpi_base = lpi_base ;
dev - > event_map . nr_lpis = nr_lpis ;
2014-11-24 14:35:15 +00:00
dev - > device_id = dev_id ;
INIT_LIST_HEAD ( & dev - > entry ) ;
2015-03-06 16:37:43 +00:00
raw_spin_lock_irqsave ( & its - > lock , flags ) ;
2014-11-24 14:35:15 +00:00
list_add ( & dev - > entry , & its - > its_device_list ) ;
2015-03-06 16:37:43 +00:00
raw_spin_unlock_irqrestore ( & its - > lock , flags ) ;
2014-11-24 14:35:15 +00:00
/* Map device to its ITT */
its_send_mapd ( dev , 1 ) ;
return dev ;
}
static void its_free_device ( struct its_device * its_dev )
{
2015-03-06 16:37:43 +00:00
unsigned long flags ;
raw_spin_lock_irqsave ( & its_dev - > its - > lock , flags ) ;
2014-11-24 14:35:15 +00:00
list_del ( & its_dev - > entry ) ;
2015-03-06 16:37:43 +00:00
raw_spin_unlock_irqrestore ( & its_dev - > its - > lock , flags ) ;
2014-11-24 14:35:15 +00:00
kfree ( its_dev - > itt ) ;
kfree ( its_dev ) ;
}
2014-11-24 14:35:16 +00:00
static int its_alloc_device_irq ( struct its_device * dev , irq_hw_number_t * hwirq )
{
int idx ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
idx = find_first_zero_bit ( dev - > event_map . lpi_map ,
dev - > event_map . nr_lpis ) ;
if ( idx = = dev - > event_map . nr_lpis )
2014-11-24 14:35:16 +00:00
return - ENOSPC ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
* hwirq = dev - > event_map . lpi_base + idx ;
set_bit ( idx , dev - > event_map . lpi_map ) ;
2014-11-24 14:35:16 +00:00
return 0 ;
}
2015-07-28 14:46:21 +01:00
static int its_msi_prepare ( struct irq_domain * domain , struct device * dev ,
int nvec , msi_alloc_info_t * info )
2015-03-06 16:37:42 +00:00
{
2014-11-24 14:35:16 +00:00
struct its_node * its ;
struct its_device * its_dev ;
2015-07-28 14:46:21 +01:00
struct msi_domain_info * msi_info ;
u32 dev_id ;
/*
* We ignore " dev " entierely , and rely on the dev_id that has
* been passed via the scratchpad . This limits this domain ' s
* usefulness to upper layers that definitely know that they
* are built on top of the ITS .
*/
dev_id = info - > scratchpad [ 0 ] . ul ;
msi_info = msi_get_domain_info ( domain ) ;
its = msi_info - > data ;
2015-03-06 16:37:42 +00:00
2015-07-28 14:46:18 +01:00
its_dev = its_find_device ( its , dev_id ) ;
2015-03-06 16:37:42 +00:00
if ( its_dev ) {
/*
* We already have seen this ID , probably through
* another alias ( PCI bridge of some sort ) . No need to
* create the device .
*/
2015-07-28 14:46:18 +01:00
pr_debug ( " Reusing ITT for devID %x \n " , dev_id ) ;
2015-03-06 16:37:42 +00:00
goto out ;
}
2014-11-24 14:35:16 +00:00
2015-07-28 14:46:18 +01:00
its_dev = its_create_device ( its , dev_id , nvec ) ;
2014-11-24 14:35:16 +00:00
if ( ! its_dev )
return - ENOMEM ;
2015-07-28 14:46:18 +01:00
pr_debug ( " ITT %d entries, %d bits \n " , nvec , ilog2 ( nvec ) ) ;
2015-03-06 16:37:42 +00:00
out :
2014-11-24 14:35:16 +00:00
info - > scratchpad [ 0 ] . ptr = its_dev ;
return 0 ;
}
2015-07-28 14:46:21 +01:00
static struct msi_domain_ops its_msi_domain_ops = {
. msi_prepare = its_msi_prepare ,
} ;
2014-11-24 14:35:16 +00:00
static int its_irq_gic_domain_alloc ( struct irq_domain * domain ,
unsigned int virq ,
irq_hw_number_t hwirq )
{
2015-10-13 12:51:33 +01:00
struct irq_fwspec fwspec ;
if ( irq_domain_get_of_node ( domain - > parent ) ) {
fwspec . fwnode = domain - > parent - > fwnode ;
fwspec . param_count = 3 ;
fwspec . param [ 0 ] = GIC_IRQ_TYPE_LPI ;
fwspec . param [ 1 ] = hwirq ;
fwspec . param [ 2 ] = IRQ_TYPE_EDGE_RISING ;
2016-09-12 20:32:25 +02:00
} else if ( is_fwnode_irqchip ( domain - > parent - > fwnode ) ) {
fwspec . fwnode = domain - > parent - > fwnode ;
fwspec . param_count = 2 ;
fwspec . param [ 0 ] = hwirq ;
fwspec . param [ 1 ] = IRQ_TYPE_EDGE_RISING ;
2015-10-13 12:51:33 +01:00
} else {
return - EINVAL ;
}
2014-11-24 14:35:16 +00:00
2015-10-13 12:51:33 +01:00
return irq_domain_alloc_irqs_parent ( domain , virq , 1 , & fwspec ) ;
2014-11-24 14:35:16 +00:00
}
static int its_irq_domain_alloc ( struct irq_domain * domain , unsigned int virq ,
unsigned int nr_irqs , void * args )
{
msi_alloc_info_t * info = args ;
struct its_device * its_dev = info - > scratchpad [ 0 ] . ptr ;
irq_hw_number_t hwirq ;
int err ;
int i ;
for ( i = 0 ; i < nr_irqs ; i + + ) {
err = its_alloc_device_irq ( its_dev , & hwirq ) ;
if ( err )
return err ;
err = its_irq_gic_domain_alloc ( domain , virq + i , hwirq ) ;
if ( err )
return err ;
irq_domain_set_hwirq_and_chip ( domain , virq + i ,
hwirq , & its_irq_chip , its_dev ) ;
2015-07-28 14:46:18 +01:00
pr_debug ( " ID:%d pID:%d vID:%d \n " ,
( int ) ( hwirq - its_dev - > event_map . lpi_base ) ,
( int ) hwirq , virq + i ) ;
2014-11-24 14:35:16 +00:00
}
return 0 ;
}
2014-12-12 10:51:23 +00:00
static void its_irq_domain_activate ( struct irq_domain * domain ,
struct irq_data * d )
{
struct its_device * its_dev = irq_data_get_irq_chip_data ( d ) ;
u32 event = its_get_event_id ( d ) ;
2016-05-25 15:29:20 +02:00
const struct cpumask * cpu_mask = cpu_online_mask ;
/* get the cpu_mask of local node */
if ( its_dev - > its - > numa_node > = 0 )
cpu_mask = cpumask_of_node ( its_dev - > its - > numa_node ) ;
2014-12-12 10:51:23 +00:00
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
/* Bind the LPI to the first possible CPU */
2016-05-25 15:29:20 +02:00
its_dev - > event_map . col_map [ event ] = cpumask_first ( cpu_mask ) ;
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
2014-12-12 10:51:23 +00:00
/* Map the GIC IRQ and event to the device */
2016-12-20 15:52:26 +00:00
its_send_mapti ( its_dev , d - > hwirq , event ) ;
2014-12-12 10:51:23 +00:00
}
static void its_irq_domain_deactivate ( struct irq_domain * domain ,
struct irq_data * d )
{
struct its_device * its_dev = irq_data_get_irq_chip_data ( d ) ;
u32 event = its_get_event_id ( d ) ;
/* Stop the delivery of interrupts */
its_send_discard ( its_dev , event ) ;
}
2014-11-24 14:35:16 +00:00
static void its_irq_domain_free ( struct irq_domain * domain , unsigned int virq ,
unsigned int nr_irqs )
{
struct irq_data * d = irq_domain_get_irq_data ( domain , virq ) ;
struct its_device * its_dev = irq_data_get_irq_chip_data ( d ) ;
int i ;
for ( i = 0 ; i < nr_irqs ; i + + ) {
struct irq_data * data = irq_domain_get_irq_data ( domain ,
virq + i ) ;
2014-12-12 10:51:23 +00:00
u32 event = its_get_event_id ( data ) ;
2014-11-24 14:35:16 +00:00
/* Mark interrupt index as unused */
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
clear_bit ( event , its_dev - > event_map . lpi_map ) ;
2014-11-24 14:35:16 +00:00
/* Nuke the entry in the domain */
2014-12-12 10:51:22 +00:00
irq_domain_reset_irq_data ( data ) ;
2014-11-24 14:35:16 +00:00
}
/* If all interrupts have been freed, start mopping the floor */
irqchip/gicv3-its: Fix mapping of LPIs to collections
The GICv3 ITS architecture allows a given [DevID, EventID] pair to be
translated to a [LPI, Collection] pair, where DevID is the device writing
the MSI, EventID is the payload being written, LPI is the actual
interrupt number, and Collection is roughly equivalent to a target CPU.
Each LPI can be mapped to a separate collection, but the ITS driver
insists on maintaining the collection on a device basis, instead of doing
it on a per interrupt basis.
This is obviously flawed, and this patch fixes it by adding a per interrupt
index that indicates which collection number is in use.
Reported-by: Ian Campbell <ian.campbell@citrix.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
Cc: <linux-arm-kernel@lists.infradead.org>
Cc: Jason Cooper <jason@lakedaemon.net>
Cc: stable@vger.kernel.org # 4.1, 4.0
Link: http://lkml.kernel.org/r/1437126402-11677-1-git-send-email-marc.zyngier@arm.com
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2015-07-17 10:46:42 +01:00
if ( bitmap_empty ( its_dev - > event_map . lpi_map ,
its_dev - > event_map . nr_lpis ) ) {
its_lpi_free ( & its_dev - > event_map ) ;
2014-11-24 14:35:16 +00:00
/* Unmap device/itt */
its_send_mapd ( its_dev , 0 ) ;
its_free_device ( its_dev ) ;
}
irq_domain_free_irqs_parent ( domain , virq , nr_irqs ) ;
}
static const struct irq_domain_ops its_domain_ops = {
. alloc = its_irq_domain_alloc ,
. free = its_irq_domain_free ,
2014-12-12 10:51:23 +00:00
. activate = its_irq_domain_activate ,
. deactivate = its_irq_domain_deactivate ,
2014-11-24 14:35:16 +00:00
} ;
2014-11-24 14:35:17 +00:00
2015-03-06 16:37:50 +00:00
static int its_force_quiescent ( void __iomem * base )
{
u32 count = 1000000 ; /* 1s */
u32 val ;
val = readl_relaxed ( base + GITS_CTLR ) ;
2016-08-18 15:41:58 -07:00
/*
* GIC architecture specification requires the ITS to be both
* disabled and quiescent for writes to GITS_BASER < n > or
* GITS_CBASER to not have UNPREDICTABLE results .
*/
if ( ( val & GITS_CTLR_QUIESCENT ) & & ! ( val & GITS_CTLR_ENABLE ) )
2015-03-06 16:37:50 +00:00
return 0 ;
/* Disable the generation of all interrupts to this ITS */
val & = ~ GITS_CTLR_ENABLE ;
writel_relaxed ( val , base + GITS_CTLR ) ;
/* Poll GITS_CTLR and wait until ITS becomes quiescent */
while ( 1 ) {
val = readl_relaxed ( base + GITS_CTLR ) ;
if ( val & GITS_CTLR_QUIESCENT )
return 0 ;
count - - ;
if ( ! count )
return - EBUSY ;
cpu_relax ( ) ;
udelay ( 1 ) ;
}
}
2015-09-21 22:58:38 +02:00
static void __maybe_unused its_enable_quirk_cavium_22375 ( void * data )
{
struct its_node * its = data ;
its - > flags | = ITS_FLAGS_WORKAROUND_CAVIUM_22375 ;
}
2016-05-25 15:29:20 +02:00
static void __maybe_unused its_enable_quirk_cavium_23144 ( void * data )
{
struct its_node * its = data ;
its - > flags | = ITS_FLAGS_WORKAROUND_CAVIUM_23144 ;
}
2015-09-21 22:58:37 +02:00
static const struct gic_quirk its_quirks [ ] = {
2015-09-21 22:58:38 +02:00
# ifdef CONFIG_CAVIUM_ERRATUM_22375
{
. desc = " ITS: Cavium errata 22375, 24313 " ,
. iidr = 0xa100034c , /* ThunderX pass 1.x */
. mask = 0xffff0fff ,
. init = its_enable_quirk_cavium_22375 ,
} ,
2016-05-25 15:29:20 +02:00
# endif
# ifdef CONFIG_CAVIUM_ERRATUM_23144
{
. desc = " ITS: Cavium erratum 23144 " ,
. iidr = 0xa100034c , /* ThunderX pass 1.x */
. mask = 0xffff0fff ,
. init = its_enable_quirk_cavium_23144 ,
} ,
2015-09-21 22:58:38 +02:00
# endif
2015-09-21 22:58:37 +02:00
{
}
} ;
static void its_enable_quirks ( struct its_node * its )
{
u32 iidr = readl_relaxed ( its - > base + GITS_IIDR ) ;
gic_enable_quirks ( iidr , its_quirks , its ) ;
}
2016-09-12 20:32:24 +02:00
static int its_init_domain ( struct fwnode_handle * handle , struct its_node * its )
2016-09-12 20:32:23 +02:00
{
struct irq_domain * inner_domain ;
struct msi_domain_info * info ;
info = kzalloc ( sizeof ( * info ) , GFP_KERNEL ) ;
if ( ! info )
return - ENOMEM ;
2016-09-12 20:32:24 +02:00
inner_domain = irq_domain_create_tree ( handle , & its_domain_ops , its ) ;
2016-09-12 20:32:23 +02:00
if ( ! inner_domain ) {
kfree ( info ) ;
return - ENOMEM ;
}
2016-09-12 20:32:24 +02:00
inner_domain - > parent = its_parent ;
2016-09-12 20:32:23 +02:00
inner_domain - > bus_token = DOMAIN_BUS_NEXUS ;
2017-01-19 20:58:00 +00:00
inner_domain - > flags | = IRQ_DOMAIN_FLAG_MSI_REMAP ;
2016-09-12 20:32:23 +02:00
info - > ops = & its_msi_domain_ops ;
info - > data = its ;
inner_domain - > host_data = info ;
return 0 ;
}
2016-09-12 20:32:24 +02:00
static int __init its_probe_one ( struct resource * res ,
struct fwnode_handle * handle , int numa_node )
2014-11-24 14:35:17 +00:00
{
struct its_node * its ;
void __iomem * its_base ;
u32 val ;
u64 baser , tmp ;
int err ;
2016-09-12 20:32:24 +02:00
its_base = ioremap ( res - > start , resource_size ( res ) ) ;
2014-11-24 14:35:17 +00:00
if ( ! its_base ) {
2016-09-12 20:32:24 +02:00
pr_warn ( " ITS@%pa: Unable to map ITS registers \n " , & res - > start ) ;
2014-11-24 14:35:17 +00:00
return - ENOMEM ;
}
val = readl_relaxed ( its_base + GITS_PIDR2 ) & GIC_PIDR2_ARCH_MASK ;
if ( val ! = 0x30 & & val ! = 0x40 ) {
2016-09-12 20:32:24 +02:00
pr_warn ( " ITS@%pa: No ITS detected, giving up \n " , & res - > start ) ;
2014-11-24 14:35:17 +00:00
err = - ENODEV ;
goto out_unmap ;
}
2015-03-06 16:37:50 +00:00
err = its_force_quiescent ( its_base ) ;
if ( err ) {
2016-09-12 20:32:24 +02:00
pr_warn ( " ITS@%pa: Failed to quiesce, giving up \n " , & res - > start ) ;
2015-03-06 16:37:50 +00:00
goto out_unmap ;
}
2016-09-12 20:32:24 +02:00
pr_info ( " ITS %pR \n " , res ) ;
2014-11-24 14:35:17 +00:00
its = kzalloc ( sizeof ( * its ) , GFP_KERNEL ) ;
if ( ! its ) {
err = - ENOMEM ;
goto out_unmap ;
}
raw_spin_lock_init ( & its - > lock ) ;
INIT_LIST_HEAD ( & its - > entry ) ;
INIT_LIST_HEAD ( & its - > its_device_list ) ;
its - > base = its_base ;
2016-09-12 20:32:24 +02:00
its - > phys_base = res - > start ;
2016-10-14 15:13:07 +01:00
its - > ite_size = ( ( gic_read_typer ( its_base + GITS_TYPER ) > > 4 ) & 0xf ) + 1 ;
2016-09-12 20:32:24 +02:00
its - > numa_node = numa_node ;
2014-11-24 14:35:17 +00:00
2017-02-01 18:38:25 +01:00
its - > cmd_base = ( void * ) __get_free_pages ( GFP_KERNEL | __GFP_ZERO ,
get_order ( ITS_CMD_QUEUE_SZ ) ) ;
2014-11-24 14:35:17 +00:00
if ( ! its - > cmd_base ) {
err = - ENOMEM ;
goto out_free_its ;
}
its - > cmd_write = its - > cmd_base ;
2015-09-21 22:58:37 +02:00
its_enable_quirks ( its ) ;
2016-06-06 18:17:31 -05:00
err = its_alloc_tables ( its ) ;
2014-11-24 14:35:17 +00:00
if ( err )
goto out_free_cmd ;
err = its_alloc_collections ( its ) ;
if ( err )
goto out_free_tables ;
baser = ( virt_to_phys ( its - > cmd_base ) |
2017-01-25 21:51:41 -06:00
GITS_CBASER_RaWaWb |
2014-11-24 14:35:17 +00:00
GITS_CBASER_InnerShareable |
( ITS_CMD_QUEUE_SZ / SZ_4K - 1 ) |
GITS_CBASER_VALID ) ;
2016-11-02 11:54:06 +00:00
gits_write_cbaser ( baser , its - > base + GITS_CBASER ) ;
tmp = gits_read_cbaser ( its - > base + GITS_CBASER ) ;
2014-11-24 14:35:17 +00:00
2015-03-27 14:15:04 +00:00
if ( ( tmp ^ baser ) & GITS_CBASER_SHAREABILITY_MASK ) {
2015-03-27 14:15:05 +00:00
if ( ! ( tmp & GITS_CBASER_SHAREABILITY_MASK ) ) {
/*
* The HW reports non - shareable , we must
* remove the cacheability attributes as
* well .
*/
baser & = ~ ( GITS_CBASER_SHAREABILITY_MASK |
GITS_CBASER_CACHEABILITY_MASK ) ;
baser | = GITS_CBASER_nC ;
2016-11-02 11:54:06 +00:00
gits_write_cbaser ( baser , its - > base + GITS_CBASER ) ;
2015-03-27 14:15:05 +00:00
}
2014-11-24 14:35:17 +00:00
pr_info ( " ITS: using cache flushing for cmd queue \n " ) ;
its - > flags | = ITS_FLAGS_CMDQ_NEEDS_FLUSHING ;
}
2016-11-02 11:54:06 +00:00
gits_write_cwriter ( 0 , its - > base + GITS_CWRITER ) ;
2015-03-27 14:15:05 +00:00
writel_relaxed ( GITS_CTLR_ENABLE , its - > base + GITS_CTLR ) ;
2016-09-12 20:32:24 +02:00
err = its_init_domain ( handle , its ) ;
2016-09-12 20:32:23 +02:00
if ( err )
goto out_free_tables ;
2014-11-24 14:35:17 +00:00
spin_lock ( & its_lock ) ;
list_add ( & its - > entry , & its_nodes ) ;
spin_unlock ( & its_lock ) ;
return 0 ;
out_free_tables :
its_free_tables ( its ) ;
out_free_cmd :
2017-02-01 18:38:25 +01:00
free_pages ( ( unsigned long ) its - > cmd_base , get_order ( ITS_CMD_QUEUE_SZ ) ) ;
2014-11-24 14:35:17 +00:00
out_free_its :
kfree ( its ) ;
out_unmap :
iounmap ( its_base ) ;
2016-09-12 20:32:24 +02:00
pr_err ( " ITS@%pa: failed probing (%d) \n " , & res - > start , err ) ;
2014-11-24 14:35:17 +00:00
return err ;
}
static bool gic_rdists_supports_plpis ( void )
{
2016-10-14 15:13:07 +01:00
return ! ! ( gic_read_typer ( gic_data_rdist_rd_base ( ) + GICR_TYPER ) & GICR_TYPER_PLPIS ) ;
2014-11-24 14:35:17 +00:00
}
int its_cpu_init ( void )
{
if ( ! list_empty ( & its_nodes ) ) {
2015-03-06 16:37:40 +00:00
if ( ! gic_rdists_supports_plpis ( ) ) {
pr_info ( " CPU%d: LPIs not supported \n " , smp_processor_id ( ) ) ;
return - ENXIO ;
}
2014-11-24 14:35:17 +00:00
its_cpu_init_lpis ( ) ;
its_cpu_init_collection ( ) ;
}
return 0 ;
}
static struct of_device_id its_device_id [ ] = {
{ . compatible = " arm,gic-v3-its " , } ,
{ } ,
} ;
2016-09-12 20:32:24 +02:00
static int __init its_of_probe ( struct device_node * node )
2014-11-24 14:35:17 +00:00
{
struct device_node * np ;
2016-09-12 20:32:24 +02:00
struct resource res ;
2014-11-24 14:35:17 +00:00
for ( np = of_find_matching_node ( node , its_device_id ) ; np ;
np = of_find_matching_node ( np , its_device_id ) ) {
2016-09-12 20:32:23 +02:00
if ( ! of_property_read_bool ( np , " msi-controller " ) ) {
pr_warn ( " %s: no msi-controller property, ITS ignored \n " ,
np - > full_name ) ;
continue ;
}
2016-09-12 20:32:24 +02:00
if ( of_address_to_resource ( np , 0 , & res ) ) {
pr_warn ( " %s: no regs? \n " , np - > full_name ) ;
continue ;
}
its_probe_one ( & res , & np - > fwnode , of_node_to_nid ( np ) ) ;
2014-11-24 14:35:17 +00:00
}
2016-09-12 20:32:24 +02:00
return 0 ;
}
2016-09-12 20:32:25 +02:00
# ifdef CONFIG_ACPI
# define ACPI_GICV3_ITS_MEM_SIZE (SZ_128K)
static int __init gic_acpi_parse_madt_its ( struct acpi_subtable_header * header ,
const unsigned long end )
{
struct acpi_madt_generic_translator * its_entry ;
struct fwnode_handle * dom_handle ;
struct resource res ;
int err ;
its_entry = ( struct acpi_madt_generic_translator * ) header ;
memset ( & res , 0 , sizeof ( res ) ) ;
res . start = its_entry - > base_address ;
res . end = its_entry - > base_address + ACPI_GICV3_ITS_MEM_SIZE - 1 ;
res . flags = IORESOURCE_MEM ;
dom_handle = irq_domain_alloc_fwnode ( ( void * ) its_entry - > base_address ) ;
if ( ! dom_handle ) {
pr_err ( " ITS@%pa: Unable to allocate GICv3 ITS domain token \n " ,
& res . start ) ;
return - ENOMEM ;
}
err = iort_register_domain_token ( its_entry - > translation_id , dom_handle ) ;
if ( err ) {
pr_err ( " ITS@%pa: Unable to register GICv3 ITS domain token (ITS ID %d) to IORT \n " ,
& res . start , its_entry - > translation_id ) ;
goto dom_err ;
}
err = its_probe_one ( & res , dom_handle , NUMA_NO_NODE ) ;
if ( ! err )
return 0 ;
iort_deregister_domain_token ( its_entry - > translation_id ) ;
dom_err :
irq_domain_free_fwnode ( dom_handle ) ;
return err ;
}
static void __init its_acpi_probe ( void )
{
acpi_table_parse_madt ( ACPI_MADT_TYPE_GENERIC_TRANSLATOR ,
gic_acpi_parse_madt_its , 0 ) ;
}
# else
static void __init its_acpi_probe ( void ) { }
# endif
2016-09-12 20:32:24 +02:00
int __init its_init ( struct fwnode_handle * handle , struct rdists * rdists ,
struct irq_domain * parent_domain )
{
struct device_node * of_node ;
its_parent = parent_domain ;
of_node = to_of_node ( handle ) ;
if ( of_node )
its_of_probe ( of_node ) ;
else
2016-09-12 20:32:25 +02:00
its_acpi_probe ( ) ;
2014-11-24 14:35:17 +00:00
if ( list_empty ( & its_nodes ) ) {
pr_warn ( " ITS: No ITS available, not enabling LPIs \n " ) ;
return - ENXIO ;
}
gic_rdists = rdists ;
its_alloc_lpi_tables ( ) ;
its_lpi_init ( rdists - > id_bits ) ;
return 0 ;
}