7c3dc440b1
- CXL RAM region enumeration: instantiate 'struct cxl_region' objects for platform firmware created memory regions - CXL RAM region provisioning: complement the existing PMEM region creation support with RAM region support - "Soft Reservation" policy change: Online (memory hot-add) soft-reserved memory (EFI_MEMORY_SP) by default, but still allow for setting aside such memory for dedicated access via device-dax. - CXL Events and Interrupts: Takeover CXL event handling from platform-firmware (ACPI calls this CXL Memory Error Reporting) and export CXL Events via Linux Trace Events. - Convey CXL _OSC results to drivers: Similar to PCI, let the CXL subsystem interrogate the result of CXL _OSC negotiation. - Emulate CXL DVSEC Range Registers as "decoders": Allow for first-generation devices that pre-date the definition of the CXL HDM Decoder Capability to translate the CXL DVSEC Range Registers into 'struct cxl_decoder' objects. - Set timestamp: Per spec, set the device timestamp in case of hotplug, or if platform-firwmare failed to set it. - General fixups: linux-next build issues, non-urgent fixes for pre-production hardware, unit test fixes, spelling and debug message improvements. -----BEGIN PGP SIGNATURE----- iHUEABYKAB0WIQSbo+XnGs+rwLz9XGXfioYZHlFsZwUCY/WYcgAKCRDfioYZHlFs Z6m3APkBUtiEEm1o8ikdu5llUS1OTLBwqjJDwGMTyf8X/WDXhgD+J2mLsCgARS7X 5IS0RAtefutrW5sQpUucPM7QiLuraAY= =kOXC -----END PGP SIGNATURE----- Merge tag 'cxl-for-6.3' of git://git.kernel.org/pub/scm/linux/kernel/git/cxl/cxl Pull Compute Express Link (CXL) updates from Dan Williams: "To date Linux has been dependent on platform-firmware to map CXL RAM regions and handle events / errors from devices. With this update we can now parse / update the CXL memory layout, and report events / errors from devices. This is a precursor for the CXL subsystem to handle the end-to-end "RAS" flow for CXL memory. i.e. the flow that for DDR-attached-DRAM is handled by the EDAC driver where it maps system physical address events to a field-replaceable-unit (FRU / endpoint device). In general, CXL has the potential to standardize what has historically been a pile of memory-controller-specific error handling logic. Another change of note is the default policy for handling RAM-backed device-dax instances. Previously the default access mode was "device", mmap(2) a device special file to access memory. The new default is "kmem" where the address range is assigned to the core-mm via add_memory_driver_managed(). This saves typical users from wondering why their platform memory is not visible via free(1) and stuck behind a device-file. At the same time it allows expert users to deploy policy to, for example, get dedicated access to high performance memory, or hide low performance memory from general purpose kernel allocations. This affects not only CXL, but also systems with high-bandwidth-memory that platform-firmware tags with the EFI_MEMORY_SP (special purpose) designation. Summary: - CXL RAM region enumeration: instantiate 'struct cxl_region' objects for platform firmware created memory regions - CXL RAM region provisioning: complement the existing PMEM region creation support with RAM region support - "Soft Reservation" policy change: Online (memory hot-add) soft-reserved memory (EFI_MEMORY_SP) by default, but still allow for setting aside such memory for dedicated access via device-dax. - CXL Events and Interrupts: Takeover CXL event handling from platform-firmware (ACPI calls this CXL Memory Error Reporting) and export CXL Events via Linux Trace Events. - Convey CXL _OSC results to drivers: Similar to PCI, let the CXL subsystem interrogate the result of CXL _OSC negotiation. - Emulate CXL DVSEC Range Registers as "decoders": Allow for first-generation devices that pre-date the definition of the CXL HDM Decoder Capability to translate the CXL DVSEC Range Registers into 'struct cxl_decoder' objects. - Set timestamp: Per spec, set the device timestamp in case of hotplug, or if platform-firwmare failed to set it. - General fixups: linux-next build issues, non-urgent fixes for pre-production hardware, unit test fixes, spelling and debug message improvements" * tag 'cxl-for-6.3' of git://git.kernel.org/pub/scm/linux/kernel/git/cxl/cxl: (66 commits) dax/kmem: Fix leak of memory-hotplug resources cxl/mem: Add kdoc param for event log driver state cxl/trace: Add serial number to trace points cxl/trace: Add host output to trace points cxl/trace: Standardize device information output cxl/pci: Remove locked check for dvsec_range_allowed() cxl/hdm: Add emulation when HDM decoders are not committed cxl/hdm: Create emulated cxl_hdm for devices that do not have HDM decoders cxl/hdm: Emulate HDM decoder from DVSEC range registers cxl/pci: Refactor cxl_hdm_decode_init() cxl/port: Export cxl_dvsec_rr_decode() to cxl_port cxl/pci: Break out range register decoding from cxl_hdm_decode_init() cxl: add RAS status unmasking for CXL cxl: remove unnecessary calling of pci_enable_pcie_error_reporting() dax/hmem: build hmem device support as module if possible dax: cxl: add CXL_REGION dependency cxl: avoid returning uninitialized error code cxl/pmem: Fix nvdimm registration races cxl/mem: Fix UAPI command comment cxl/uapi: Tag commands from cxl_query_cmd() ...
798 lines
25 KiB
C
798 lines
25 KiB
C
/* SPDX-License-Identifier: GPL-2.0-only */
|
|
/* Copyright(c) 2020 Intel Corporation. */
|
|
|
|
#ifndef __CXL_H__
|
|
#define __CXL_H__
|
|
|
|
#include <linux/libnvdimm.h>
|
|
#include <linux/bitfield.h>
|
|
#include <linux/bitops.h>
|
|
#include <linux/log2.h>
|
|
#include <linux/io.h>
|
|
|
|
/**
|
|
* DOC: cxl objects
|
|
*
|
|
* The CXL core objects like ports, decoders, and regions are shared
|
|
* between the subsystem drivers cxl_acpi, cxl_pci, and core drivers
|
|
* (port-driver, region-driver, nvdimm object-drivers... etc).
|
|
*/
|
|
|
|
/* CXL 2.0 8.2.4 CXL Component Register Layout and Definition */
|
|
#define CXL_COMPONENT_REG_BLOCK_SIZE SZ_64K
|
|
|
|
/* CXL 2.0 8.2.5 CXL.cache and CXL.mem Registers*/
|
|
#define CXL_CM_OFFSET 0x1000
|
|
#define CXL_CM_CAP_HDR_OFFSET 0x0
|
|
#define CXL_CM_CAP_HDR_ID_MASK GENMASK(15, 0)
|
|
#define CM_CAP_HDR_CAP_ID 1
|
|
#define CXL_CM_CAP_HDR_VERSION_MASK GENMASK(19, 16)
|
|
#define CM_CAP_HDR_CAP_VERSION 1
|
|
#define CXL_CM_CAP_HDR_CACHE_MEM_VERSION_MASK GENMASK(23, 20)
|
|
#define CM_CAP_HDR_CACHE_MEM_VERSION 1
|
|
#define CXL_CM_CAP_HDR_ARRAY_SIZE_MASK GENMASK(31, 24)
|
|
#define CXL_CM_CAP_PTR_MASK GENMASK(31, 20)
|
|
|
|
#define CXL_CM_CAP_CAP_ID_RAS 0x2
|
|
#define CXL_CM_CAP_CAP_ID_HDM 0x5
|
|
#define CXL_CM_CAP_CAP_HDM_VERSION 1
|
|
|
|
/* HDM decoders CXL 2.0 8.2.5.12 CXL HDM Decoder Capability Structure */
|
|
#define CXL_HDM_DECODER_CAP_OFFSET 0x0
|
|
#define CXL_HDM_DECODER_COUNT_MASK GENMASK(3, 0)
|
|
#define CXL_HDM_DECODER_TARGET_COUNT_MASK GENMASK(7, 4)
|
|
#define CXL_HDM_DECODER_INTERLEAVE_11_8 BIT(8)
|
|
#define CXL_HDM_DECODER_INTERLEAVE_14_12 BIT(9)
|
|
#define CXL_HDM_DECODER_CTRL_OFFSET 0x4
|
|
#define CXL_HDM_DECODER_ENABLE BIT(1)
|
|
#define CXL_HDM_DECODER0_BASE_LOW_OFFSET(i) (0x20 * (i) + 0x10)
|
|
#define CXL_HDM_DECODER0_BASE_HIGH_OFFSET(i) (0x20 * (i) + 0x14)
|
|
#define CXL_HDM_DECODER0_SIZE_LOW_OFFSET(i) (0x20 * (i) + 0x18)
|
|
#define CXL_HDM_DECODER0_SIZE_HIGH_OFFSET(i) (0x20 * (i) + 0x1c)
|
|
#define CXL_HDM_DECODER0_CTRL_OFFSET(i) (0x20 * (i) + 0x20)
|
|
#define CXL_HDM_DECODER0_CTRL_IG_MASK GENMASK(3, 0)
|
|
#define CXL_HDM_DECODER0_CTRL_IW_MASK GENMASK(7, 4)
|
|
#define CXL_HDM_DECODER0_CTRL_LOCK BIT(8)
|
|
#define CXL_HDM_DECODER0_CTRL_COMMIT BIT(9)
|
|
#define CXL_HDM_DECODER0_CTRL_COMMITTED BIT(10)
|
|
#define CXL_HDM_DECODER0_CTRL_COMMIT_ERROR BIT(11)
|
|
#define CXL_HDM_DECODER0_CTRL_TYPE BIT(12)
|
|
#define CXL_HDM_DECODER0_TL_LOW(i) (0x20 * (i) + 0x24)
|
|
#define CXL_HDM_DECODER0_TL_HIGH(i) (0x20 * (i) + 0x28)
|
|
#define CXL_HDM_DECODER0_SKIP_LOW(i) CXL_HDM_DECODER0_TL_LOW(i)
|
|
#define CXL_HDM_DECODER0_SKIP_HIGH(i) CXL_HDM_DECODER0_TL_HIGH(i)
|
|
|
|
/* HDM decoder control register constants CXL 3.0 8.2.5.19.7 */
|
|
#define CXL_DECODER_MIN_GRANULARITY 256
|
|
#define CXL_DECODER_MAX_ENCODED_IG 6
|
|
|
|
static inline int cxl_hdm_decoder_count(u32 cap_hdr)
|
|
{
|
|
int val = FIELD_GET(CXL_HDM_DECODER_COUNT_MASK, cap_hdr);
|
|
|
|
return val ? val * 2 : 1;
|
|
}
|
|
|
|
/* Encode defined in CXL 2.0 8.2.5.12.7 HDM Decoder Control Register */
|
|
static inline int eig_to_granularity(u16 eig, unsigned int *granularity)
|
|
{
|
|
if (eig > CXL_DECODER_MAX_ENCODED_IG)
|
|
return -EINVAL;
|
|
*granularity = CXL_DECODER_MIN_GRANULARITY << eig;
|
|
return 0;
|
|
}
|
|
|
|
/* Encode defined in CXL ECN "3, 6, 12 and 16-way memory Interleaving" */
|
|
static inline int eiw_to_ways(u8 eiw, unsigned int *ways)
|
|
{
|
|
switch (eiw) {
|
|
case 0 ... 4:
|
|
*ways = 1 << eiw;
|
|
break;
|
|
case 8 ... 10:
|
|
*ways = 3 << (eiw - 8);
|
|
break;
|
|
default:
|
|
return -EINVAL;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static inline int granularity_to_eig(int granularity, u16 *eig)
|
|
{
|
|
if (granularity > SZ_16K || granularity < CXL_DECODER_MIN_GRANULARITY ||
|
|
!is_power_of_2(granularity))
|
|
return -EINVAL;
|
|
*eig = ilog2(granularity) - 8;
|
|
return 0;
|
|
}
|
|
|
|
static inline int ways_to_eiw(unsigned int ways, u8 *eiw)
|
|
{
|
|
if (ways > 16)
|
|
return -EINVAL;
|
|
if (is_power_of_2(ways)) {
|
|
*eiw = ilog2(ways);
|
|
return 0;
|
|
}
|
|
if (ways % 3)
|
|
return -EINVAL;
|
|
ways /= 3;
|
|
if (!is_power_of_2(ways))
|
|
return -EINVAL;
|
|
*eiw = ilog2(ways) + 8;
|
|
return 0;
|
|
}
|
|
|
|
/* RAS Registers CXL 2.0 8.2.5.9 CXL RAS Capability Structure */
|
|
#define CXL_RAS_UNCORRECTABLE_STATUS_OFFSET 0x0
|
|
#define CXL_RAS_UNCORRECTABLE_STATUS_MASK (GENMASK(16, 14) | GENMASK(11, 0))
|
|
#define CXL_RAS_UNCORRECTABLE_MASK_OFFSET 0x4
|
|
#define CXL_RAS_UNCORRECTABLE_MASK_MASK (GENMASK(16, 14) | GENMASK(11, 0))
|
|
#define CXL_RAS_UNCORRECTABLE_MASK_F256B_MASK BIT(8)
|
|
#define CXL_RAS_UNCORRECTABLE_SEVERITY_OFFSET 0x8
|
|
#define CXL_RAS_UNCORRECTABLE_SEVERITY_MASK (GENMASK(16, 14) | GENMASK(11, 0))
|
|
#define CXL_RAS_CORRECTABLE_STATUS_OFFSET 0xC
|
|
#define CXL_RAS_CORRECTABLE_STATUS_MASK GENMASK(6, 0)
|
|
#define CXL_RAS_CORRECTABLE_MASK_OFFSET 0x10
|
|
#define CXL_RAS_CORRECTABLE_MASK_MASK GENMASK(6, 0)
|
|
#define CXL_RAS_CAP_CONTROL_OFFSET 0x14
|
|
#define CXL_RAS_CAP_CONTROL_FE_MASK GENMASK(5, 0)
|
|
#define CXL_RAS_HEADER_LOG_OFFSET 0x18
|
|
#define CXL_RAS_CAPABILITY_LENGTH 0x58
|
|
#define CXL_HEADERLOG_SIZE SZ_512
|
|
#define CXL_HEADERLOG_SIZE_U32 SZ_512 / sizeof(u32)
|
|
|
|
/* CXL 2.0 8.2.8.1 Device Capabilities Array Register */
|
|
#define CXLDEV_CAP_ARRAY_OFFSET 0x0
|
|
#define CXLDEV_CAP_ARRAY_CAP_ID 0
|
|
#define CXLDEV_CAP_ARRAY_ID_MASK GENMASK_ULL(15, 0)
|
|
#define CXLDEV_CAP_ARRAY_COUNT_MASK GENMASK_ULL(47, 32)
|
|
/* CXL 2.0 8.2.8.2 CXL Device Capability Header Register */
|
|
#define CXLDEV_CAP_HDR_CAP_ID_MASK GENMASK(15, 0)
|
|
/* CXL 2.0 8.2.8.2.1 CXL Device Capabilities */
|
|
#define CXLDEV_CAP_CAP_ID_DEVICE_STATUS 0x1
|
|
#define CXLDEV_CAP_CAP_ID_PRIMARY_MAILBOX 0x2
|
|
#define CXLDEV_CAP_CAP_ID_SECONDARY_MAILBOX 0x3
|
|
#define CXLDEV_CAP_CAP_ID_MEMDEV 0x4000
|
|
|
|
/* CXL 3.0 8.2.8.3.1 Event Status Register */
|
|
#define CXLDEV_DEV_EVENT_STATUS_OFFSET 0x00
|
|
#define CXLDEV_EVENT_STATUS_INFO BIT(0)
|
|
#define CXLDEV_EVENT_STATUS_WARN BIT(1)
|
|
#define CXLDEV_EVENT_STATUS_FAIL BIT(2)
|
|
#define CXLDEV_EVENT_STATUS_FATAL BIT(3)
|
|
|
|
#define CXLDEV_EVENT_STATUS_ALL (CXLDEV_EVENT_STATUS_INFO | \
|
|
CXLDEV_EVENT_STATUS_WARN | \
|
|
CXLDEV_EVENT_STATUS_FAIL | \
|
|
CXLDEV_EVENT_STATUS_FATAL)
|
|
|
|
/* CXL rev 3.0 section 8.2.9.2.4; Table 8-52 */
|
|
#define CXLDEV_EVENT_INT_MODE_MASK GENMASK(1, 0)
|
|
#define CXLDEV_EVENT_INT_MSGNUM_MASK GENMASK(7, 4)
|
|
|
|
/* CXL 2.0 8.2.8.4 Mailbox Registers */
|
|
#define CXLDEV_MBOX_CAPS_OFFSET 0x00
|
|
#define CXLDEV_MBOX_CAP_PAYLOAD_SIZE_MASK GENMASK(4, 0)
|
|
#define CXLDEV_MBOX_CTRL_OFFSET 0x04
|
|
#define CXLDEV_MBOX_CTRL_DOORBELL BIT(0)
|
|
#define CXLDEV_MBOX_CMD_OFFSET 0x08
|
|
#define CXLDEV_MBOX_CMD_COMMAND_OPCODE_MASK GENMASK_ULL(15, 0)
|
|
#define CXLDEV_MBOX_CMD_PAYLOAD_LENGTH_MASK GENMASK_ULL(36, 16)
|
|
#define CXLDEV_MBOX_STATUS_OFFSET 0x10
|
|
#define CXLDEV_MBOX_STATUS_RET_CODE_MASK GENMASK_ULL(47, 32)
|
|
#define CXLDEV_MBOX_BG_CMD_STATUS_OFFSET 0x18
|
|
#define CXLDEV_MBOX_PAYLOAD_OFFSET 0x20
|
|
|
|
/*
|
|
* Using struct_group() allows for per register-block-type helper routines,
|
|
* without requiring block-type agnostic code to include the prefix.
|
|
*/
|
|
struct cxl_regs {
|
|
/*
|
|
* Common set of CXL Component register block base pointers
|
|
* @hdm_decoder: CXL 2.0 8.2.5.12 CXL HDM Decoder Capability Structure
|
|
* @ras: CXL 2.0 8.2.5.9 CXL RAS Capability Structure
|
|
*/
|
|
struct_group_tagged(cxl_component_regs, component,
|
|
void __iomem *hdm_decoder;
|
|
void __iomem *ras;
|
|
);
|
|
/*
|
|
* Common set of CXL Device register block base pointers
|
|
* @status: CXL 2.0 8.2.8.3 Device Status Registers
|
|
* @mbox: CXL 2.0 8.2.8.4 Mailbox Registers
|
|
* @memdev: CXL 2.0 8.2.8.5 Memory Device Registers
|
|
*/
|
|
struct_group_tagged(cxl_device_regs, device_regs,
|
|
void __iomem *status, *mbox, *memdev;
|
|
);
|
|
};
|
|
|
|
struct cxl_reg_map {
|
|
bool valid;
|
|
int id;
|
|
unsigned long offset;
|
|
unsigned long size;
|
|
};
|
|
|
|
struct cxl_component_reg_map {
|
|
struct cxl_reg_map hdm_decoder;
|
|
struct cxl_reg_map ras;
|
|
};
|
|
|
|
struct cxl_device_reg_map {
|
|
struct cxl_reg_map status;
|
|
struct cxl_reg_map mbox;
|
|
struct cxl_reg_map memdev;
|
|
};
|
|
|
|
/**
|
|
* struct cxl_register_map - DVSEC harvested register block mapping parameters
|
|
* @base: virtual base of the register-block-BAR + @block_offset
|
|
* @resource: physical resource base of the register block
|
|
* @max_size: maximum mapping size to perform register search
|
|
* @reg_type: see enum cxl_regloc_type
|
|
* @component_map: cxl_reg_map for component registers
|
|
* @device_map: cxl_reg_maps for device registers
|
|
*/
|
|
struct cxl_register_map {
|
|
void __iomem *base;
|
|
resource_size_t resource;
|
|
resource_size_t max_size;
|
|
u8 reg_type;
|
|
union {
|
|
struct cxl_component_reg_map component_map;
|
|
struct cxl_device_reg_map device_map;
|
|
};
|
|
};
|
|
|
|
void cxl_probe_component_regs(struct device *dev, void __iomem *base,
|
|
struct cxl_component_reg_map *map);
|
|
void cxl_probe_device_regs(struct device *dev, void __iomem *base,
|
|
struct cxl_device_reg_map *map);
|
|
int cxl_map_component_regs(struct device *dev, struct cxl_component_regs *regs,
|
|
struct cxl_register_map *map,
|
|
unsigned long map_mask);
|
|
int cxl_map_device_regs(struct device *dev, struct cxl_device_regs *regs,
|
|
struct cxl_register_map *map);
|
|
|
|
enum cxl_regloc_type;
|
|
int cxl_find_regblock(struct pci_dev *pdev, enum cxl_regloc_type type,
|
|
struct cxl_register_map *map);
|
|
|
|
enum cxl_rcrb {
|
|
CXL_RCRB_DOWNSTREAM,
|
|
CXL_RCRB_UPSTREAM,
|
|
};
|
|
resource_size_t cxl_rcrb_to_component(struct device *dev,
|
|
resource_size_t rcrb,
|
|
enum cxl_rcrb which);
|
|
|
|
#define CXL_RESOURCE_NONE ((resource_size_t) -1)
|
|
#define CXL_TARGET_STRLEN 20
|
|
|
|
/*
|
|
* cxl_decoder flags that define the type of memory / devices this
|
|
* decoder supports as well as configuration lock status See "CXL 2.0
|
|
* 8.2.5.12.7 CXL HDM Decoder 0 Control Register" for details.
|
|
* Additionally indicate whether decoder settings were autodetected,
|
|
* user customized.
|
|
*/
|
|
#define CXL_DECODER_F_RAM BIT(0)
|
|
#define CXL_DECODER_F_PMEM BIT(1)
|
|
#define CXL_DECODER_F_TYPE2 BIT(2)
|
|
#define CXL_DECODER_F_TYPE3 BIT(3)
|
|
#define CXL_DECODER_F_LOCK BIT(4)
|
|
#define CXL_DECODER_F_ENABLE BIT(5)
|
|
#define CXL_DECODER_F_MASK GENMASK(5, 0)
|
|
|
|
enum cxl_decoder_type {
|
|
CXL_DECODER_ACCELERATOR = 2,
|
|
CXL_DECODER_EXPANDER = 3,
|
|
};
|
|
|
|
/*
|
|
* Current specification goes up to 8, double that seems a reasonable
|
|
* software max for the foreseeable future
|
|
*/
|
|
#define CXL_DECODER_MAX_INTERLEAVE 16
|
|
|
|
|
|
/**
|
|
* struct cxl_decoder - Common CXL HDM Decoder Attributes
|
|
* @dev: this decoder's device
|
|
* @id: kernel device name id
|
|
* @hpa_range: Host physical address range mapped by this decoder
|
|
* @interleave_ways: number of cxl_dports in this decode
|
|
* @interleave_granularity: data stride per dport
|
|
* @target_type: accelerator vs expander (type2 vs type3) selector
|
|
* @region: currently assigned region for this decoder
|
|
* @flags: memory type capabilities and locking
|
|
* @commit: device/decoder-type specific callback to commit settings to hw
|
|
* @reset: device/decoder-type specific callback to reset hw settings
|
|
*/
|
|
struct cxl_decoder {
|
|
struct device dev;
|
|
int id;
|
|
struct range hpa_range;
|
|
int interleave_ways;
|
|
int interleave_granularity;
|
|
enum cxl_decoder_type target_type;
|
|
struct cxl_region *region;
|
|
unsigned long flags;
|
|
int (*commit)(struct cxl_decoder *cxld);
|
|
int (*reset)(struct cxl_decoder *cxld);
|
|
};
|
|
|
|
/*
|
|
* CXL_DECODER_DEAD prevents endpoints from being reattached to regions
|
|
* while cxld_unregister() is running
|
|
*/
|
|
enum cxl_decoder_mode {
|
|
CXL_DECODER_NONE,
|
|
CXL_DECODER_RAM,
|
|
CXL_DECODER_PMEM,
|
|
CXL_DECODER_MIXED,
|
|
CXL_DECODER_DEAD,
|
|
};
|
|
|
|
static inline const char *cxl_decoder_mode_name(enum cxl_decoder_mode mode)
|
|
{
|
|
static const char * const names[] = {
|
|
[CXL_DECODER_NONE] = "none",
|
|
[CXL_DECODER_RAM] = "ram",
|
|
[CXL_DECODER_PMEM] = "pmem",
|
|
[CXL_DECODER_MIXED] = "mixed",
|
|
};
|
|
|
|
if (mode >= CXL_DECODER_NONE && mode <= CXL_DECODER_MIXED)
|
|
return names[mode];
|
|
return "mixed";
|
|
}
|
|
|
|
/*
|
|
* Track whether this decoder is reserved for region autodiscovery, or
|
|
* free for userspace provisioning.
|
|
*/
|
|
enum cxl_decoder_state {
|
|
CXL_DECODER_STATE_MANUAL,
|
|
CXL_DECODER_STATE_AUTO,
|
|
};
|
|
|
|
/**
|
|
* struct cxl_endpoint_decoder - Endpoint / SPA to DPA decoder
|
|
* @cxld: base cxl_decoder_object
|
|
* @dpa_res: actively claimed DPA span of this decoder
|
|
* @skip: offset into @dpa_res where @cxld.hpa_range maps
|
|
* @mode: which memory type / access-mode-partition this decoder targets
|
|
* @state: autodiscovery state
|
|
* @pos: interleave position in @cxld.region
|
|
*/
|
|
struct cxl_endpoint_decoder {
|
|
struct cxl_decoder cxld;
|
|
struct resource *dpa_res;
|
|
resource_size_t skip;
|
|
enum cxl_decoder_mode mode;
|
|
enum cxl_decoder_state state;
|
|
int pos;
|
|
};
|
|
|
|
/**
|
|
* struct cxl_switch_decoder - Switch specific CXL HDM Decoder
|
|
* @cxld: base cxl_decoder object
|
|
* @target_lock: coordinate coherent reads of the target list
|
|
* @nr_targets: number of elements in @target
|
|
* @target: active ordered target list in current decoder configuration
|
|
*
|
|
* The 'switch' decoder type represents the decoder instances of cxl_port's that
|
|
* route from the root of a CXL memory decode topology to the endpoints. They
|
|
* come in two flavors, root-level decoders, statically defined by platform
|
|
* firmware, and mid-level decoders, where interleave-granularity,
|
|
* interleave-width, and the target list are mutable.
|
|
*/
|
|
struct cxl_switch_decoder {
|
|
struct cxl_decoder cxld;
|
|
seqlock_t target_lock;
|
|
int nr_targets;
|
|
struct cxl_dport *target[];
|
|
};
|
|
|
|
struct cxl_root_decoder;
|
|
typedef struct cxl_dport *(*cxl_calc_hb_fn)(struct cxl_root_decoder *cxlrd,
|
|
int pos);
|
|
|
|
/**
|
|
* struct cxl_root_decoder - Static platform CXL address decoder
|
|
* @res: host / parent resource for region allocations
|
|
* @region_id: region id for next region provisioning event
|
|
* @calc_hb: which host bridge covers the n'th position by granularity
|
|
* @platform_data: platform specific configuration data
|
|
* @range_lock: sync region autodiscovery by address range
|
|
* @cxlsd: base cxl switch decoder
|
|
*/
|
|
struct cxl_root_decoder {
|
|
struct resource *res;
|
|
atomic_t region_id;
|
|
cxl_calc_hb_fn calc_hb;
|
|
void *platform_data;
|
|
struct mutex range_lock;
|
|
struct cxl_switch_decoder cxlsd;
|
|
};
|
|
|
|
/*
|
|
* enum cxl_config_state - State machine for region configuration
|
|
* @CXL_CONFIG_IDLE: Any sysfs attribute can be written freely
|
|
* @CXL_CONFIG_INTERLEAVE_ACTIVE: region size has been set, no more
|
|
* changes to interleave_ways or interleave_granularity
|
|
* @CXL_CONFIG_ACTIVE: All targets have been added the region is now
|
|
* active
|
|
* @CXL_CONFIG_RESET_PENDING: see commit_store()
|
|
* @CXL_CONFIG_COMMIT: Soft-config has been committed to hardware
|
|
*/
|
|
enum cxl_config_state {
|
|
CXL_CONFIG_IDLE,
|
|
CXL_CONFIG_INTERLEAVE_ACTIVE,
|
|
CXL_CONFIG_ACTIVE,
|
|
CXL_CONFIG_RESET_PENDING,
|
|
CXL_CONFIG_COMMIT,
|
|
};
|
|
|
|
/**
|
|
* struct cxl_region_params - region settings
|
|
* @state: allow the driver to lockdown further parameter changes
|
|
* @uuid: unique id for persistent regions
|
|
* @interleave_ways: number of endpoints in the region
|
|
* @interleave_granularity: capacity each endpoint contributes to a stripe
|
|
* @res: allocated iomem capacity for this region
|
|
* @targets: active ordered targets in current decoder configuration
|
|
* @nr_targets: number of targets
|
|
*
|
|
* State transitions are protected by the cxl_region_rwsem
|
|
*/
|
|
struct cxl_region_params {
|
|
enum cxl_config_state state;
|
|
uuid_t uuid;
|
|
int interleave_ways;
|
|
int interleave_granularity;
|
|
struct resource *res;
|
|
struct cxl_endpoint_decoder *targets[CXL_DECODER_MAX_INTERLEAVE];
|
|
int nr_targets;
|
|
};
|
|
|
|
/*
|
|
* Flag whether this region needs to have its HPA span synchronized with
|
|
* CPU cache state at region activation time.
|
|
*/
|
|
#define CXL_REGION_F_INCOHERENT 0
|
|
|
|
/*
|
|
* Indicate whether this region has been assembled by autodetection or
|
|
* userspace assembly. Prevent endpoint decoders outside of automatic
|
|
* detection from being added to the region.
|
|
*/
|
|
#define CXL_REGION_F_AUTO 1
|
|
|
|
/**
|
|
* struct cxl_region - CXL region
|
|
* @dev: This region's device
|
|
* @id: This region's id. Id is globally unique across all regions
|
|
* @mode: Endpoint decoder allocation / access mode
|
|
* @type: Endpoint decoder target type
|
|
* @cxl_nvb: nvdimm bridge for coordinating @cxlr_pmem setup / shutdown
|
|
* @cxlr_pmem: (for pmem regions) cached copy of the nvdimm bridge
|
|
* @flags: Region state flags
|
|
* @params: active + config params for the region
|
|
*/
|
|
struct cxl_region {
|
|
struct device dev;
|
|
int id;
|
|
enum cxl_decoder_mode mode;
|
|
enum cxl_decoder_type type;
|
|
struct cxl_nvdimm_bridge *cxl_nvb;
|
|
struct cxl_pmem_region *cxlr_pmem;
|
|
unsigned long flags;
|
|
struct cxl_region_params params;
|
|
};
|
|
|
|
struct cxl_nvdimm_bridge {
|
|
int id;
|
|
struct device dev;
|
|
struct cxl_port *port;
|
|
struct nvdimm_bus *nvdimm_bus;
|
|
struct nvdimm_bus_descriptor nd_desc;
|
|
};
|
|
|
|
#define CXL_DEV_ID_LEN 19
|
|
|
|
struct cxl_nvdimm {
|
|
struct device dev;
|
|
struct cxl_memdev *cxlmd;
|
|
u8 dev_id[CXL_DEV_ID_LEN]; /* for nvdimm, string of 'serial' */
|
|
};
|
|
|
|
struct cxl_pmem_region_mapping {
|
|
struct cxl_memdev *cxlmd;
|
|
struct cxl_nvdimm *cxl_nvd;
|
|
u64 start;
|
|
u64 size;
|
|
int position;
|
|
};
|
|
|
|
struct cxl_pmem_region {
|
|
struct device dev;
|
|
struct cxl_region *cxlr;
|
|
struct nd_region *nd_region;
|
|
struct range hpa_range;
|
|
int nr_mappings;
|
|
struct cxl_pmem_region_mapping mapping[];
|
|
};
|
|
|
|
struct cxl_dax_region {
|
|
struct device dev;
|
|
struct cxl_region *cxlr;
|
|
struct range hpa_range;
|
|
};
|
|
|
|
/**
|
|
* struct cxl_port - logical collection of upstream port devices and
|
|
* downstream port devices to construct a CXL memory
|
|
* decode hierarchy.
|
|
* @dev: this port's device
|
|
* @uport: PCI or platform device implementing the upstream port capability
|
|
* @host_bridge: Shortcut to the platform attach point for this port
|
|
* @id: id for port device-name
|
|
* @dports: cxl_dport instances referenced by decoders
|
|
* @endpoints: cxl_ep instances, endpoints that are a descendant of this port
|
|
* @regions: cxl_region_ref instances, regions mapped by this port
|
|
* @parent_dport: dport that points to this port in the parent
|
|
* @decoder_ida: allocator for decoder ids
|
|
* @nr_dports: number of entries in @dports
|
|
* @hdm_end: track last allocated HDM decoder instance for allocation ordering
|
|
* @commit_end: cursor to track highest committed decoder for commit ordering
|
|
* @component_reg_phys: component register capability base address (optional)
|
|
* @dead: last ep has been removed, force port re-creation
|
|
* @depth: How deep this port is relative to the root. depth 0 is the root.
|
|
* @cdat: Cached CDAT data
|
|
* @cdat_available: Should a CDAT attribute be available in sysfs
|
|
*/
|
|
struct cxl_port {
|
|
struct device dev;
|
|
struct device *uport;
|
|
struct device *host_bridge;
|
|
int id;
|
|
struct xarray dports;
|
|
struct xarray endpoints;
|
|
struct xarray regions;
|
|
struct cxl_dport *parent_dport;
|
|
struct ida decoder_ida;
|
|
int nr_dports;
|
|
int hdm_end;
|
|
int commit_end;
|
|
resource_size_t component_reg_phys;
|
|
bool dead;
|
|
unsigned int depth;
|
|
struct cxl_cdat {
|
|
void *table;
|
|
size_t length;
|
|
} cdat;
|
|
bool cdat_available;
|
|
};
|
|
|
|
static inline struct cxl_dport *
|
|
cxl_find_dport_by_dev(struct cxl_port *port, const struct device *dport_dev)
|
|
{
|
|
return xa_load(&port->dports, (unsigned long)dport_dev);
|
|
}
|
|
|
|
/**
|
|
* struct cxl_dport - CXL downstream port
|
|
* @dport: PCI bridge or firmware device representing the downstream link
|
|
* @port_id: unique hardware identifier for dport in decoder target list
|
|
* @component_reg_phys: downstream port component registers
|
|
* @rcrb: base address for the Root Complex Register Block
|
|
* @rch: Indicate whether this dport was enumerated in RCH or VH mode
|
|
* @port: reference to cxl_port that contains this downstream port
|
|
*/
|
|
struct cxl_dport {
|
|
struct device *dport;
|
|
int port_id;
|
|
resource_size_t component_reg_phys;
|
|
resource_size_t rcrb;
|
|
bool rch;
|
|
struct cxl_port *port;
|
|
};
|
|
|
|
/**
|
|
* struct cxl_ep - track an endpoint's interest in a port
|
|
* @ep: device that hosts a generic CXL endpoint (expander or accelerator)
|
|
* @dport: which dport routes to this endpoint on @port
|
|
* @next: cxl switch port across the link attached to @dport NULL if
|
|
* attached to an endpoint
|
|
*/
|
|
struct cxl_ep {
|
|
struct device *ep;
|
|
struct cxl_dport *dport;
|
|
struct cxl_port *next;
|
|
};
|
|
|
|
/**
|
|
* struct cxl_region_ref - track a region's interest in a port
|
|
* @port: point in topology to install this reference
|
|
* @decoder: decoder assigned for @region in @port
|
|
* @region: region for this reference
|
|
* @endpoints: cxl_ep references for region members beneath @port
|
|
* @nr_targets_set: track how many targets have been programmed during setup
|
|
* @nr_eps: number of endpoints beneath @port
|
|
* @nr_targets: number of distinct targets needed to reach @nr_eps
|
|
*/
|
|
struct cxl_region_ref {
|
|
struct cxl_port *port;
|
|
struct cxl_decoder *decoder;
|
|
struct cxl_region *region;
|
|
struct xarray endpoints;
|
|
int nr_targets_set;
|
|
int nr_eps;
|
|
int nr_targets;
|
|
};
|
|
|
|
/*
|
|
* The platform firmware device hosting the root is also the top of the
|
|
* CXL port topology. All other CXL ports have another CXL port as their
|
|
* parent and their ->uport / host device is out-of-line of the port
|
|
* ancestry.
|
|
*/
|
|
static inline bool is_cxl_root(struct cxl_port *port)
|
|
{
|
|
return port->uport == port->dev.parent;
|
|
}
|
|
|
|
bool is_cxl_port(const struct device *dev);
|
|
struct cxl_port *to_cxl_port(const struct device *dev);
|
|
struct pci_bus;
|
|
int devm_cxl_register_pci_bus(struct device *host, struct device *uport,
|
|
struct pci_bus *bus);
|
|
struct pci_bus *cxl_port_to_pci_bus(struct cxl_port *port);
|
|
struct cxl_port *devm_cxl_add_port(struct device *host, struct device *uport,
|
|
resource_size_t component_reg_phys,
|
|
struct cxl_dport *parent_dport);
|
|
struct cxl_port *find_cxl_root(struct device *dev);
|
|
int devm_cxl_enumerate_ports(struct cxl_memdev *cxlmd);
|
|
void cxl_bus_rescan(void);
|
|
void cxl_bus_drain(void);
|
|
struct cxl_port *cxl_mem_find_port(struct cxl_memdev *cxlmd,
|
|
struct cxl_dport **dport);
|
|
bool schedule_cxl_memdev_detach(struct cxl_memdev *cxlmd);
|
|
|
|
struct cxl_dport *devm_cxl_add_dport(struct cxl_port *port,
|
|
struct device *dport, int port_id,
|
|
resource_size_t component_reg_phys);
|
|
struct cxl_dport *devm_cxl_add_rch_dport(struct cxl_port *port,
|
|
struct device *dport_dev, int port_id,
|
|
resource_size_t component_reg_phys,
|
|
resource_size_t rcrb);
|
|
|
|
struct cxl_decoder *to_cxl_decoder(struct device *dev);
|
|
struct cxl_root_decoder *to_cxl_root_decoder(struct device *dev);
|
|
struct cxl_switch_decoder *to_cxl_switch_decoder(struct device *dev);
|
|
struct cxl_endpoint_decoder *to_cxl_endpoint_decoder(struct device *dev);
|
|
bool is_root_decoder(struct device *dev);
|
|
bool is_switch_decoder(struct device *dev);
|
|
bool is_endpoint_decoder(struct device *dev);
|
|
struct cxl_root_decoder *cxl_root_decoder_alloc(struct cxl_port *port,
|
|
unsigned int nr_targets,
|
|
cxl_calc_hb_fn calc_hb);
|
|
struct cxl_dport *cxl_hb_modulo(struct cxl_root_decoder *cxlrd, int pos);
|
|
struct cxl_switch_decoder *cxl_switch_decoder_alloc(struct cxl_port *port,
|
|
unsigned int nr_targets);
|
|
int cxl_decoder_add(struct cxl_decoder *cxld, int *target_map);
|
|
struct cxl_endpoint_decoder *cxl_endpoint_decoder_alloc(struct cxl_port *port);
|
|
int cxl_decoder_add_locked(struct cxl_decoder *cxld, int *target_map);
|
|
int cxl_decoder_autoremove(struct device *host, struct cxl_decoder *cxld);
|
|
int cxl_endpoint_autoremove(struct cxl_memdev *cxlmd, struct cxl_port *endpoint);
|
|
|
|
/**
|
|
* struct cxl_endpoint_dvsec_info - Cached DVSEC info
|
|
* @mem_enabled: cached value of mem_enabled in the DVSEC, PCIE_DEVICE
|
|
* @ranges: Number of active HDM ranges this device uses.
|
|
* @dvsec_range: cached attributes of the ranges in the DVSEC, PCIE_DEVICE
|
|
*/
|
|
struct cxl_endpoint_dvsec_info {
|
|
bool mem_enabled;
|
|
int ranges;
|
|
struct range dvsec_range[2];
|
|
};
|
|
|
|
struct cxl_hdm;
|
|
struct cxl_hdm *devm_cxl_setup_hdm(struct cxl_port *port,
|
|
struct cxl_endpoint_dvsec_info *info);
|
|
int devm_cxl_enumerate_decoders(struct cxl_hdm *cxlhdm,
|
|
struct cxl_endpoint_dvsec_info *info);
|
|
int devm_cxl_add_passthrough_decoder(struct cxl_port *port);
|
|
int cxl_dvsec_rr_decode(struct device *dev, int dvsec,
|
|
struct cxl_endpoint_dvsec_info *info);
|
|
|
|
bool is_cxl_region(struct device *dev);
|
|
|
|
extern struct bus_type cxl_bus_type;
|
|
|
|
struct cxl_driver {
|
|
const char *name;
|
|
int (*probe)(struct device *dev);
|
|
void (*remove)(struct device *dev);
|
|
struct device_driver drv;
|
|
int id;
|
|
};
|
|
|
|
static inline struct cxl_driver *to_cxl_drv(struct device_driver *drv)
|
|
{
|
|
return container_of(drv, struct cxl_driver, drv);
|
|
}
|
|
|
|
int __cxl_driver_register(struct cxl_driver *cxl_drv, struct module *owner,
|
|
const char *modname);
|
|
#define cxl_driver_register(x) __cxl_driver_register(x, THIS_MODULE, KBUILD_MODNAME)
|
|
void cxl_driver_unregister(struct cxl_driver *cxl_drv);
|
|
|
|
#define module_cxl_driver(__cxl_driver) \
|
|
module_driver(__cxl_driver, cxl_driver_register, cxl_driver_unregister)
|
|
|
|
#define CXL_DEVICE_NVDIMM_BRIDGE 1
|
|
#define CXL_DEVICE_NVDIMM 2
|
|
#define CXL_DEVICE_PORT 3
|
|
#define CXL_DEVICE_ROOT 4
|
|
#define CXL_DEVICE_MEMORY_EXPANDER 5
|
|
#define CXL_DEVICE_REGION 6
|
|
#define CXL_DEVICE_PMEM_REGION 7
|
|
#define CXL_DEVICE_DAX_REGION 8
|
|
|
|
#define MODULE_ALIAS_CXL(type) MODULE_ALIAS("cxl:t" __stringify(type) "*")
|
|
#define CXL_MODALIAS_FMT "cxl:t%d"
|
|
|
|
struct cxl_nvdimm_bridge *to_cxl_nvdimm_bridge(struct device *dev);
|
|
struct cxl_nvdimm_bridge *devm_cxl_add_nvdimm_bridge(struct device *host,
|
|
struct cxl_port *port);
|
|
struct cxl_nvdimm *to_cxl_nvdimm(struct device *dev);
|
|
bool is_cxl_nvdimm(struct device *dev);
|
|
bool is_cxl_nvdimm_bridge(struct device *dev);
|
|
int devm_cxl_add_nvdimm(struct cxl_memdev *cxlmd);
|
|
struct cxl_nvdimm_bridge *cxl_find_nvdimm_bridge(struct device *dev);
|
|
|
|
#ifdef CONFIG_CXL_REGION
|
|
bool is_cxl_pmem_region(struct device *dev);
|
|
struct cxl_pmem_region *to_cxl_pmem_region(struct device *dev);
|
|
int cxl_add_to_region(struct cxl_port *root,
|
|
struct cxl_endpoint_decoder *cxled);
|
|
struct cxl_dax_region *to_cxl_dax_region(struct device *dev);
|
|
#else
|
|
static inline bool is_cxl_pmem_region(struct device *dev)
|
|
{
|
|
return false;
|
|
}
|
|
static inline struct cxl_pmem_region *to_cxl_pmem_region(struct device *dev)
|
|
{
|
|
return NULL;
|
|
}
|
|
static inline int cxl_add_to_region(struct cxl_port *root,
|
|
struct cxl_endpoint_decoder *cxled)
|
|
{
|
|
return 0;
|
|
}
|
|
static inline struct cxl_dax_region *to_cxl_dax_region(struct device *dev)
|
|
{
|
|
return NULL;
|
|
}
|
|
#endif
|
|
|
|
/*
|
|
* Unit test builds overrides this to __weak, find the 'strong' version
|
|
* of these symbols in tools/testing/cxl/.
|
|
*/
|
|
#ifndef __mock
|
|
#define __mock static
|
|
#endif
|
|
|
|
#endif /* __CXL_H__ */
|