Zen-based AMD systems report DRAM ECC errors through Unified Memory Controller (UMC) MCA banks. The value provided in MCA_ADDR is a "normalized" address which represents the UMC's view of its managed memory. The normalized address must be translated to a system physical address for software to take action. MI300 systems, uniquely, do not provide a normalized address in MCA_ADDR for DRAM ECC errors. Rather, the "DRAM" address is reported. This value includes identifiers for the bank, row, column, pseudochannel and stack of the memory location. The DRAM address must be converted to a normalized address in order to be further translated to a system physical address. Add helper functions to do the DRAM to normalized translation for MI300 systems. The method is based on the fixed hardware layout of the on-chip memory. [ bp: Massage commit message, decapitalize some, rename function. ] Signed-off-by: Yazen Ghannam <yazen.ghannam@amd.com> Co-developed-by: Muralidhara M K <muralidhara.mk@amd.com> Signed-off-by: Muralidhara M K <muralidhara.mk@amd.com> Signed-off-by: Borislav Petkov (AMD) <bp@alien8.de> Tested-by: Muralidhara M K <muralidhara.mk@amd.com> Link: https://lore.kernel.org/r/20240131165732.88297-1-yazen.ghannam@amd.com
306 lines
7.2 KiB
C
306 lines
7.2 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
/*
|
|
* AMD Address Translation Library
|
|
*
|
|
* internal.h : Helper functions and common defines
|
|
*
|
|
* Copyright (c) 2023, Advanced Micro Devices, Inc.
|
|
* All Rights Reserved.
|
|
*
|
|
* Author: Yazen Ghannam <Yazen.Ghannam@amd.com>
|
|
*/
|
|
|
|
#ifndef __AMD_ATL_INTERNAL_H__
|
|
#define __AMD_ATL_INTERNAL_H__
|
|
|
|
#include <linux/bitfield.h>
|
|
#include <linux/bitops.h>
|
|
#include <linux/ras.h>
|
|
|
|
#include <asm/amd_nb.h>
|
|
|
|
#include "reg_fields.h"
|
|
|
|
/* Maximum possible number of Coherent Stations within a single Data Fabric. */
#define MAX_COH_ST_CHANNELS		32

/* PCI ID for Zen4 Server DF Function 0. */
#define DF_FUNC0_ID_ZEN4_SERVER		0x14AD1022

/* PCI ID for MI300 DF Function 0. */
#define DF_FUNC0_ID_MI300		0x15281022

/* Shift needed for adjusting register values to true values. */
#define DF_DRAM_BASE_LIMIT_LSB		28
#define MI300_DRAM_LIMIT_LSB		20
|
|
|
|
/*
 * Data Fabric (DF) revisions distinguished by this library.
 * UNKNOWN is the zero value, i.e. the state of a zero-initialized config.
 */
enum df_revisions {
	UNKNOWN,
	DF2,
	DF3,
	DF3p5,
	DF4,
	DF4p5,
};
|
|
|
|
/*
 * Interleave modes.
 *
 * These are mapped 1:1 to the hardware values. Special cases, which do not
 * match a raw hardware value, are set at > 0x20.
 */
enum intlv_modes {
	NONE				= 0x00,
	NOHASH_2CHAN			= 0x01,
	NOHASH_4CHAN			= 0x03,
	NOHASH_8CHAN			= 0x05,
	DF3_6CHAN			= 0x06,
	NOHASH_16CHAN			= 0x07,
	NOHASH_32CHAN			= 0x08,
	DF3_COD4_2CHAN_HASH		= 0x0C,
	DF3_COD2_4CHAN_HASH		= 0x0D,
	DF3_COD1_8CHAN_HASH		= 0x0E,
	DF4_NPS4_2CHAN_HASH		= 0x10,
	DF4_NPS2_4CHAN_HASH		= 0x11,
	DF4_NPS1_8CHAN_HASH		= 0x12,
	DF4_NPS4_3CHAN_HASH		= 0x13,
	DF4_NPS2_6CHAN_HASH		= 0x14,
	DF4_NPS1_12CHAN_HASH		= 0x15,
	DF4_NPS2_5CHAN_HASH		= 0x16,
	DF4_NPS1_10CHAN_HASH		= 0x17,
	MI3_HASH_8CHAN			= 0x18,
	MI3_HASH_16CHAN			= 0x19,
	MI3_HASH_32CHAN			= 0x1A,
	DF2_2CHAN_HASH			= 0x21,
	/* DF4.5 modes are all IntLvNumChan + 0x20 */
	DF4p5_NPS1_16CHAN_1K_HASH	= 0x2C,
	DF4p5_NPS0_24CHAN_1K_HASH	= 0x2E,
	DF4p5_NPS4_2CHAN_1K_HASH	= 0x30,
	DF4p5_NPS2_4CHAN_1K_HASH	= 0x31,
	DF4p5_NPS1_8CHAN_1K_HASH	= 0x32,
	DF4p5_NPS4_3CHAN_1K_HASH	= 0x33,
	DF4p5_NPS2_6CHAN_1K_HASH	= 0x34,
	DF4p5_NPS1_12CHAN_1K_HASH	= 0x35,
	DF4p5_NPS2_5CHAN_1K_HASH	= 0x36,
	DF4p5_NPS1_10CHAN_1K_HASH	= 0x37,
	DF4p5_NPS4_2CHAN_2K_HASH	= 0x40,
	DF4p5_NPS2_4CHAN_2K_HASH	= 0x41,
	DF4p5_NPS1_8CHAN_2K_HASH	= 0x42,
	DF4p5_NPS1_16CHAN_2K_HASH	= 0x43,
	DF4p5_NPS4_3CHAN_2K_HASH	= 0x44,
	DF4p5_NPS2_6CHAN_2K_HASH	= 0x45,
	DF4p5_NPS1_12CHAN_2K_HASH	= 0x46,
	DF4p5_NPS0_24CHAN_2K_HASH	= 0x47,
	DF4p5_NPS2_5CHAN_2K_HASH	= 0x48,
	DF4p5_NPS1_10CHAN_2K_HASH	= 0x49,
};
|
|
|
|
struct df_flags {
|
|
__u8 legacy_ficaa : 1,
|
|
socket_id_shift_quirk : 1,
|
|
heterogeneous : 1,
|
|
__reserved_0 : 5;
|
|
};
|
|
|
|
struct df_config {
|
|
enum df_revisions rev;
|
|
|
|
/*
|
|
* These masks operate on the 16-bit Coherent Station IDs,
|
|
* e.g. Instance, Fabric, Destination, etc.
|
|
*/
|
|
u16 component_id_mask;
|
|
u16 die_id_mask;
|
|
u16 node_id_mask;
|
|
u16 socket_id_mask;
|
|
|
|
/*
|
|
* Least-significant bit of Node ID portion of the
|
|
* system-wide Coherent Station Fabric ID.
|
|
*/
|
|
u8 node_id_shift;
|
|
|
|
/*
|
|
* Least-significant bit of Die portion of the Node ID.
|
|
* Adjusted to include the Node ID shift in order to apply
|
|
* to the Coherent Station Fabric ID.
|
|
*/
|
|
u8 die_id_shift;
|
|
|
|
/*
|
|
* Least-significant bit of Socket portion of the Node ID.
|
|
* Adjusted to include the Node ID shift in order to apply
|
|
* to the Coherent Station Fabric ID.
|
|
*/
|
|
u8 socket_id_shift;
|
|
|
|
/* Number of DRAM Address maps visible in a Coherent Station. */
|
|
u8 num_coh_st_maps;
|
|
|
|
/* Global flags to handle special cases. */
|
|
struct df_flags flags;
|
|
};
|
|
|
|
extern struct df_config df_cfg;
|
|
|
|
struct dram_addr_map {
|
|
/*
|
|
* Each DRAM Address Map can operate independently
|
|
* in different interleaving modes.
|
|
*/
|
|
enum intlv_modes intlv_mode;
|
|
|
|
/* System-wide number for this address map. */
|
|
u8 num;
|
|
|
|
/* Raw register values */
|
|
u32 base;
|
|
u32 limit;
|
|
u32 ctl;
|
|
u32 intlv;
|
|
|
|
/*
|
|
* Logical to Physical Coherent Station Remapping array
|
|
*
|
|
* Index: Logical Coherent Station Instance ID
|
|
* Value: Physical Coherent Station Instance ID
|
|
*
|
|
* phys_coh_st_inst_id = remap_array[log_coh_st_inst_id]
|
|
*/
|
|
u8 remap_array[MAX_COH_ST_CHANNELS];
|
|
|
|
/*
|
|
* Number of bits covering DRAM Address map 0
|
|
* when interleaving is non-power-of-2.
|
|
*
|
|
* Used only for DF3_6CHAN.
|
|
*/
|
|
u8 np2_bits;
|
|
|
|
/* Position of the 'interleave bit'. */
|
|
u8 intlv_bit_pos;
|
|
/* Number of channels interleaved in this map. */
|
|
u8 num_intlv_chan;
|
|
/* Number of dies interleaved in this map. */
|
|
u8 num_intlv_dies;
|
|
/* Number of sockets interleaved in this map. */
|
|
u8 num_intlv_sockets;
|
|
/*
|
|
* Total number of channels interleaved accounting
|
|
* for die and socket interleaving.
|
|
*/
|
|
u8 total_intlv_chan;
|
|
/* Total bits needed to cover 'total_intlv_chan'. */
|
|
u8 total_intlv_bits;
|
|
};
|
|
|
|
/* Original input values cached for debug printing. */
|
|
struct addr_ctx_inputs {
|
|
u64 norm_addr;
|
|
u8 socket_id;
|
|
u8 die_id;
|
|
u8 coh_st_inst_id;
|
|
};
|
|
|
|
struct addr_ctx {
|
|
u64 ret_addr;
|
|
|
|
struct addr_ctx_inputs inputs;
|
|
struct dram_addr_map map;
|
|
|
|
/* AMD Node ID calculated from Socket and Die IDs. */
|
|
u8 node_id;
|
|
|
|
/*
|
|
* Coherent Station Instance ID
|
|
* Local ID used within a 'node'.
|
|
*/
|
|
u16 inst_id;
|
|
|
|
/*
|
|
* Coherent Station Fabric ID
|
|
* System-wide ID that includes 'node' bits.
|
|
*/
|
|
u16 coh_st_fabric_id;
|
|
};
|
|
|
|
/*
 * Library-internal entry points; the definitions live outside this header.
 * NOTE(review): the groupings below follow the function names only.
 */

/* DF indirect register reads; the value is returned through @lo. */
int df_indirect_read_instance(u16 node, u8 func, u16 reg, u8 instance_id, u32 *lo);
int df_indirect_read_broadcast(u16 node, u8 func, u16 reg, u32 *lo);

/* System discovery and node lookup. */
int get_df_system_info(void);
int determine_node_id(struct addr_ctx *ctx, u8 socket_num, u8 die_num);
int get_addr_hash_mi300(void);

/* Address map lookup for a translation context. */
int get_address_map(struct addr_ctx *ctx);

/* Translation steps operating on a translation context. */
int denormalize_address(struct addr_ctx *ctx);
int dehash_address(struct addr_ctx *ctx);

/* Top-level address conversions. */
unsigned long norm_to_sys_addr(u8 socket_id, u8 die_id, u8 coh_st_inst_id, unsigned long addr);
unsigned long convert_umc_mca_addr_to_sys_addr(struct atl_err *err);
|
|
|
|
/*
|
|
* Make a gap in @data that is @num_bits long starting at @bit_num.
|
|
* e.g. data = 11111111'b
|
|
* bit_num = 3
|
|
* num_bits = 2
|
|
* result = 1111100111'b
|
|
*/
|
|
static inline u64 expand_bits(u8 bit_num, u8 num_bits, u64 data)
|
|
{
|
|
u64 temp1, temp2;
|
|
|
|
if (!num_bits)
|
|
return data;
|
|
|
|
if (!bit_num) {
|
|
WARN_ON_ONCE(num_bits >= BITS_PER_LONG);
|
|
return data << num_bits;
|
|
}
|
|
|
|
WARN_ON_ONCE(bit_num >= BITS_PER_LONG);
|
|
|
|
temp1 = data & GENMASK_ULL(bit_num - 1, 0);
|
|
|
|
temp2 = data & GENMASK_ULL(63, bit_num);
|
|
temp2 <<= num_bits;
|
|
|
|
return temp1 | temp2;
|
|
}
|
|
|
|
/*
|
|
* Remove bits in @data between @low_bit and @high_bit inclusive.
|
|
* e.g. data = XXXYYZZZ'b
|
|
* low_bit = 3
|
|
* high_bit = 4
|
|
* result = XXXZZZ'b
|
|
*/
|
|
static inline u64 remove_bits(u8 low_bit, u8 high_bit, u64 data)
|
|
{
|
|
u64 temp1, temp2;
|
|
|
|
WARN_ON_ONCE(high_bit >= BITS_PER_LONG);
|
|
WARN_ON_ONCE(low_bit >= BITS_PER_LONG);
|
|
WARN_ON_ONCE(low_bit > high_bit);
|
|
|
|
if (!low_bit)
|
|
return data >> (high_bit++);
|
|
|
|
temp1 = GENMASK_ULL(low_bit - 1, 0) & data;
|
|
temp2 = GENMASK_ULL(63, high_bit + 1) & data;
|
|
temp2 >>= high_bit - low_bit + 1;
|
|
|
|
return temp1 | temp2;
|
|
}
|
|
|
|
/*
 * Debug print prefixed with the original inputs cached in @ctx
 * (socket, die, Coherent Station instance and normalized address).
 * @fmt and any further arguments are appended after the prefix.
 */
#define atl_debug(ctx, fmt, arg...) \
	pr_debug("socket_id=%u die_id=%u coh_st_inst_id=%u norm_addr=0x%016llx: " fmt,\
		 (ctx)->inputs.socket_id, (ctx)->inputs.die_id,\
		 (ctx)->inputs.coh_st_inst_id, (ctx)->inputs.norm_addr, ##arg)
|
|
|
|
static inline void atl_debug_on_bad_df_rev(void)
|
|
{
|
|
pr_debug("Unrecognized DF rev: %u", df_cfg.rev);
|
|
}
|
|
|
|
static inline void atl_debug_on_bad_intlv_mode(struct addr_ctx *ctx)
|
|
{
|
|
atl_debug(ctx, "Unrecognized interleave mode: %u", ctx->map.intlv_mode);
|
|
}
|
|
|
|
#endif /* __AMD_ATL_INTERNAL_H__ */
|