mirror of
				https://github.com/torvalds/linux.git
				synced 2025-11-04 10:40:15 +02:00 
			
		
		
		
	drm/amd/include: Add amd cper header
AMD uses the Common Platform Error Record (CPER) format to report all GPU hardware errors.

v2: add program attribute

Signed-off-by: Hawking Zhang <Hawking.Zhang@amd.com>
Signed-off-by: Xiang Liu <xiang.liu@amd.com>
Reviewed-by: Tao Zhou <tao.zhou1@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
This commit is contained in:
		
							parent
							
								
									2012aff981
								
							
						
					
					
						commit
						523b69c654
					
				
					 1 changed files with 269 additions and 0 deletions
				
			
		
							
								
								
									
										269
									
								
								drivers/gpu/drm/amd/include/amd_cper.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										269
									
								
								drivers/gpu/drm/amd/include/amd_cper.h
									
									
									
									
									
										Normal file
									
								
							| 
						 | 
				
			
			@ -0,0 +1,269 @@
 | 
			
		|||
/* SPDX-License-Identifier: GPL-2.0 */
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright 2025 Advanced Micro Devices, Inc.
 | 
			
		||||
 *
 | 
			
		||||
 * Permission is hereby granted, free of charge, to any person obtaining a
 | 
			
		||||
 * copy of this software and associated documentation files (the "Software"),
 | 
			
		||||
 * to deal in the Software without restriction, including without limitation
 | 
			
		||||
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 | 
			
		||||
 * and/or sell copies of the Software, and to permit persons to whom the
 | 
			
		||||
 * Software is furnished to do so, subject to the following conditions:
 | 
			
		||||
 *
 | 
			
		||||
 * The above copyright notice and this permission notice shall be included in
 | 
			
		||||
 * all copies or substantial portions of the Software.
 | 
			
		||||
 *
 | 
			
		||||
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 | 
			
		||||
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 | 
			
		||||
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 | 
			
		||||
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 | 
			
		||||
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 | 
			
		||||
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 | 
			
		||||
 * OTHER DEALINGS IN THE SOFTWARE.
 | 
			
		||||
 *
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __AMD_CPER_H__
 | 
			
		||||
#define __AMD_CPER_H__
 | 
			
		||||
 | 
			
		||||
#include <linux/uuid.h>
 | 
			
		||||
 | 
			
		||||
/*
 * Revision constants. The section-descriptor fields revision_minor and
 * revision_major in struct cper_sec_desc are documented as taking
 * CPER_SEC_MINOR_REV_1 and CPER_SEC_MAJOR_REV_22.
 * NOTE(review): CPER_HDR_REV_1 is presumably the value for
 * struct cper_hdr.revision - confirm against the code that fills the header.
 */
#define CPER_HDR_REV_1          (0x100)
#define CPER_SEC_MINOR_REV_1    (0x01)
#define CPER_SEC_MAJOR_REV_22   (0x22)
/* Length of the msg[] array in struct cper_sec_crashdump_body_boot. */
#define CPER_MAX_OAM_COUNT      (8)

/*
 * NOTE(review): presumably the values stored in the reg_ctx_type fields of
 * the crashdump bodies - confirm against the users of this header.
 */
#define CPER_CTX_TYPE_CRASH     (1)
#define CPER_CTX_TYPE_BOOT      (9)

/*
 * NOTE(review): presumably copied into struct cper_hdr.creator_id (a
 * 16-byte field) - confirm against the users of this header.
 */
#define CPER_CREATOR_ID_AMDGPU	"amdgpu"
 | 
			
		||||
 | 
			
		||||
/*
 * GUID constants, each built with GUID_INIT() from <linux/uuid.h>.
 *
 * CPER_NOTIFY_MCE and CPER_NOTIFY_CMC: struct cper_hdr.notify_type is
 * commented as "CMC, MCE".
 */
#define CPER_NOTIFY_MCE                                               \
	GUID_INIT(0xE8F56FFE, 0x919C, 0x4cc5, 0xBA, 0x88, 0x65, 0xAB, \
		  0xE1, 0x49, 0x13, 0xBB)
#define CPER_NOTIFY_CMC                                               \
	GUID_INIT(0x2DCE8BB1, 0xBDD7, 0x450e, 0xB9, 0xAD, 0x9C, 0xF4, \
		  0xEB, 0xD4, 0xF8, 0x90)
/*
 * NOTE(review): BOOT_TYPE carries no CPER_/AMD_ prefix; where it is stored
 * is not visible in this header - confirm against the users.
 */
#define BOOT_TYPE                                                     \
	GUID_INIT(0x3D61A466, 0xAB40, 0x409a, 0xA6, 0x98, 0xF3, 0x62, \
		  0xD4, 0x64, 0xB3, 0x8F)

/*
 * AMD_CRASHDUMP and AMD_GPU_NONSTANDARD_ERROR share their first three
 * fields (0x32AC0C78, 0x2623, 0x48F6) and differ only in the trailing
 * eight bytes.
 * NOTE(review): these and PROC_ERR_SECTION_TYPE are presumably values for
 * struct cper_sec_desc.sec_type - confirm against the users.
 */
#define AMD_CRASHDUMP                                                 \
	GUID_INIT(0x32AC0C78, 0x2623, 0x48F6, 0xB0, 0xD0, 0x73, 0x65, \
		  0x72, 0x5F, 0xD6, 0xAE)
#define AMD_GPU_NONSTANDARD_ERROR                                     \
	GUID_INIT(0x32AC0C78, 0x2623, 0x48F6, 0x81, 0xA2, 0xAC, 0x69, \
		  0x17, 0x80, 0x55, 0x1D)
#define PROC_ERR_SECTION_TYPE                                         \
	GUID_INIT(0xDC3EA0B0, 0xA144, 0x4797, 0xB9, 0x5B, 0x53, 0xFA, \
		  0x24, 0x2B, 0x6E, 0x1D)
 | 
			
		||||
 | 
			
		||||
/*
 * Severity codes. This enum is the type of struct cper_hdr.error_severity
 * and of struct cper_sec_desc.severity.
 */
enum cper_error_severity {
	CPER_SEV_NON_FATAL_UNCORRECTED = 0,
	CPER_SEV_FATAL                 = 1,
	CPER_SEV_NON_FATAL_CORRECTED   = 2,
	/* Equals the number of severities listed above. */
	CPER_SEV_NUM                   = 3,

	/* NOTE(review): the meaning of value 10 is not visible in this header. */
	CPER_SEV_UNUSED = 10,
};
 | 
			
		||||
 | 
			
		||||
/*
 * Indices of ACA register words. Every register has a _LO and a _HI entry
 * at consecutive indices.
 *
 * CPER_ACA_REG_COUNT is the length of the reg_dump[] array of uint32_t in
 * struct cper_sec_nonstd_err_ctx; it is larger than the 14 indices named
 * here.
 * NOTE(review): presumably these values index reg_dump[] - confirm against
 * the code that fills it.
 */
enum cper_aca_reg {
	CPER_ACA_REG_CTL_LO    = 0,
	CPER_ACA_REG_CTL_HI    = 1,
	CPER_ACA_REG_STATUS_LO = 2,
	CPER_ACA_REG_STATUS_HI = 3,
	CPER_ACA_REG_ADDR_LO   = 4,
	CPER_ACA_REG_ADDR_HI   = 5,
	CPER_ACA_REG_MISC0_LO  = 6,
	CPER_ACA_REG_MISC0_HI  = 7,
	CPER_ACA_REG_CONFIG_LO = 8,
	CPER_ACA_REG_CONFIG_HI = 9,
	CPER_ACA_REG_IPID_LO   = 10,
	CPER_ACA_REG_IPID_HI   = 11,
	CPER_ACA_REG_SYND_LO   = 12,
	CPER_ACA_REG_SYND_HI   = 13,

	CPER_ACA_REG_COUNT     = 32,
};
 | 
			
		||||
 | 
			
		||||
#pragma pack(push, 1)
 | 
			
		||||
 | 
			
		||||
/*
 * Timestamp split into eight one-byte fields; embedded in struct cper_hdr
 * as its timestamp member.
 * NOTE(review): the encoding of each byte (plain binary vs. BCD) and the
 * meaning of flag are not visible in this header - confirm against the
 * code that fills it.
 */
struct cper_timestamp {
	uint8_t seconds;
	uint8_t minutes;
	uint8_t hours;
	uint8_t flag;
	uint8_t day;
	uint8_t month;
	uint8_t year;
	uint8_t century;
};
 | 
			
		||||
 | 
			
		||||
struct cper_hdr {
 | 
			
		||||
	char                     signature[4];  /* "CPER"  */
 | 
			
		||||
	uint16_t                 revision;
 | 
			
		||||
	uint32_t                 signature_end; /* 0xFFFFFFFF */
 | 
			
		||||
	uint16_t                 sec_cnt;
 | 
			
		||||
	enum cper_error_severity error_severity;
 | 
			
		||||
	union {
 | 
			
		||||
		struct {
 | 
			
		||||
			uint32_t platform_id	: 1;
 | 
			
		||||
			uint32_t timestamp	: 1;
 | 
			
		||||
			uint32_t partition_id	: 1;
 | 
			
		||||
			uint32_t reserved	: 29;
 | 
			
		||||
		} valid_bits;
 | 
			
		||||
		uint32_t valid_mask;
 | 
			
		||||
	};
 | 
			
		||||
	uint32_t		record_length;    /* Total size of CPER Entry */
 | 
			
		||||
	struct cper_timestamp	timestamp;
 | 
			
		||||
	char			platform_id[16];
 | 
			
		||||
	guid_t			partition_id;     /* Reserved */
 | 
			
		||||
	char			creator_id[16];
 | 
			
		||||
	guid_t			notify_type;      /* CMC, MCE */
 | 
			
		||||
	char			record_id[8];     /* Unique CPER Entry ID */
 | 
			
		||||
	uint32_t		flags;            /* Reserved */
 | 
			
		||||
	uint64_t		persistence_info; /* Reserved */
 | 
			
		||||
	uint8_t			reserved[12];     /* Reserved */
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_desc {
 | 
			
		||||
	uint32_t sec_offset;     /* Offset from the start of CPER entry */
 | 
			
		||||
	uint32_t sec_length;
 | 
			
		||||
	uint8_t  revision_minor; /* CPER_SEC_MINOR_REV_1 */
 | 
			
		||||
	uint8_t  revision_major; /* CPER_SEC_MAJOR_REV_22 */
 | 
			
		||||
	union {
 | 
			
		||||
		struct {
 | 
			
		||||
			uint8_t fru_id		: 1;
 | 
			
		||||
			uint8_t fru_text	: 1;
 | 
			
		||||
			uint8_t reserved	: 6;
 | 
			
		||||
		} valid_bits;
 | 
			
		||||
		uint8_t valid_mask;
 | 
			
		||||
	};
 | 
			
		||||
	uint8_t reserved;
 | 
			
		||||
	union {
 | 
			
		||||
		struct {
 | 
			
		||||
			uint32_t primary		: 1;
 | 
			
		||||
			uint32_t reserved1		: 2;
 | 
			
		||||
			uint32_t exceed_err_threshold	: 1;
 | 
			
		||||
			uint32_t latent_err		: 1;
 | 
			
		||||
			uint32_t reserved2		: 27;
 | 
			
		||||
		} flag_bits;
 | 
			
		||||
		uint32_t flag_mask;
 | 
			
		||||
	};
 | 
			
		||||
	guid_t				sec_type;
 | 
			
		||||
	char				fru_id[16];
 | 
			
		||||
	enum cper_error_severity	severity;
 | 
			
		||||
	char				fru_text[20];
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
/*
 * Header part of the non-standard error section (the hdr member of
 * struct cper_sec_nonstd_err).
 */
struct cper_sec_nonstd_err_hdr {
	/*
	 * One 64-bit word, accessible as fields (valid_bits) or as a whole
	 * (valid_mask). apic_id and fw_id share their names with the members
	 * below; err_info_cnt and err_context_cnt are 6-bit fields.
	 * NOTE(review): presumably the two flags mark those members as valid
	 * and the two counts give the number of info/context structures -
	 * confirm.
	 */
	union {
		struct {
			uint64_t apic_id		: 1;
			uint64_t fw_id			: 1;
			uint64_t err_info_cnt		: 6;
			uint64_t err_context_cnt	: 6;
			/*
			 * Explicit padding so the bitfield view spans all 64
			 * bits of valid_mask, like the other bitfield views in
			 * this file. Without it, initialising through
			 * valid_bits would leave the upper bits of valid_mask
			 * unspecified.
			 */
			uint64_t reserved		: 50;
		} valid_bits;
		uint64_t valid_mask;
	};
	uint64_t apic_id;
	char     fw_id[48];
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_nonstd_err_info {
 | 
			
		||||
	guid_t error_type;
 | 
			
		||||
	union {
 | 
			
		||||
		struct {
 | 
			
		||||
			uint64_t ms_chk			: 1;
 | 
			
		||||
			uint64_t target_addr_id		: 1;
 | 
			
		||||
			uint64_t req_id			: 1;
 | 
			
		||||
			uint64_t resp_id		: 1;
 | 
			
		||||
			uint64_t instr_ptr		: 1;
 | 
			
		||||
			uint64_t reserved		: 59;
 | 
			
		||||
		} valid_bits;
 | 
			
		||||
		uint64_t        valid_mask;
 | 
			
		||||
	};
 | 
			
		||||
	union {
 | 
			
		||||
		struct {
 | 
			
		||||
			uint64_t err_type_valid		: 1;
 | 
			
		||||
			uint64_t pcc_valid		: 1;
 | 
			
		||||
			uint64_t uncorr_valid		: 1;
 | 
			
		||||
			uint64_t precise_ip_valid	: 1;
 | 
			
		||||
			uint64_t restartable_ip_valid	: 1;
 | 
			
		||||
			uint64_t overflow_valid		: 1;
 | 
			
		||||
			uint64_t reserved1		: 10;
 | 
			
		||||
			uint64_t err_type		: 2;
 | 
			
		||||
			uint64_t pcc			: 1;
 | 
			
		||||
			uint64_t uncorr			: 1;
 | 
			
		||||
			uint64_t precised_ip		: 1;
 | 
			
		||||
			uint64_t restartable_ip		: 1;
 | 
			
		||||
			uint64_t overflow		: 1;
 | 
			
		||||
			uint64_t reserved2		: 41;
 | 
			
		||||
		} ms_chk_bits;
 | 
			
		||||
		uint64_t ms_chk_mask;
 | 
			
		||||
	};
 | 
			
		||||
	uint64_t target_addr_id;
 | 
			
		||||
	uint64_t req_id;
 | 
			
		||||
	uint64_t resp_id;
 | 
			
		||||
	uint64_t instr_ptr;
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_nonstd_err_ctx {
 | 
			
		||||
	uint16_t reg_ctx_type;
 | 
			
		||||
	uint16_t reg_arr_size;
 | 
			
		||||
	uint32_t msr_addr;
 | 
			
		||||
	uint64_t mm_reg_addr;
 | 
			
		||||
	uint32_t reg_dump[CPER_ACA_REG_COUNT];
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_nonstd_err {
 | 
			
		||||
	struct cper_sec_nonstd_err_hdr  hdr;
 | 
			
		||||
	struct cper_sec_nonstd_err_info info;
 | 
			
		||||
	struct cper_sec_nonstd_err_ctx  ctx;
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
/*
 * Header shared by both crashdump sections (the hdr member of
 * struct cper_sec_crashdump_fatal and struct cper_sec_crashdump_boot).
 * Apart from fw_id, every member is named reserved.
 */
struct cper_sec_crashdump_hdr {
	uint64_t reserved1;
	uint64_t reserved2;
	char     fw_id[48];
	uint64_t reserved3[8];
};
 | 
			
		||||
 | 
			
		||||
/*
 * Register values carried in the fatal crashdump body (the data member of
 * struct cper_sec_crashdump_body_fatal). Each of status, addr, ipid and
 * synd is stored as a _lo / _hi pair of 32-bit words.
 */
struct cper_sec_crashdump_reg_data {
	uint32_t status_lo;
	uint32_t status_hi;
	uint32_t addr_lo;
	uint32_t addr_hi;
	uint32_t ipid_lo;
	uint32_t ipid_hi;
	uint32_t synd_lo;
	uint32_t synd_hi;
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_crashdump_body_fatal {
 | 
			
		||||
	uint16_t                           reg_ctx_type;
 | 
			
		||||
	uint16_t                           reg_arr_size;
 | 
			
		||||
	uint32_t                           reserved1;
 | 
			
		||||
	uint64_t                           reserved2;
 | 
			
		||||
	struct cper_sec_crashdump_reg_data data;
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_crashdump_body_boot {
 | 
			
		||||
	uint16_t reg_ctx_type;
 | 
			
		||||
	uint16_t reg_arr_size;
 | 
			
		||||
	uint32_t reserved1;
 | 
			
		||||
	uint64_t reserved2;
 | 
			
		||||
	uint64_t msg[CPER_MAX_OAM_COUNT];
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_crashdump_fatal {
 | 
			
		||||
	struct cper_sec_crashdump_hdr        hdr;
 | 
			
		||||
	struct cper_sec_crashdump_body_fatal body;
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
struct cper_sec_crashdump_boot {
 | 
			
		||||
	struct cper_sec_crashdump_hdr       hdr;
 | 
			
		||||
	struct cper_sec_crashdump_body_boot body;
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
#pragma pack(pop)
 | 
			
		||||
 | 
			
		||||
#endif
 | 
			
		||||
		Loading…
	
		Reference in a new issue