forked from mirrors/linux
		
	Merge patch series "riscv: add SBI FWFT misaligned exception delegation support"
Clément Léger <cleger@rivosinc.com> says:
The SBI Firmware Feature extension allows the S-mode to request some
specific features (either hardware or software) to be enabled. This
series uses this extension to request misaligned access exception
delegation to S-mode in order to let the kernel handle it. It also adds
support for the KVM FWFT SBI extension based on the misaligned access
handling infrastructure.
FWFT SBI extension is part of the SBI V3.0 specifications [1]. It can be
tested using the qemu provided at [2] which contains the series from
[3]. Upstream kvm-unit-tests can be used inside kvm to test the correct
delegation of misaligned exceptions. Upstream OpenSBI can be used.
The tests can be run using the kselftest from series [4].
$ qemu-system-riscv64 \
        -cpu rv64,trap-misaligned-access=true,v=true \
        -M virt \
        -m 1024M \
        -bios fw_dynamic.bin \
        -kernel Image
 ...
 # ./misaligned
 TAP version 13
 1..23
 # Starting 23 tests from 1 test cases.
 #  RUN           global.gp_load_lh ...
 #            OK  global.gp_load_lh
 ok 1 global.gp_load_lh
 #  RUN           global.gp_load_lhu ...
 #            OK  global.gp_load_lhu
 ok 2 global.gp_load_lhu
 #  RUN           global.gp_load_lw ...
 #            OK  global.gp_load_lw
 ok 3 global.gp_load_lw
 #  RUN           global.gp_load_lwu ...
 #            OK  global.gp_load_lwu
 ok 4 global.gp_load_lwu
 #  RUN           global.gp_load_ld ...
 #            OK  global.gp_load_ld
 ok 5 global.gp_load_ld
 #  RUN           global.gp_load_c_lw ...
 #            OK  global.gp_load_c_lw
 ok 6 global.gp_load_c_lw
 #  RUN           global.gp_load_c_ld ...
 #            OK  global.gp_load_c_ld
 ok 7 global.gp_load_c_ld
 #  RUN           global.gp_load_c_ldsp ...
 #            OK  global.gp_load_c_ldsp
 ok 8 global.gp_load_c_ldsp
 #  RUN           global.gp_load_sh ...
 #            OK  global.gp_load_sh
 ok 9 global.gp_load_sh
 #  RUN           global.gp_load_sw ...
 #            OK  global.gp_load_sw
 ok 10 global.gp_load_sw
 #  RUN           global.gp_load_sd ...
 #            OK  global.gp_load_sd
 ok 11 global.gp_load_sd
 #  RUN           global.gp_load_c_sw ...
 #            OK  global.gp_load_c_sw
 ok 12 global.gp_load_c_sw
 #  RUN           global.gp_load_c_sd ...
 #            OK  global.gp_load_c_sd
 ok 13 global.gp_load_c_sd
 #  RUN           global.gp_load_c_sdsp ...
 #            OK  global.gp_load_c_sdsp
 ok 14 global.gp_load_c_sdsp
 #  RUN           global.fpu_load_flw ...
 #            OK  global.fpu_load_flw
 ok 15 global.fpu_load_flw
 #  RUN           global.fpu_load_fld ...
 #            OK  global.fpu_load_fld
 ok 16 global.fpu_load_fld
 #  RUN           global.fpu_load_c_fld ...
 #            OK  global.fpu_load_c_fld
 ok 17 global.fpu_load_c_fld
 #  RUN           global.fpu_load_c_fldsp ...
 #            OK  global.fpu_load_c_fldsp
 ok 18 global.fpu_load_c_fldsp
 #  RUN           global.fpu_store_fsw ...
 #            OK  global.fpu_store_fsw
 ok 19 global.fpu_store_fsw
 #  RUN           global.fpu_store_fsd ...
 #            OK  global.fpu_store_fsd
 ok 20 global.fpu_store_fsd
 #  RUN           global.fpu_store_c_fsd ...
 #            OK  global.fpu_store_c_fsd
 ok 21 global.fpu_store_c_fsd
 #  RUN           global.fpu_store_c_fsdsp ...
 #            OK  global.fpu_store_c_fsdsp
 ok 22 global.fpu_store_c_fsdsp
 #  RUN           global.gen_sigbus ...
 [12797.988647] misaligned[618]: unhandled signal 7 code 0x1 at 0x0000000000014dc0 in misaligned[4dc0,10000+76000]
 [12797.988990] CPU: 0 UID: 0 PID: 618 Comm: misaligned Not tainted 6.13.0-rc6-00008-g4ec4468967c9-dirty #51
 [12797.989169] Hardware name: riscv-virtio,qemu (DT)
 [12797.989264] epc : 0000000000014dc0 ra : 0000000000014d00 sp : 00007fffe165d100
 [12797.989407]  gp : 000000000008f6e8 tp : 0000000000095760 t0 : 0000000000000008
 [12797.989544]  t1 : 00000000000965d8 t2 : 000000000008e830 s0 : 00007fffe165d160
 [12797.989692]  s1 : 000000000000001a a0 : 0000000000000000 a1 : 0000000000000002
 [12797.989831]  a2 : 0000000000000000 a3 : 0000000000000000 a4 : ffffffffdeadbeef
 [12797.989964]  a5 : 000000000008ef61 a6 : 626769735f6e0000 a7 : fffffffffffff000
 [12797.990094]  s2 : 0000000000000001 s3 : 00007fffe165d838 s4 : 00007fffe165d848
 [12797.990238]  s5 : 000000000000001a s6 : 0000000000010442 s7 : 0000000000010200
 [12797.990391]  s8 : 000000000000003a s9 : 0000000000094508 s10: 0000000000000000
 [12797.990526]  s11: 0000555567460668 t3 : 00007fffe165d070 t4 : 00000000000965d0
 [12797.990656]  t5 : fefefefefefefeff t6 : 0000000000000073
 [12797.990756] status: 0000000200004020 badaddr: 000000000008ef61 cause: 0000000000000006
 [12797.990911] Code: 8793 8791 3423 fcf4 3783 fc84 c737 dead 0713 eef7 (c398) 0001
 #            OK  global.gen_sigbus
 ok 23 global.gen_sigbus
 # PASSED: 23 / 23 tests passed.
 # Totals: pass:23 fail:0 xfail:0 xpass:0 skip:0 error:0
With kvm-tools:
 # lkvm run -k sbi.flat -m 128
  Info: # lkvm run -k sbi.flat -m 128 -c 1 --name guest-97
  Info: Removed ghost socket file "/root/.lkvm//guest-97.sock".
 ##########################################################################
 #    kvm-unit-tests
 ##########################################################################
 ... [test messages elided]
 PASS: sbi: fwft: FWFT extension probing no error
 PASS: sbi: fwft: get/set reserved feature 0x6 error == SBI_ERR_DENIED
 PASS: sbi: fwft: get/set reserved feature 0x3fffffff error == SBI_ERR_DENIED
 PASS: sbi: fwft: get/set reserved feature 0x80000000 error == SBI_ERR_DENIED
 PASS: sbi: fwft: get/set reserved feature 0xbfffffff error == SBI_ERR_DENIED
 PASS: sbi: fwft: misaligned_deleg: Get misaligned deleg feature no error
 PASS: sbi: fwft: misaligned_deleg: Set misaligned deleg feature invalid value error
 PASS: sbi: fwft: misaligned_deleg: Set misaligned deleg feature invalid value error
 PASS: sbi: fwft: misaligned_deleg: Set misaligned deleg feature value no error
 PASS: sbi: fwft: misaligned_deleg: Set misaligned deleg feature value 0
 PASS: sbi: fwft: misaligned_deleg: Set misaligned deleg feature value no error
 PASS: sbi: fwft: misaligned_deleg: Set misaligned deleg feature value 1
 PASS: sbi: fwft: misaligned_deleg: Verify misaligned load exception trap in supervisor
 SUMMARY: 50 tests, 2 unexpected failures, 12 skipped
This series is available at [5].
[Palmer: slight commit text modification, as SBI-3.0 is merged now.
Also drop the KVM patches, as they're too late.]
* b4-shazam-merge:
  riscv: misaligned: add a function to check misalign trap delegability
  riscv: misaligned: move emulated access uniformity check in a function
  riscv: misaligned: declare misaligned_access_speed under CONFIG_RISCV_MISALIGNED
  riscv: misaligned: use on_each_cpu() for scalar misaligned access probing
  riscv: misaligned: request misaligned exception from SBI
  riscv: sbi: add SBI FWFT extension calls
  riscv: sbi: add FWFT extension interface
  riscv: sbi: add new SBI error mappings
  riscv: sbi: remove useless parenthesis
  riscv: sbi: add Firmware Feature (FWFT) SBI extensions definitions
Link: https://lore.kernel.org/r/20250523101932.1594077-1-cleger@rivosinc.com
Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com>
			
			
This commit is contained in:
		
						commit
						51f1b16367
					
				
					 5 changed files with 257 additions and 18 deletions
				
			
		|  | @ -67,11 +67,11 @@ void __init riscv_user_isa_enable(void); | |||
| 	_RISCV_ISA_EXT_DATA(_name, _id, _sub_exts, ARRAY_SIZE(_sub_exts), _validate) | ||||
| 
 | ||||
| bool __init check_unaligned_access_emulated_all_cpus(void); | ||||
| void unaligned_access_init(void); | ||||
| int cpu_online_unaligned_access_init(unsigned int cpu); | ||||
| #if defined(CONFIG_RISCV_SCALAR_MISALIGNED) | ||||
| void check_unaligned_access_emulated(struct work_struct *work __always_unused); | ||||
| void unaligned_emulation_finish(void); | ||||
| bool unaligned_ctl_available(void); | ||||
| DECLARE_PER_CPU(long, misaligned_access_speed); | ||||
| #else | ||||
| static inline bool unaligned_ctl_available(void) | ||||
| { | ||||
|  | @ -79,6 +79,16 @@ static inline bool unaligned_ctl_available(void) | |||
| } | ||||
| #endif | ||||
| 
 | ||||
| #if defined(CONFIG_RISCV_MISALIGNED) | ||||
| DECLARE_PER_CPU(long, misaligned_access_speed); | ||||
| bool misaligned_traps_can_delegate(void); | ||||
| #else | ||||
| static inline bool misaligned_traps_can_delegate(void) | ||||
| { | ||||
| 	return false; | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| bool __init check_vector_unaligned_access_emulated_all_cpus(void); | ||||
| #if defined(CONFIG_RISCV_VECTOR_MISALIGNED) | ||||
| void check_vector_unaligned_access_emulated(struct work_struct *work __always_unused); | ||||
|  |  | |||
|  | @ -35,6 +35,7 @@ enum sbi_ext_id { | |||
| 	SBI_EXT_DBCN = 0x4442434E, | ||||
| 	SBI_EXT_STA = 0x535441, | ||||
| 	SBI_EXT_NACL = 0x4E41434C, | ||||
| 	SBI_EXT_FWFT = 0x46574654, | ||||
| 
 | ||||
| 	/* Experimentals extensions must lie within this range */ | ||||
| 	SBI_EXT_EXPERIMENTAL_START = 0x08000000, | ||||
|  | @ -402,6 +403,33 @@ enum sbi_ext_nacl_feature { | |||
| #define SBI_NACL_SHMEM_SRET_X(__i)		((__riscv_xlen / 8) * (__i)) | ||||
| #define SBI_NACL_SHMEM_SRET_X_LAST		31 | ||||
| 
 | ||||
| /* SBI function IDs for FW feature extension */ | ||||
| #define SBI_EXT_FWFT_SET		0x0 | ||||
| #define SBI_EXT_FWFT_GET		0x1 | ||||
| 
 | ||||
| enum sbi_fwft_feature_t { | ||||
| 	SBI_FWFT_MISALIGNED_EXC_DELEG		= 0x0, | ||||
| 	SBI_FWFT_LANDING_PAD			= 0x1, | ||||
| 	SBI_FWFT_SHADOW_STACK			= 0x2, | ||||
| 	SBI_FWFT_DOUBLE_TRAP			= 0x3, | ||||
| 	SBI_FWFT_PTE_AD_HW_UPDATING		= 0x4, | ||||
| 	SBI_FWFT_POINTER_MASKING_PMLEN		= 0x5, | ||||
| 	SBI_FWFT_LOCAL_RESERVED_START		= 0x6, | ||||
| 	SBI_FWFT_LOCAL_RESERVED_END		= 0x3fffffff, | ||||
| 	SBI_FWFT_LOCAL_PLATFORM_START		= 0x40000000, | ||||
| 	SBI_FWFT_LOCAL_PLATFORM_END		= 0x7fffffff, | ||||
| 
 | ||||
| 	SBI_FWFT_GLOBAL_RESERVED_START		= 0x80000000, | ||||
| 	SBI_FWFT_GLOBAL_RESERVED_END		= 0xbfffffff, | ||||
| 	SBI_FWFT_GLOBAL_PLATFORM_START		= 0xc0000000, | ||||
| 	SBI_FWFT_GLOBAL_PLATFORM_END		= 0xffffffff, | ||||
| }; | ||||
| 
 | ||||
| #define SBI_FWFT_PLATFORM_FEATURE_BIT		BIT(30) | ||||
| #define SBI_FWFT_GLOBAL_FEATURE_BIT		BIT(31) | ||||
| 
 | ||||
| #define SBI_FWFT_SET_FLAG_LOCK			BIT(0) | ||||
| 
 | ||||
| /* SBI spec version fields */ | ||||
| #define SBI_SPEC_VERSION_DEFAULT	0x1 | ||||
| #define SBI_SPEC_VERSION_MAJOR_SHIFT	24 | ||||
|  | @ -419,6 +447,11 @@ enum sbi_ext_nacl_feature { | |||
| #define SBI_ERR_ALREADY_STARTED -7 | ||||
| #define SBI_ERR_ALREADY_STOPPED -8 | ||||
| #define SBI_ERR_NO_SHMEM	-9 | ||||
| #define SBI_ERR_INVALID_STATE	-10 | ||||
| #define SBI_ERR_BAD_RANGE	-11 | ||||
| #define SBI_ERR_TIMEOUT		-12 | ||||
| #define SBI_ERR_IO		-13 | ||||
| #define SBI_ERR_DENIED_LOCKED	-14 | ||||
| 
 | ||||
| extern unsigned long sbi_spec_version; | ||||
| struct sbiret { | ||||
|  | @ -470,6 +503,23 @@ int sbi_remote_hfence_vvma_asid(const struct cpumask *cpu_mask, | |||
| 				unsigned long asid); | ||||
| long sbi_probe_extension(int ext); | ||||
| 
 | ||||
| int sbi_fwft_set(u32 feature, unsigned long value, unsigned long flags); | ||||
| int sbi_fwft_set_cpumask(const cpumask_t *mask, u32 feature, | ||||
| 			 unsigned long value, unsigned long flags); | ||||
| /**
 | ||||
|  * sbi_fwft_set_online_cpus() - Set a feature on all online cpus | ||||
|  * @feature: The feature to be set | ||||
|  * @value: The feature value to be set | ||||
|  * @flags: FWFT feature set flags | ||||
|  * | ||||
|  * Return: 0 on success, appropriate linux error code otherwise. | ||||
|  */ | ||||
| static inline int sbi_fwft_set_online_cpus(u32 feature, unsigned long value, | ||||
| 					   unsigned long flags) | ||||
| { | ||||
| 	return sbi_fwft_set_cpumask(cpu_online_mask, feature, value, flags); | ||||
| } | ||||
| 
 | ||||
| /* Check if current SBI specification version is 0.1 or not */ | ||||
| static inline int sbi_spec_is_0_1(void) | ||||
| { | ||||
|  | @ -503,11 +553,21 @@ static inline int sbi_err_map_linux_errno(int err) | |||
| 	case SBI_SUCCESS: | ||||
| 		return 0; | ||||
| 	case SBI_ERR_DENIED: | ||||
| 	case SBI_ERR_DENIED_LOCKED: | ||||
| 		return -EPERM; | ||||
| 	case SBI_ERR_INVALID_PARAM: | ||||
| 	case SBI_ERR_INVALID_STATE: | ||||
| 		return -EINVAL; | ||||
| 	case SBI_ERR_BAD_RANGE: | ||||
| 		return -ERANGE; | ||||
| 	case SBI_ERR_INVALID_ADDRESS: | ||||
| 		return -EFAULT; | ||||
| 	case SBI_ERR_NO_SHMEM: | ||||
| 		return -ENOMEM; | ||||
| 	case SBI_ERR_TIMEOUT: | ||||
| 		return -ETIMEDOUT; | ||||
| 	case SBI_ERR_IO: | ||||
| 		return -EIO; | ||||
| 	case SBI_ERR_NOT_SUPPORTED: | ||||
| 	case SBI_ERR_FAILURE: | ||||
| 	default: | ||||
|  |  | |||
|  | @ -299,6 +299,76 @@ static int __sbi_rfence_v02(int fid, const struct cpumask *cpu_mask, | |||
| 	return 0; | ||||
| } | ||||
| 
 | ||||
| static bool sbi_fwft_supported; | ||||
| 
 | ||||
| struct fwft_set_req { | ||||
| 	u32 feature; | ||||
| 	unsigned long value; | ||||
| 	unsigned long flags; | ||||
| 	atomic_t error; | ||||
| }; | ||||
| 
 | ||||
| static void cpu_sbi_fwft_set(void *arg) | ||||
| { | ||||
| 	struct fwft_set_req *req = arg; | ||||
| 	int ret; | ||||
| 
 | ||||
| 	ret = sbi_fwft_set(req->feature, req->value, req->flags); | ||||
| 	if (ret) | ||||
| 		atomic_set(&req->error, ret); | ||||
| } | ||||
| 
 | ||||
| /**
 | ||||
|  * sbi_fwft_set() - Set a feature on the local hart | ||||
|  * @feature: The feature ID to be set | ||||
|  * @value: The feature value to be set | ||||
|  * @flags: FWFT feature set flags | ||||
|  * | ||||
|  * Return: 0 on success, appropriate linux error code otherwise. | ||||
|  */ | ||||
| int sbi_fwft_set(u32 feature, unsigned long value, unsigned long flags) | ||||
| { | ||||
| 	struct sbiret ret; | ||||
| 
 | ||||
| 	if (!sbi_fwft_supported) | ||||
| 		return -EOPNOTSUPP; | ||||
| 
 | ||||
| 	ret = sbi_ecall(SBI_EXT_FWFT, SBI_EXT_FWFT_SET, | ||||
| 			feature, value, flags, 0, 0, 0); | ||||
| 
 | ||||
| 	return sbi_err_map_linux_errno(ret.error); | ||||
| } | ||||
| 
 | ||||
| /**
 | ||||
|  * sbi_fwft_set_cpumask() - Set a feature for the specified cpumask | ||||
|  * @mask: CPU mask of cpus that need the feature to be set | ||||
|  * @feature: The feature ID to be set | ||||
|  * @value: The feature value to be set | ||||
|  * @flags: FWFT feature set flags | ||||
|  * | ||||
|  * Return: 0 on success, appropriate linux error code otherwise. | ||||
|  */ | ||||
| int sbi_fwft_set_cpumask(const cpumask_t *mask, u32 feature, | ||||
| 			       unsigned long value, unsigned long flags) | ||||
| { | ||||
| 	struct fwft_set_req req = { | ||||
| 		.feature = feature, | ||||
| 		.value = value, | ||||
| 		.flags = flags, | ||||
| 		.error = ATOMIC_INIT(0), | ||||
| 	}; | ||||
| 
 | ||||
| 	if (!sbi_fwft_supported) | ||||
| 		return -EOPNOTSUPP; | ||||
| 
 | ||||
| 	if (feature & SBI_FWFT_GLOBAL_FEATURE_BIT) | ||||
| 		return -EINVAL; | ||||
| 
 | ||||
| 	on_each_cpu_mask(mask, cpu_sbi_fwft_set, &req, 1); | ||||
| 
 | ||||
| 	return atomic_read(&req.error); | ||||
| } | ||||
| 
 | ||||
| /**
 | ||||
|  * sbi_set_timer() - Program the timer for next timer event. | ||||
|  * @stime_value: The value after which next timer event should fire. | ||||
|  | @ -609,7 +679,7 @@ void __init sbi_init(void) | |||
| 		} else { | ||||
| 			__sbi_rfence	= __sbi_rfence_v01; | ||||
| 		} | ||||
| 		if ((sbi_spec_version >= sbi_mk_version(0, 3)) && | ||||
| 		if (sbi_spec_version >= sbi_mk_version(0, 3) && | ||||
| 		    sbi_probe_extension(SBI_EXT_SRST)) { | ||||
| 			pr_info("SBI SRST extension detected\n"); | ||||
| 			pm_power_off = sbi_srst_power_off; | ||||
|  | @ -617,11 +687,16 @@ void __init sbi_init(void) | |||
| 			sbi_srst_reboot_nb.priority = 192; | ||||
| 			register_restart_handler(&sbi_srst_reboot_nb); | ||||
| 		} | ||||
| 		if ((sbi_spec_version >= sbi_mk_version(2, 0)) && | ||||
| 		    (sbi_probe_extension(SBI_EXT_DBCN) > 0)) { | ||||
| 		if (sbi_spec_version >= sbi_mk_version(2, 0) && | ||||
| 		    sbi_probe_extension(SBI_EXT_DBCN) > 0) { | ||||
| 			pr_info("SBI DBCN extension detected\n"); | ||||
| 			sbi_debug_console_available = true; | ||||
| 		} | ||||
| 		if (sbi_spec_version >= sbi_mk_version(3, 0) && | ||||
| 		    sbi_probe_extension(SBI_EXT_FWFT)) { | ||||
| 			pr_info("SBI FWFT extension detected\n"); | ||||
| 			sbi_fwft_supported = true; | ||||
| 		} | ||||
| 	} else { | ||||
| 		__sbi_set_timer = __sbi_set_timer_v01; | ||||
| 		__sbi_send_ipi	= __sbi_send_ipi_v01; | ||||
|  |  | |||
|  | @ -16,6 +16,7 @@ | |||
| #include <asm/entry-common.h> | ||||
| #include <asm/hwprobe.h> | ||||
| #include <asm/cpufeature.h> | ||||
| #include <asm/sbi.h> | ||||
| #include <asm/vector.h> | ||||
| 
 | ||||
| #define INSN_MATCH_LB			0x3 | ||||
|  | @ -368,9 +369,7 @@ static int handle_scalar_misaligned_load(struct pt_regs *regs) | |||
| 
 | ||||
| 	perf_sw_event(PERF_COUNT_SW_ALIGNMENT_FAULTS, 1, regs, addr); | ||||
| 
 | ||||
| #ifdef CONFIG_RISCV_PROBE_UNALIGNED_ACCESS | ||||
| 	*this_cpu_ptr(&misaligned_access_speed) = RISCV_HWPROBE_MISALIGNED_SCALAR_EMULATED; | ||||
| #endif | ||||
| 
 | ||||
| 	if (!unaligned_enabled) | ||||
| 		return -1; | ||||
|  | @ -626,6 +625,10 @@ bool __init check_vector_unaligned_access_emulated_all_cpus(void) | |||
| { | ||||
| 	int cpu; | ||||
| 
 | ||||
| 	/*
 | ||||
| 	 * While being documented as very slow, schedule_on_each_cpu() is used since | ||||
| 	 * kernel_vector_begin() expects irqs to be enabled or it will panic() | ||||
| 	 */ | ||||
| 	schedule_on_each_cpu(check_vector_unaligned_access_emulated); | ||||
| 
 | ||||
| 	for_each_online_cpu(cpu) | ||||
|  | @ -642,11 +645,23 @@ bool __init check_vector_unaligned_access_emulated_all_cpus(void) | |||
| } | ||||
| #endif | ||||
| 
 | ||||
| static bool all_cpus_unaligned_scalar_access_emulated(void) | ||||
| { | ||||
| 	int cpu; | ||||
| 
 | ||||
| 	for_each_online_cpu(cpu) | ||||
| 		if (per_cpu(misaligned_access_speed, cpu) != | ||||
| 		    RISCV_HWPROBE_MISALIGNED_SCALAR_EMULATED) | ||||
| 			return false; | ||||
| 
 | ||||
| 	return true; | ||||
| } | ||||
| 
 | ||||
| #ifdef CONFIG_RISCV_SCALAR_MISALIGNED | ||||
| 
 | ||||
| static bool unaligned_ctl __read_mostly; | ||||
| 
 | ||||
| void check_unaligned_access_emulated(struct work_struct *work __always_unused) | ||||
| static void check_unaligned_access_emulated(void *arg __always_unused) | ||||
| { | ||||
| 	int cpu = smp_processor_id(); | ||||
| 	long *mas_ptr = per_cpu_ptr(&misaligned_access_speed, cpu); | ||||
|  | @ -657,6 +672,13 @@ void check_unaligned_access_emulated(struct work_struct *work __always_unused) | |||
| 	__asm__ __volatile__ ( | ||||
| 		"       "REG_L" %[tmp], 1(%[ptr])\n" | ||||
| 		: [tmp] "=r" (tmp_val) : [ptr] "r" (&tmp_var) : "memory"); | ||||
| } | ||||
| 
 | ||||
| static int cpu_online_check_unaligned_access_emulated(unsigned int cpu) | ||||
| { | ||||
| 	long *mas_ptr = per_cpu_ptr(&misaligned_access_speed, cpu); | ||||
| 
 | ||||
| 	check_unaligned_access_emulated(NULL); | ||||
| 
 | ||||
| 	/*
 | ||||
| 	 * If unaligned_ctl is already set, this means that we detected that all | ||||
|  | @ -665,26 +687,23 @@ void check_unaligned_access_emulated(struct work_struct *work __always_unused) | |||
| 	 */ | ||||
| 	if (unlikely(unaligned_ctl && (*mas_ptr != RISCV_HWPROBE_MISALIGNED_SCALAR_EMULATED))) { | ||||
| 		pr_crit("CPU misaligned accesses non homogeneous (expected all emulated)\n"); | ||||
| 		while (true) | ||||
| 			cpu_relax(); | ||||
| 		return -EINVAL; | ||||
| 	} | ||||
| 
 | ||||
| 	return 0; | ||||
| } | ||||
| 
 | ||||
| bool __init check_unaligned_access_emulated_all_cpus(void) | ||||
| { | ||||
| 	int cpu; | ||||
| 
 | ||||
| 	/*
 | ||||
| 	 * We can only support PR_UNALIGN controls if all CPUs have misaligned | ||||
| 	 * accesses emulated since tasks requesting such control can run on any | ||||
| 	 * CPU. | ||||
| 	 */ | ||||
| 	schedule_on_each_cpu(check_unaligned_access_emulated); | ||||
| 	on_each_cpu(check_unaligned_access_emulated, NULL, 1); | ||||
| 
 | ||||
| 	for_each_online_cpu(cpu) | ||||
| 		if (per_cpu(misaligned_access_speed, cpu) | ||||
| 		    != RISCV_HWPROBE_MISALIGNED_SCALAR_EMULATED) | ||||
| 			return false; | ||||
| 	if (!all_cpus_unaligned_scalar_access_emulated()) | ||||
| 		return false; | ||||
| 
 | ||||
| 	unaligned_ctl = true; | ||||
| 	return true; | ||||
|  | @ -699,4 +718,73 @@ bool __init check_unaligned_access_emulated_all_cpus(void) | |||
| { | ||||
| 	return false; | ||||
| } | ||||
| static int cpu_online_check_unaligned_access_emulated(unsigned int cpu) | ||||
| { | ||||
| 	return 0; | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| static bool misaligned_traps_delegated; | ||||
| 
 | ||||
| #ifdef CONFIG_RISCV_SBI | ||||
| 
 | ||||
| static int cpu_online_sbi_unaligned_setup(unsigned int cpu) | ||||
| { | ||||
| 	if (sbi_fwft_set(SBI_FWFT_MISALIGNED_EXC_DELEG, 1, 0) && | ||||
| 	    misaligned_traps_delegated) { | ||||
| 		pr_crit("Misaligned trap delegation non homogeneous (expected delegated)"); | ||||
| 		return -EINVAL; | ||||
| 	} | ||||
| 
 | ||||
| 	return 0; | ||||
| } | ||||
| 
 | ||||
| void __init unaligned_access_init(void) | ||||
| { | ||||
| 	int ret; | ||||
| 
 | ||||
| 	ret = sbi_fwft_set_online_cpus(SBI_FWFT_MISALIGNED_EXC_DELEG, 1, 0); | ||||
| 	if (ret) | ||||
| 		return; | ||||
| 
 | ||||
| 	misaligned_traps_delegated = true; | ||||
| 	pr_info("SBI misaligned access exception delegation ok\n"); | ||||
| 	/*
 | ||||
| 	 * Note that we don't have to take any specific action here, if | ||||
| 	 * the delegation is successful, then | ||||
| 	 * check_unaligned_access_emulated() will verify that indeed the | ||||
| 	 * platform traps on misaligned accesses. | ||||
| 	 */ | ||||
| } | ||||
| #else | ||||
| void __init unaligned_access_init(void) {} | ||||
| 
 | ||||
| static int cpu_online_sbi_unaligned_setup(unsigned int cpu __always_unused) | ||||
| { | ||||
| 	return 0; | ||||
| } | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| int cpu_online_unaligned_access_init(unsigned int cpu) | ||||
| { | ||||
| 	int ret; | ||||
| 
 | ||||
| 	ret = cpu_online_sbi_unaligned_setup(cpu); | ||||
| 	if (ret) | ||||
| 		return ret; | ||||
| 
 | ||||
| 	return cpu_online_check_unaligned_access_emulated(cpu); | ||||
| } | ||||
| 
 | ||||
| bool misaligned_traps_can_delegate(void) | ||||
| { | ||||
| 	/*
 | ||||
| 	 * Either we successfully requested misaligned traps delegation for all | ||||
| 	 * CPUs, or the SBI does not implement the FWFT extension but delegated | ||||
| 	 * the exception by default. | ||||
| 	 */ | ||||
| 	return misaligned_traps_delegated || | ||||
| 	       all_cpus_unaligned_scalar_access_emulated(); | ||||
| } | ||||
| EXPORT_SYMBOL_GPL(misaligned_traps_can_delegate); | ||||
|  |  | |||
|  | @ -236,6 +236,11 @@ arch_initcall_sync(lock_and_set_unaligned_access_static_branch); | |||
| 
 | ||||
| static int riscv_online_cpu(unsigned int cpu) | ||||
| { | ||||
| 	int ret = cpu_online_unaligned_access_init(cpu); | ||||
| 
 | ||||
| 	if (ret) | ||||
| 		return ret; | ||||
| 
 | ||||
| 	/* We are already set since the last check */ | ||||
| 	if (per_cpu(misaligned_access_speed, cpu) != RISCV_HWPROBE_MISALIGNED_SCALAR_UNKNOWN) { | ||||
| 		goto exit; | ||||
|  | @ -248,7 +253,6 @@ static int riscv_online_cpu(unsigned int cpu) | |||
| 	{ | ||||
| 		static struct page *buf; | ||||
| 
 | ||||
| 		check_unaligned_access_emulated(NULL); | ||||
| 		buf = alloc_pages(GFP_KERNEL, MISALIGNED_BUFFER_ORDER); | ||||
| 		if (!buf) { | ||||
| 			pr_warn("Allocation failure, not measuring misaligned performance\n"); | ||||
|  | @ -439,6 +443,8 @@ static int __init check_unaligned_access_all_cpus(void) | |||
| { | ||||
| 	int cpu; | ||||
| 
 | ||||
| 	unaligned_access_init(); | ||||
| 
 | ||||
| 	if (unaligned_scalar_speed_param != RISCV_HWPROBE_MISALIGNED_SCALAR_UNKNOWN) { | ||||
| 		pr_info("scalar unaligned access speed set to '%s' (%lu) by command line\n", | ||||
| 			speed_str[unaligned_scalar_speed_param], unaligned_scalar_speed_param); | ||||
|  |  | |||
		Loading…
	
		Reference in a new issue
	
	 Palmer Dabbelt
						Palmer Dabbelt