RISC-V: Probe for unaligned access speed (584ea656) · Commits · EulixOS / Software / Kernel

Documentation/riscv/hwprobe.rst

+5 −6

Original line number	Diff line number	Diff line
		@@ -87,13 +87,12 @@ The following keys are defined:
		emulated via software, either in or below the kernel. These accesses are
		always extremely slow.

		* :c:macro:`RISCV_HWPROBE_MISALIGNED_SLOW`: Misaligned accesses are supported
		in hardware, but are slower than the cooresponding aligned accesses
		sequences.
		* :c:macro:`RISCV_HWPROBE_MISALIGNED_SLOW`: Misaligned accesses are slower
		than equivalent byte accesses. Misaligned accesses may be supported
		directly in hardware, or trapped and emulated by software.

		* :c:macro:`RISCV_HWPROBE_MISALIGNED_FAST`: Misaligned accesses are supported
		in hardware and are faster than the cooresponding aligned accesses
		sequences.
		* :c:macro:`RISCV_HWPROBE_MISALIGNED_FAST`: Misaligned accesses are faster
		than equivalent byte accesses.

		* :c:macro:`RISCV_HWPROBE_MISALIGNED_UNSUPPORTED`: Misaligned accesses are
		not supported at all and will generate a misaligned address fault.

+2 −0

Original line number	Diff line number	Diff line
		@@ -30,4 +30,6 @@ DECLARE_PER_CPU(long, misaligned_access_speed);
		/* Per-cpu ISA extensions. */
		extern struct riscv_isainfo hart_isa[NR_CPUS];

		void check_unaligned_access(int cpu);

		#endif

+1 −0

Original line number	Diff line number	Diff line
		@@ -38,6 +38,7 @@ extra-y += vmlinux.lds
		obj-y += head.o
		obj-y += soc.o
		obj-$(CONFIG_RISCV_ALTERNATIVE) += alternative.o
		obj-y += copy-unaligned.o
		obj-y += cpu.o
		obj-y += cpufeature.o
		obj-y += entry.o

0 → 100644

+71 −0

Original line number	Diff line number	Diff line
		/* SPDX-License-Identifier: GPL-2.0 */
		/* Copyright (C) 2023 Rivos Inc. */

		#include <linux/linkage.h>
		#include <asm/asm.h>

		.text

		/* void __riscv_copy_words_unaligned(void , const void , size_t) */
		/* Performs a memcpy without aligning buffers, using word loads and stores. */
		/* Note: The size is truncated to a multiple of 8 * SZREG */
		ENTRY(__riscv_copy_words_unaligned)
		andi a4, a2, ~((8*SZREG)-1)
		beqz a4, 2f
		add a3, a1, a4
		1:
		REG_L a4, 0(a1)
		REG_L a5, SZREG(a1)
		REG_L a6, 2*SZREG(a1)
		REG_L a7, 3*SZREG(a1)
		REG_L t0, 4*SZREG(a1)
		REG_L t1, 5*SZREG(a1)
		REG_L t2, 6*SZREG(a1)
		REG_L t3, 7*SZREG(a1)
		REG_S a4, 0(a0)
		REG_S a5, SZREG(a0)
		REG_S a6, 2*SZREG(a0)
		REG_S a7, 3*SZREG(a0)
		REG_S t0, 4*SZREG(a0)
		REG_S t1, 5*SZREG(a0)
		REG_S t2, 6*SZREG(a0)
		REG_S t3, 7*SZREG(a0)
		addi a0, a0, 8*SZREG
		addi a1, a1, 8*SZREG
		bltu a1, a3, 1b

		2:
		ret
		END(__riscv_copy_words_unaligned)

		/* void __riscv_copy_bytes_unaligned(void , const void , size_t) */
		/* Performs a memcpy without aligning buffers, using only byte accesses. */
		/* Note: The size is truncated to a multiple of 8 */
		ENTRY(__riscv_copy_bytes_unaligned)
		andi a4, a2, ~(8-1)
		beqz a4, 2f
		add a3, a1, a4
		1:
		lb a4, 0(a1)
		lb a5, 1(a1)
		lb a6, 2(a1)
		lb a7, 3(a1)
		lb t0, 4(a1)
		lb t1, 5(a1)
		lb t2, 6(a1)
		lb t3, 7(a1)
		sb a4, 0(a0)
		sb a5, 1(a0)
		sb a6, 2(a0)
		sb a7, 3(a0)
		sb t0, 4(a0)
		sb t1, 5(a0)
		sb t2, 6(a0)
		sb t3, 7(a0)
		addi a0, a0, 8
		addi a1, a1, 8
		bltu a1, a3, 1b

		2:
		ret
		END(__riscv_copy_bytes_unaligned)

0 → 100644

+13 −0

Original line number	Diff line number	Diff line
		/* SPDX-License-Identifier: GPL-2.0 */
		/*
		* Copyright (C) 2023 Rivos, Inc.
		*/
		#ifndef __RISCV_KERNEL_COPY_UNALIGNED_H
		#define __RISCV_KERNEL_COPY_UNALIGNED_H

		#include <linux/types.h>

		void __riscv_copy_words_unaligned(void dst, const void src, size_t size);
		void __riscv_copy_bytes_unaligned(void dst, const void src, size_t size);

		#endif /* __RISCV_KERNEL_COPY_UNALIGNED_H */