Max Shvetsov | 959be33 | 2021-03-16 14:18:13 +0000 | [diff] [blame] | 1 | /* |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 2 | * Copyright (c) 2021-2023, Arm Limited. All rights reserved. |
Max Shvetsov | 959be33 | 2021-03-16 14:18:13 +0000 | [diff] [blame] | 3 | * |
| 4 | * SPDX-License-Identifier: BSD-3-Clause |
| 5 | */ |
| 6 | |
| 7 | #ifndef SVE_H |
| 8 | #define SVE_H |
| 9 | |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 10 | #include <arch.h> |
Arunachalam Ganapathy | c1136a8 | 2023-04-12 15:24:44 +0100 | [diff] [blame] | 11 | #include <stdlib.h> /* for rand() */ |
Arunachalam Ganapathy | 5b68e20 | 2023-06-06 16:31:19 +0100 | [diff] [blame] | 12 | #include <lib/extensions/sme.h> |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 13 | |
Max Shvetsov | 959be33 | 2021-03-16 14:18:13 +0000 | [diff] [blame] | 14 | #define fill_sve_helper(num) "ldr z"#num", [%0, #"#num", MUL VL];" |
| 15 | #define read_sve_helper(num) "str z"#num", [%0, #"#num", MUL VL];" |
| 16 | |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 17 | #define fill_sve_p_helper(num) "ldr p"#num", [%0, #"#num", MUL VL];" |
| 18 | #define read_sve_p_helper(num) "str p"#num", [%0, #"#num", MUL VL];" |
| 19 | |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 20 | /* |
| 21 | * Max. vector length permitted by the architecture: |
| 22 | * SVE: 2048 bits = 256 bytes |
| 23 | */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 24 | #define SVE_VECTOR_LEN_BYTES (256U) |
| 25 | #define SVE_NUM_VECTORS (32U) |
| 26 | |
| 27 | /* Max size of one predicate register is 1/8 of Z register */ |
| 28 | #define SVE_P_REG_LEN_BYTES (SVE_VECTOR_LEN_BYTES / 8U) |
| 29 | #define SVE_NUM_P_REGS (16U) |
| 30 | |
| 31 | /* Max size of one FFR register is 1/8 of Z register */ |
| 32 | #define SVE_FFR_REG_LEN_BYTES (SVE_VECTOR_LEN_BYTES / 8U) |
| 33 | #define SVE_NUM_FFR_REGS (1U) |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 34 | |
Arunachalam Ganapathy | 5270d01 | 2023-04-19 14:53:42 +0100 | [diff] [blame] | 35 | #define SVE_VQ_ARCH_MIN (0U) |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 36 | #define SVE_VQ_ARCH_MAX ((1U << ZCR_EL2_SVE_VL_WIDTH) - 1U) |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 37 | |
| 38 | /* convert SVE VL in bytes to VQ */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 39 | #define SVE_VL_TO_VQ(vl_bytes) (((vl_bytes) >> 4U) - 1U) |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 40 | |
| 41 | /* convert SVE VQ to bits */ |
| 42 | #define SVE_VQ_TO_BITS(vq) (((vq) + 1U) << 7U) |
| 43 | |
Arunachalam Ganapathy | 5270d01 | 2023-04-19 14:53:42 +0100 | [diff] [blame] | 44 | /* convert SVE VQ to bytes */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 45 | #define SVE_VQ_TO_BYTES(vq) (SVE_VQ_TO_BITS(vq) / 8U) |
Arunachalam Ganapathy | 5270d01 | 2023-04-19 14:53:42 +0100 | [diff] [blame] | 46 | |
Arunachalam Ganapathy | c1136a8 | 2023-04-12 15:24:44 +0100 | [diff] [blame] | 47 | /* get a random SVE VQ b/w 0 to SVE_VQ_ARCH_MAX */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 48 | #define SVE_GET_RANDOM_VQ (rand() % (SVE_VQ_ARCH_MAX + 1U)) |
Arunachalam Ganapathy | c1136a8 | 2023-04-12 15:24:44 +0100 | [diff] [blame] | 49 | |
Kathleen Capella | c59184c | 2022-08-23 19:09:41 -0400 | [diff] [blame] | 50 | #ifndef __ASSEMBLY__ |
| 51 | |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 52 | typedef uint8_t sve_z_regs_t[SVE_NUM_VECTORS * SVE_VECTOR_LEN_BYTES] |
| 53 | __aligned(16); |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 54 | typedef uint8_t sve_p_regs_t[SVE_NUM_P_REGS * SVE_P_REG_LEN_BYTES] |
| 55 | __aligned(16); |
| 56 | typedef uint8_t sve_ffr_regs_t[SVE_NUM_FFR_REGS * SVE_FFR_REG_LEN_BYTES] |
| 57 | __aligned(16); |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 58 | |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 59 | void sve_config_vq(uint8_t sve_vq); |
| 60 | uint32_t sve_probe_vl(uint8_t sve_max_vq); |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 61 | |
| 62 | void sve_z_regs_write(const sve_z_regs_t *z_regs); |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 63 | void sve_z_regs_write_rand(sve_z_regs_t *z_regs); |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 64 | void sve_z_regs_read(sve_z_regs_t *z_regs); |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame] | 65 | uint64_t sve_z_regs_compare(const sve_z_regs_t *s1, const sve_z_regs_t *s2); |
| 66 | |
| 67 | void sve_p_regs_write(const sve_p_regs_t *p_regs); |
| 68 | void sve_p_regs_write_rand(sve_p_regs_t *p_regs); |
| 69 | void sve_p_regs_read(sve_p_regs_t *p_regs); |
| 70 | uint64_t sve_p_regs_compare(const sve_p_regs_t *s1, const sve_p_regs_t *s2); |
| 71 | |
| 72 | void sve_ffr_regs_write(const sve_ffr_regs_t *ffr_regs); |
| 73 | void sve_ffr_regs_write_rand(sve_ffr_regs_t *ffr_regs); |
| 74 | void sve_ffr_regs_read(sve_ffr_regs_t *ffr_regs); |
| 75 | uint64_t sve_ffr_regs_compare(const sve_ffr_regs_t *s1, |
| 76 | const sve_ffr_regs_t *s2); |
Arunachalam Ganapathy | d179ddc | 2023-04-12 10:41:42 +0100 | [diff] [blame] | 77 | |
| 78 | /* Assembly routines */ |
| 79 | bool sve_subtract_arrays_interleaved(int *dst_array, int *src_array1, |
| 80 | int *src_array2, int array_size, |
| 81 | bool (*world_switch_cb)(void)); |
| 82 | |
| 83 | void sve_subtract_arrays(int *dst_array, int *src_array1, int *src_array2, |
| 84 | int array_size); |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 85 | |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 86 | #ifdef __aarch64__ |
| 87 | |
| 88 | /* Returns the SVE implemented VL in bytes (constrained by ZCR_EL3.LEN) */ |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 89 | static inline uint64_t sve_rdvl_1(void) |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 90 | { |
| 91 | uint64_t vl; |
| 92 | |
| 93 | __asm__ volatile( |
| 94 | ".arch_extension sve\n" |
| 95 | "rdvl %0, #1;" |
| 96 | ".arch_extension nosve\n" |
| 97 | : "=r" (vl) |
| 98 | ); |
| 99 | |
| 100 | return vl; |
| 101 | } |
| 102 | |
| 103 | #endif /* __aarch64__ */ |
Kathleen Capella | c59184c | 2022-08-23 19:09:41 -0400 | [diff] [blame] | 104 | #endif /* __ASSEMBLY__ */ |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 105 | #endif /* SVE_H */ |