Max Shvetsov | 959be33 | 2021-03-16 14:18:13 +0000 | [diff] [blame] | 1 | /* |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 2 | * Copyright (c) 2021-2023, Arm Limited. All rights reserved. |
Max Shvetsov | 959be33 | 2021-03-16 14:18:13 +0000 | [diff] [blame] | 3 | * |
| 4 | * SPDX-License-Identifier: BSD-3-Clause |
| 5 | */ |
| 6 | |
| 7 | #ifndef SVE_H |
| 8 | #define SVE_H |
| 9 | |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 10 | #include <arch.h> |
Arunachalam Ganapathy | c1136a8 | 2023-04-12 15:24:44 +0100 | [diff] [blame] | 11 | #include <stdlib.h> /* for rand() */ |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 12 | |
Max Shvetsov | 959be33 | 2021-03-16 14:18:13 +0000 | [diff] [blame] | 13 | #define fill_sve_helper(num) "ldr z"#num", [%0, #"#num", MUL VL];" |
| 14 | #define read_sve_helper(num) "str z"#num", [%0, #"#num", MUL VL];" |
| 15 | |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 16 | #define fill_sve_p_helper(num) "ldr p"#num", [%0, #"#num", MUL VL];" |
| 17 | #define read_sve_p_helper(num) "str p"#num", [%0, #"#num", MUL VL];" |
| 18 | |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 19 | /* |
| 20 | * Max. vector length permitted by the architecture: |
| 21 | * SVE: 2048 bits = 256 bytes |
| 22 | */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 23 | #define SVE_VECTOR_LEN_BYTES (256U) |
| 24 | #define SVE_NUM_VECTORS (32U) |
| 25 | |
| 26 | /* Max size of one predicate register is 1/8 of Z register */ |
| 27 | #define SVE_P_REG_LEN_BYTES (SVE_VECTOR_LEN_BYTES / 8U) |
| 28 | #define SVE_NUM_P_REGS (16U) |
| 29 | |
| 30 | /* Max size of one FFR register is 1/8 of Z register */ |
| 31 | #define SVE_FFR_REG_LEN_BYTES (SVE_VECTOR_LEN_BYTES / 8U) |
| 32 | #define SVE_NUM_FFR_REGS (1U) |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 33 | |
Arunachalam Ganapathy | 5270d01 | 2023-04-19 14:53:42 +0100 | [diff] [blame] | 34 | #define SVE_VQ_ARCH_MIN (0U) |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 35 | #define SVE_VQ_ARCH_MAX ((1U << ZCR_EL2_SVE_VL_WIDTH) - 1U) |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 36 | |
| 37 | /* convert SVE VL in bytes to VQ */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 38 | #define SVE_VL_TO_VQ(vl_bytes) (((vl_bytes) >> 4U) - 1U) |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 39 | |
| 40 | /* convert SVE VQ to bits */ |
| 41 | #define SVE_VQ_TO_BITS(vq) (((vq) + 1U) << 7U) |
| 42 | |
Arunachalam Ganapathy | 5270d01 | 2023-04-19 14:53:42 +0100 | [diff] [blame] | 43 | /* convert SVE VQ to bytes */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 44 | #define SVE_VQ_TO_BYTES(vq) (SVE_VQ_TO_BITS(vq) / 8U) |
Arunachalam Ganapathy | 5270d01 | 2023-04-19 14:53:42 +0100 | [diff] [blame] | 45 | |
Arunachalam Ganapathy | c1136a8 | 2023-04-12 15:24:44 +0100 | [diff] [blame] | 46 | /* get a random SVE VQ b/w 0 to SVE_VQ_ARCH_MAX */ |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 47 | #define SVE_GET_RANDOM_VQ (rand() % (SVE_VQ_ARCH_MAX + 1U)) |
Arunachalam Ganapathy | c1136a8 | 2023-04-12 15:24:44 +0100 | [diff] [blame] | 48 | |
Kathleen Capella | c59184c | 2022-08-23 19:09:41 -0400 | [diff] [blame] | 49 | #ifndef __ASSEMBLY__ |
| 50 | |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 51 | typedef uint8_t sve_z_regs_t[SVE_NUM_VECTORS * SVE_VECTOR_LEN_BYTES] |
| 52 | __aligned(16); |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 53 | typedef uint8_t sve_p_regs_t[SVE_NUM_P_REGS * SVE_P_REG_LEN_BYTES] |
| 54 | __aligned(16); |
| 55 | typedef uint8_t sve_ffr_regs_t[SVE_NUM_FFR_REGS * SVE_FFR_REG_LEN_BYTES] |
| 56 | __aligned(16); |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 57 | |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 58 | void sve_config_vq(uint8_t sve_vq); |
| 59 | uint32_t sve_probe_vl(uint8_t sve_max_vq); |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 60 | |
| 61 | void sve_z_regs_write(const sve_z_regs_t *z_regs); |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 62 | void sve_z_regs_write_rand(sve_z_regs_t *z_regs); |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 63 | void sve_z_regs_read(sve_z_regs_t *z_regs); |
Arunachalam Ganapathy | fa05bd9 | 2023-08-30 14:36:53 +0100 | [diff] [blame^] | 64 | uint64_t sve_z_regs_compare(const sve_z_regs_t *s1, const sve_z_regs_t *s2); |
| 65 | |
| 66 | void sve_p_regs_write(const sve_p_regs_t *p_regs); |
| 67 | void sve_p_regs_write_rand(sve_p_regs_t *p_regs); |
| 68 | void sve_p_regs_read(sve_p_regs_t *p_regs); |
| 69 | uint64_t sve_p_regs_compare(const sve_p_regs_t *s1, const sve_p_regs_t *s2); |
| 70 | |
| 71 | void sve_ffr_regs_write(const sve_ffr_regs_t *ffr_regs); |
| 72 | void sve_ffr_regs_write_rand(sve_ffr_regs_t *ffr_regs); |
| 73 | void sve_ffr_regs_read(sve_ffr_regs_t *ffr_regs); |
| 74 | uint64_t sve_ffr_regs_compare(const sve_ffr_regs_t *s1, |
| 75 | const sve_ffr_regs_t *s2); |
Arunachalam Ganapathy | d179ddc | 2023-04-12 10:41:42 +0100 | [diff] [blame] | 76 | |
| 77 | /* Assembly routines */ |
| 78 | bool sve_subtract_arrays_interleaved(int *dst_array, int *src_array1, |
| 79 | int *src_array2, int array_size, |
| 80 | bool (*world_switch_cb)(void)); |
| 81 | |
| 82 | void sve_subtract_arrays(int *dst_array, int *src_array1, int *src_array2, |
| 83 | int array_size); |
Arunachalam Ganapathy | 0bbdc2d | 2023-04-05 15:30:18 +0100 | [diff] [blame] | 84 | |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 85 | #ifdef __aarch64__ |
| 86 | |
| 87 | /* Returns the SVE implemented VL in bytes (constrained by ZCR_EL3.LEN) */ |
Arunachalam Ganapathy | 0358997 | 2023-08-30 11:04:51 +0100 | [diff] [blame] | 88 | static inline uint64_t sve_rdvl_1(void) |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 89 | { |
| 90 | uint64_t vl; |
| 91 | |
| 92 | __asm__ volatile( |
| 93 | ".arch_extension sve\n" |
| 94 | "rdvl %0, #1;" |
| 95 | ".arch_extension nosve\n" |
| 96 | : "=r" (vl) |
| 97 | ); |
| 98 | |
| 99 | return vl; |
| 100 | } |
| 101 | |
| 102 | #endif /* __aarch64__ */ |
Kathleen Capella | c59184c | 2022-08-23 19:09:41 -0400 | [diff] [blame] | 103 | #endif /* __ASSEMBLY__ */ |
Olivier Deprez | 569be40 | 2022-07-08 10:24:39 +0200 | [diff] [blame] | 104 | #endif /* SVE_H */ |