123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155 |
- /*
- * Copyright (c) 2006-2022, RT-Thread Development Team
- *
- * SPDX-License-Identifier: Apache-2.0
- *
- * Change Logs:
- * Date Author Notes
- * 2022-10-10 RT-Thread the first version,
- * compatible with riscv-v-spec-1.0
- */
- #ifndef __EXT_CONTEXT_H__
- #define __EXT_CONTEXT_H__
- #ifdef __ASSEMBLY__
- /**
- * extension context maintenance
- */
- #include "cpuport.h"
- #include "encoding.h"
- #include "vector_encoding.h"
- /**
- * ==================================
- * FPU EXTENSION
- * ==================================
- *
- * Byte offsets of the saved floating-point registers f0..f31, measured
- * from fpustatus.f[0] inside fpu_context_t (see the offsetof note on each
- * line). Consecutive slots are 8 bytes apart, so the 32 slots span
- * 256 bytes. The table is only defined when ENABLE_FPU is set.
- *
- * NOTE(review): the 8-byte stride presumably matches 64-bit (double
- * precision) FP registers; fpu_context_t is not visible from this header,
- * so confirm the stride against its definition.
- */
- #ifdef ENABLE_FPU
- #define FPU_CTX_F0_OFF 0 /* offsetof(fpu_context_t, fpustatus.f[0]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F1_OFF 8 /* offsetof(fpu_context_t, fpustatus.f[1]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F2_OFF 16 /* offsetof(fpu_context_t, fpustatus.f[2]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F3_OFF 24 /* offsetof(fpu_context_t, fpustatus.f[3]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F4_OFF 32 /* offsetof(fpu_context_t, fpustatus.f[4]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F5_OFF 40 /* offsetof(fpu_context_t, fpustatus.f[5]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F6_OFF 48 /* offsetof(fpu_context_t, fpustatus.f[6]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F7_OFF 56 /* offsetof(fpu_context_t, fpustatus.f[7]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F8_OFF 64 /* offsetof(fpu_context_t, fpustatus.f[8]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F9_OFF 72 /* offsetof(fpu_context_t, fpustatus.f[9]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F10_OFF 80 /* offsetof(fpu_context_t, fpustatus.f[10]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F11_OFF 88 /* offsetof(fpu_context_t, fpustatus.f[11]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F12_OFF 96 /* offsetof(fpu_context_t, fpustatus.f[12]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F13_OFF 104 /* offsetof(fpu_context_t, fpustatus.f[13]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F14_OFF 112 /* offsetof(fpu_context_t, fpustatus.f[14]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F15_OFF 120 /* offsetof(fpu_context_t, fpustatus.f[15]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F16_OFF 128 /* offsetof(fpu_context_t, fpustatus.f[16]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F17_OFF 136 /* offsetof(fpu_context_t, fpustatus.f[17]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F18_OFF 144 /* offsetof(fpu_context_t, fpustatus.f[18]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F19_OFF 152 /* offsetof(fpu_context_t, fpustatus.f[19]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F20_OFF 160 /* offsetof(fpu_context_t, fpustatus.f[20]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F21_OFF 168 /* offsetof(fpu_context_t, fpustatus.f[21]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F22_OFF 176 /* offsetof(fpu_context_t, fpustatus.f[22]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F23_OFF 184 /* offsetof(fpu_context_t, fpustatus.f[23]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F24_OFF 192 /* offsetof(fpu_context_t, fpustatus.f[24]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F25_OFF 200 /* offsetof(fpu_context_t, fpustatus.f[25]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F26_OFF 208 /* offsetof(fpu_context_t, fpustatus.f[26]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F27_OFF 216 /* offsetof(fpu_context_t, fpustatus.f[27]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F28_OFF 224 /* offsetof(fpu_context_t, fpustatus.f[28]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F29_OFF 232 /* offsetof(fpu_context_t, fpustatus.f[29]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F30_OFF 240 /* offsetof(fpu_context_t, fpustatus.f[30]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #define FPU_CTX_F31_OFF 248 /* offsetof(fpu_context_t, fpustatus.f[31]) - offsetof(fpu_context_t, fpustatus.f[0]) */
- #endif /* ENABLE_FPU */
- /**
- * ==================================
- * VECTOR EXTENSION
- * ==================================
- *
- * Layout of the vector context frame used by SAVE_VECTOR and
- * RESTORE_VECTOR: four REGBYTES-wide slots holding vstart, vtype, vl and
- * vcsr, followed at VEC_FRAME_V0 by the contents of the vector registers.
- * REGBYTES is not defined in this header; it is expected to come from one
- * of the headers included above.
- */
- #ifdef ENABLE_VECTOR
- #define VEC_FRAME_VSTART (0 * REGBYTES) /* slot 0: saved vstart CSR */
- #define VEC_FRAME_VTYPE (1 * REGBYTES) /* slot 1: saved vtype CSR */
- #define VEC_FRAME_VL (2 * REGBYTES) /* slot 2: saved vl CSR */
- #define VEC_FRAME_VCSR (3 * REGBYTES) /* slot 3: saved vcsr CSR */
- #define VEC_FRAME_V0 (4 * REGBYTES) /* start of the vector register data; also the size of the CSR header */
- /**
- * @brief compute the size in bytes of one vector context frame
- *
- * Result is 32 * vlenb + VEC_FRAME_V0: storage for v0-v31 plus the
- * four-slot CSR header that precedes the register data.
- *
- * @param xreg register receiving the frame length; it is the only
- * register this macro writes
- */
- .macro GET_VEC_FRAME_LEN, xreg
- csrr \xreg, vlenb /* bytes held by a single vector register */
- slli \xreg, \xreg, 5 /* times 32: one slot for each of v0-v31 */
- addi \xreg, \xreg, VEC_FRAME_V0 /* plus the CSR header, i.e. 4 * REGBYTES */
- .endm
- /**
- * @brief save vector extension hardware state
- *
- * Writes vstart, vtype, vl and vcsr into the four header slots of the
- * frame, then stores v0-v31 as four groups of eight registers
- * (v0, v8, v16, v24) back to back starting at VEC_FRAME_V0.
- *
- * @param dst register storing bottom of storage block
- *
- * @note t0, t1 and t2 are overwritten. The CSRs are read before
- * VEC_CONFIG_SETVLI runs because that macro reconfigures the vector
- * unit (it is defined outside this file; presumably a vsetvli encoding
- * selecting SEW=8, LMUL=8 -- confirm in vector_encoding.h).
- */
- .macro SAVE_VECTOR, dst
- mv t1, \dst /* t1 = cursor into the frame */
- csrr t0, vstart
- STORE t0, VEC_FRAME_VSTART(t1)
- csrr t0, vtype
- STORE t0, VEC_FRAME_VTYPE(t1)
- csrr t0, vl
- STORE t0, VEC_FRAME_VL(t1)
- csrr t0, vcsr
- STORE t0, VEC_FRAME_VCSR(t1)
- addi t1, t1, VEC_FRAME_V0 /* skip the CSR header; t1 -> register data area */
- // configure the vector unit for byte elements in groups of eight registers;
- // t2 is updated to length of a vector group in bytes
- VEC_CONFIG_SETVLI(t2, x0, VEC_IMM_SEW_8, VEC_IMM_LMUL_8)
- vse8.v v0, (t1) /* group v0-v7 */
- add t1, t1, t2 /* advance by one group */
- vse8.v v8, (t1) /* group v8-v15 */
- add t1, t1, t2
- vse8.v v16, (t1) /* group v16-v23 */
- add t1, t1, t2
- vse8.v v24, (t1) /* group v24-v31 */
- .endm
- /**
- * @brief restore vector extension hardware states
- *
- * Reloads what SAVE_VECTOR stored, in this order:
- *   1. v0-v31, as four groups of eight registers from VEC_FRAME_V0
- *   2. vl and vtype (through VEC_CONFIG_SET_VL_VTYPE)
- *   3. vcsr
- *   4. vstart
- *
- * vstart must be written last: the RISC-V "V" specification states that
- * every vector instruction, vset{i}vl{i} included, resets vstart to zero,
- * so a vstart written before step 2 would be discarded.
- * VEC_CONFIG_SET_VL_VTYPE is defined outside this file; it is expected to
- * expand to a vsetvl-class instruction, since vl and vtype cannot be
- * written in any other way.
- *
- * @param dst register storing bottom of storage block
- *
- * @note t0, t1, t2 and t3 are overwritten.
- */
- .macro RESTORE_VECTOR, dst
- // restore vector registers first since it will modify vector states
- mv t0, \dst /* t0 = frame base, kept across the register reload */
- addi t1, t0, VEC_FRAME_V0 /* t1 = cursor into the register data area */
- // t2 is updated to length of a vector group in bytes
- VEC_CONFIG_SETVLI(t2, x0, VEC_IMM_SEW_8, VEC_IMM_LMUL_8)
- vle8.v v0, (t1) /* group v0-v7 */
- add t1, t1, t2 /* advance by one group */
- vle8.v v8, (t1) /* group v8-v15 */
- add t1, t1, t2
- vle8.v v16, (t1) /* group v16-v23 */
- add t1, t1, t2
- vle8.v v24, (t1) /* group v24-v31 */
- mv t1, t0 /* t1 = frame base again; t0 becomes scratch */
- // vl/vtype before any CSR write: setting them clears vstart
- LOAD t0, VEC_FRAME_VTYPE(t1)
- LOAD t3, VEC_FRAME_VL(t1)
- VEC_CONFIG_SET_VL_VTYPE(t3, t0)
- LOAD t0, VEC_FRAME_VCSR(t1)
- csrw vcsr, t0
- // vstart last, so that no later vector instruction resets it
- LOAD t0, VEC_FRAME_VSTART(t1)
- csrw vstart, t0
- .endm
- #endif /* ENABLE_VECTOR */
- #endif /* __ASSEMBLY__ */
- #endif /* __EXT_CONTEXT_H__ */
|