|
@@ -60,22 +60,22 @@
|
|
.set push
|
|
.set push
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
cfc1 \tmp, fcr31
|
|
cfc1 \tmp, fcr31
|
|
- sdc1 $f0, THREAD_FPR0_LS64(\thread)
|
|
|
|
- sdc1 $f2, THREAD_FPR2_LS64(\thread)
|
|
|
|
- sdc1 $f4, THREAD_FPR4_LS64(\thread)
|
|
|
|
- sdc1 $f6, THREAD_FPR6_LS64(\thread)
|
|
|
|
- sdc1 $f8, THREAD_FPR8_LS64(\thread)
|
|
|
|
- sdc1 $f10, THREAD_FPR10_LS64(\thread)
|
|
|
|
- sdc1 $f12, THREAD_FPR12_LS64(\thread)
|
|
|
|
- sdc1 $f14, THREAD_FPR14_LS64(\thread)
|
|
|
|
- sdc1 $f16, THREAD_FPR16_LS64(\thread)
|
|
|
|
- sdc1 $f18, THREAD_FPR18_LS64(\thread)
|
|
|
|
- sdc1 $f20, THREAD_FPR20_LS64(\thread)
|
|
|
|
- sdc1 $f22, THREAD_FPR22_LS64(\thread)
|
|
|
|
- sdc1 $f24, THREAD_FPR24_LS64(\thread)
|
|
|
|
- sdc1 $f26, THREAD_FPR26_LS64(\thread)
|
|
|
|
- sdc1 $f28, THREAD_FPR28_LS64(\thread)
|
|
|
|
- sdc1 $f30, THREAD_FPR30_LS64(\thread)
|
|
|
|
|
|
+ sdc1 $f0, THREAD_FPR0(\thread)
|
|
|
|
+ sdc1 $f2, THREAD_FPR2(\thread)
|
|
|
|
+ sdc1 $f4, THREAD_FPR4(\thread)
|
|
|
|
+ sdc1 $f6, THREAD_FPR6(\thread)
|
|
|
|
+ sdc1 $f8, THREAD_FPR8(\thread)
|
|
|
|
+ sdc1 $f10, THREAD_FPR10(\thread)
|
|
|
|
+ sdc1 $f12, THREAD_FPR12(\thread)
|
|
|
|
+ sdc1 $f14, THREAD_FPR14(\thread)
|
|
|
|
+ sdc1 $f16, THREAD_FPR16(\thread)
|
|
|
|
+ sdc1 $f18, THREAD_FPR18(\thread)
|
|
|
|
+ sdc1 $f20, THREAD_FPR20(\thread)
|
|
|
|
+ sdc1 $f22, THREAD_FPR22(\thread)
|
|
|
|
+ sdc1 $f24, THREAD_FPR24(\thread)
|
|
|
|
+ sdc1 $f26, THREAD_FPR26(\thread)
|
|
|
|
+ sdc1 $f28, THREAD_FPR28(\thread)
|
|
|
|
+ sdc1 $f30, THREAD_FPR30(\thread)
|
|
sw \tmp, THREAD_FCR31(\thread)
|
|
sw \tmp, THREAD_FCR31(\thread)
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
@@ -84,22 +84,22 @@
|
|
.set push
|
|
.set push
|
|
.set mips64r2
|
|
.set mips64r2
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
- sdc1 $f1, THREAD_FPR1_LS64(\thread)
|
|
|
|
- sdc1 $f3, THREAD_FPR3_LS64(\thread)
|
|
|
|
- sdc1 $f5, THREAD_FPR5_LS64(\thread)
|
|
|
|
- sdc1 $f7, THREAD_FPR7_LS64(\thread)
|
|
|
|
- sdc1 $f9, THREAD_FPR9_LS64(\thread)
|
|
|
|
- sdc1 $f11, THREAD_FPR11_LS64(\thread)
|
|
|
|
- sdc1 $f13, THREAD_FPR13_LS64(\thread)
|
|
|
|
- sdc1 $f15, THREAD_FPR15_LS64(\thread)
|
|
|
|
- sdc1 $f17, THREAD_FPR17_LS64(\thread)
|
|
|
|
- sdc1 $f19, THREAD_FPR19_LS64(\thread)
|
|
|
|
- sdc1 $f21, THREAD_FPR21_LS64(\thread)
|
|
|
|
- sdc1 $f23, THREAD_FPR23_LS64(\thread)
|
|
|
|
- sdc1 $f25, THREAD_FPR25_LS64(\thread)
|
|
|
|
- sdc1 $f27, THREAD_FPR27_LS64(\thread)
|
|
|
|
- sdc1 $f29, THREAD_FPR29_LS64(\thread)
|
|
|
|
- sdc1 $f31, THREAD_FPR31_LS64(\thread)
|
|
|
|
|
|
+ sdc1 $f1, THREAD_FPR1(\thread)
|
|
|
|
+ sdc1 $f3, THREAD_FPR3(\thread)
|
|
|
|
+ sdc1 $f5, THREAD_FPR5(\thread)
|
|
|
|
+ sdc1 $f7, THREAD_FPR7(\thread)
|
|
|
|
+ sdc1 $f9, THREAD_FPR9(\thread)
|
|
|
|
+ sdc1 $f11, THREAD_FPR11(\thread)
|
|
|
|
+ sdc1 $f13, THREAD_FPR13(\thread)
|
|
|
|
+ sdc1 $f15, THREAD_FPR15(\thread)
|
|
|
|
+ sdc1 $f17, THREAD_FPR17(\thread)
|
|
|
|
+ sdc1 $f19, THREAD_FPR19(\thread)
|
|
|
|
+ sdc1 $f21, THREAD_FPR21(\thread)
|
|
|
|
+ sdc1 $f23, THREAD_FPR23(\thread)
|
|
|
|
+ sdc1 $f25, THREAD_FPR25(\thread)
|
|
|
|
+ sdc1 $f27, THREAD_FPR27(\thread)
|
|
|
|
+ sdc1 $f29, THREAD_FPR29(\thread)
|
|
|
|
+ sdc1 $f31, THREAD_FPR31(\thread)
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
@@ -118,22 +118,22 @@
|
|
.set push
|
|
.set push
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
lw \tmp, THREAD_FCR31(\thread)
|
|
lw \tmp, THREAD_FCR31(\thread)
|
|
- ldc1 $f0, THREAD_FPR0_LS64(\thread)
|
|
|
|
- ldc1 $f2, THREAD_FPR2_LS64(\thread)
|
|
|
|
- ldc1 $f4, THREAD_FPR4_LS64(\thread)
|
|
|
|
- ldc1 $f6, THREAD_FPR6_LS64(\thread)
|
|
|
|
- ldc1 $f8, THREAD_FPR8_LS64(\thread)
|
|
|
|
- ldc1 $f10, THREAD_FPR10_LS64(\thread)
|
|
|
|
- ldc1 $f12, THREAD_FPR12_LS64(\thread)
|
|
|
|
- ldc1 $f14, THREAD_FPR14_LS64(\thread)
|
|
|
|
- ldc1 $f16, THREAD_FPR16_LS64(\thread)
|
|
|
|
- ldc1 $f18, THREAD_FPR18_LS64(\thread)
|
|
|
|
- ldc1 $f20, THREAD_FPR20_LS64(\thread)
|
|
|
|
- ldc1 $f22, THREAD_FPR22_LS64(\thread)
|
|
|
|
- ldc1 $f24, THREAD_FPR24_LS64(\thread)
|
|
|
|
- ldc1 $f26, THREAD_FPR26_LS64(\thread)
|
|
|
|
- ldc1 $f28, THREAD_FPR28_LS64(\thread)
|
|
|
|
- ldc1 $f30, THREAD_FPR30_LS64(\thread)
|
|
|
|
|
|
+ ldc1 $f0, THREAD_FPR0(\thread)
|
|
|
|
+ ldc1 $f2, THREAD_FPR2(\thread)
|
|
|
|
+ ldc1 $f4, THREAD_FPR4(\thread)
|
|
|
|
+ ldc1 $f6, THREAD_FPR6(\thread)
|
|
|
|
+ ldc1 $f8, THREAD_FPR8(\thread)
|
|
|
|
+ ldc1 $f10, THREAD_FPR10(\thread)
|
|
|
|
+ ldc1 $f12, THREAD_FPR12(\thread)
|
|
|
|
+ ldc1 $f14, THREAD_FPR14(\thread)
|
|
|
|
+ ldc1 $f16, THREAD_FPR16(\thread)
|
|
|
|
+ ldc1 $f18, THREAD_FPR18(\thread)
|
|
|
|
+ ldc1 $f20, THREAD_FPR20(\thread)
|
|
|
|
+ ldc1 $f22, THREAD_FPR22(\thread)
|
|
|
|
+ ldc1 $f24, THREAD_FPR24(\thread)
|
|
|
|
+ ldc1 $f26, THREAD_FPR26(\thread)
|
|
|
|
+ ldc1 $f28, THREAD_FPR28(\thread)
|
|
|
|
+ ldc1 $f30, THREAD_FPR30(\thread)
|
|
ctc1 \tmp, fcr31
|
|
ctc1 \tmp, fcr31
|
|
.endm
|
|
.endm
|
|
|
|
|
|
@@ -141,22 +141,22 @@
|
|
.set push
|
|
.set push
|
|
.set mips64r2
|
|
.set mips64r2
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
- ldc1 $f1, THREAD_FPR1_LS64(\thread)
|
|
|
|
- ldc1 $f3, THREAD_FPR3_LS64(\thread)
|
|
|
|
- ldc1 $f5, THREAD_FPR5_LS64(\thread)
|
|
|
|
- ldc1 $f7, THREAD_FPR7_LS64(\thread)
|
|
|
|
- ldc1 $f9, THREAD_FPR9_LS64(\thread)
|
|
|
|
- ldc1 $f11, THREAD_FPR11_LS64(\thread)
|
|
|
|
- ldc1 $f13, THREAD_FPR13_LS64(\thread)
|
|
|
|
- ldc1 $f15, THREAD_FPR15_LS64(\thread)
|
|
|
|
- ldc1 $f17, THREAD_FPR17_LS64(\thread)
|
|
|
|
- ldc1 $f19, THREAD_FPR19_LS64(\thread)
|
|
|
|
- ldc1 $f21, THREAD_FPR21_LS64(\thread)
|
|
|
|
- ldc1 $f23, THREAD_FPR23_LS64(\thread)
|
|
|
|
- ldc1 $f25, THREAD_FPR25_LS64(\thread)
|
|
|
|
- ldc1 $f27, THREAD_FPR27_LS64(\thread)
|
|
|
|
- ldc1 $f29, THREAD_FPR29_LS64(\thread)
|
|
|
|
- ldc1 $f31, THREAD_FPR31_LS64(\thread)
|
|
|
|
|
|
+ ldc1 $f1, THREAD_FPR1(\thread)
|
|
|
|
+ ldc1 $f3, THREAD_FPR3(\thread)
|
|
|
|
+ ldc1 $f5, THREAD_FPR5(\thread)
|
|
|
|
+ ldc1 $f7, THREAD_FPR7(\thread)
|
|
|
|
+ ldc1 $f9, THREAD_FPR9(\thread)
|
|
|
|
+ ldc1 $f11, THREAD_FPR11(\thread)
|
|
|
|
+ ldc1 $f13, THREAD_FPR13(\thread)
|
|
|
|
+ ldc1 $f15, THREAD_FPR15(\thread)
|
|
|
|
+ ldc1 $f17, THREAD_FPR17(\thread)
|
|
|
|
+ ldc1 $f19, THREAD_FPR19(\thread)
|
|
|
|
+ ldc1 $f21, THREAD_FPR21(\thread)
|
|
|
|
+ ldc1 $f23, THREAD_FPR23(\thread)
|
|
|
|
+ ldc1 $f25, THREAD_FPR25(\thread)
|
|
|
|
+ ldc1 $f27, THREAD_FPR27(\thread)
|
|
|
|
+ ldc1 $f29, THREAD_FPR29(\thread)
|
|
|
|
+ ldc1 $f31, THREAD_FPR31(\thread)
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
@@ -211,6 +211,22 @@
|
|
.endm
|
|
.endm
|
|
|
|
|
|
#ifdef TOOLCHAIN_SUPPORTS_MSA
|
|
#ifdef TOOLCHAIN_SUPPORTS_MSA
|
|
|
|
+ .macro _cfcmsa rd, cs
|
|
|
|
+ .set push
|
|
|
|
+ .set mips32r2
|
|
|
|
+ .set msa
|
|
|
|
+ cfcmsa \rd, $\cs
|
|
|
|
+ .set pop
|
|
|
|
+ .endm
|
|
|
|
+
|
|
|
|
+ .macro _ctcmsa cd, rs
|
|
|
|
+ .set push
|
|
|
|
+ .set mips32r2
|
|
|
|
+ .set msa
|
|
|
|
+ ctcmsa $\cd, \rs
|
|
|
|
+ .set pop
|
|
|
|
+ .endm
|
|
|
|
+
|
|
.macro ld_d wd, off, base
|
|
.macro ld_d wd, off, base
|
|
.set push
|
|
.set push
|
|
.set mips32r2
|
|
.set mips32r2
|
|
@@ -227,35 +243,35 @@
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro copy_u_w rd, ws, n
|
|
|
|
|
|
+ .macro copy_u_w ws, n
|
|
.set push
|
|
.set push
|
|
.set mips32r2
|
|
.set mips32r2
|
|
.set msa
|
|
.set msa
|
|
- copy_u.w \rd, $w\ws[\n]
|
|
|
|
|
|
+ copy_u.w $1, $w\ws[\n]
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro copy_u_d rd, ws, n
|
|
|
|
|
|
+ .macro copy_u_d ws, n
|
|
.set push
|
|
.set push
|
|
.set mips64r2
|
|
.set mips64r2
|
|
.set msa
|
|
.set msa
|
|
- copy_u.d \rd, $w\ws[\n]
|
|
|
|
|
|
+ copy_u.d $1, $w\ws[\n]
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro insert_w wd, n, rs
|
|
|
|
|
|
+ .macro insert_w wd, n
|
|
.set push
|
|
.set push
|
|
.set mips32r2
|
|
.set mips32r2
|
|
.set msa
|
|
.set msa
|
|
- insert.w $w\wd[\n], \rs
|
|
|
|
|
|
+ insert.w $w\wd[\n], $1
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro insert_d wd, n, rs
|
|
|
|
|
|
+ .macro insert_d wd, n
|
|
.set push
|
|
.set push
|
|
.set mips64r2
|
|
.set mips64r2
|
|
.set msa
|
|
.set msa
|
|
- insert.d $w\wd[\n], \rs
|
|
|
|
|
|
+ insert.d $w\wd[\n], $1
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
#else
|
|
#else
|
|
@@ -283,7 +299,7 @@
|
|
/*
|
|
/*
|
|
* Temporary until all toolchains in use include MSA support.
|
|
* Temporary until all toolchains in use include MSA support.
|
|
*/
|
|
*/
|
|
- .macro cfcmsa rd, cs
|
|
|
|
|
|
+ .macro _cfcmsa rd, cs
|
|
.set push
|
|
.set push
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
@@ -293,7 +309,7 @@
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro ctcmsa cd, rs
|
|
|
|
|
|
+ .macro _ctcmsa cd, rs
|
|
.set push
|
|
.set push
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
@@ -320,44 +336,36 @@
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro copy_u_w rd, ws, n
|
|
|
|
|
|
+ .macro copy_u_w ws, n
|
|
.set push
|
|
.set push
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
.insn
|
|
.insn
|
|
.word COPY_UW_MSA_INSN | (\n << 16) | (\ws << 11)
|
|
.word COPY_UW_MSA_INSN | (\n << 16) | (\ws << 11)
|
|
- /* move triggers an assembler bug... */
|
|
|
|
- or \rd, $1, zero
|
|
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro copy_u_d rd, ws, n
|
|
|
|
|
|
+ .macro copy_u_d ws, n
|
|
.set push
|
|
.set push
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
.insn
|
|
.insn
|
|
.word COPY_UD_MSA_INSN | (\n << 16) | (\ws << 11)
|
|
.word COPY_UD_MSA_INSN | (\n << 16) | (\ws << 11)
|
|
- /* move triggers an assembler bug... */
|
|
|
|
- or \rd, $1, zero
|
|
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro insert_w wd, n, rs
|
|
|
|
|
|
+ .macro insert_w wd, n
|
|
.set push
|
|
.set push
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
- /* move triggers an assembler bug... */
|
|
|
|
- or $1, \rs, zero
|
|
|
|
.word INSERT_W_MSA_INSN | (\n << 16) | (\wd << 6)
|
|
.word INSERT_W_MSA_INSN | (\n << 16) | (\wd << 6)
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|
|
- .macro insert_d wd, n, rs
|
|
|
|
|
|
+ .macro insert_d wd, n
|
|
.set push
|
|
.set push
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
- /* move triggers an assembler bug... */
|
|
|
|
- or $1, \rs, zero
|
|
|
|
.word INSERT_D_MSA_INSN | (\n << 16) | (\wd << 6)
|
|
.word INSERT_D_MSA_INSN | (\n << 16) | (\wd << 6)
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
@@ -399,7 +407,7 @@
|
|
.set push
|
|
.set push
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
- cfcmsa $1, MSA_CSR
|
|
|
|
|
|
+ _cfcmsa $1, MSA_CSR
|
|
sw $1, THREAD_MSA_CSR(\thread)
|
|
sw $1, THREAD_MSA_CSR(\thread)
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
@@ -409,7 +417,7 @@
|
|
.set noat
|
|
.set noat
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
lw $1, THREAD_MSA_CSR(\thread)
|
|
lw $1, THREAD_MSA_CSR(\thread)
|
|
- ctcmsa MSA_CSR, $1
|
|
|
|
|
|
+ _ctcmsa MSA_CSR, $1
|
|
.set pop
|
|
.set pop
|
|
ld_d 0, THREAD_FPR0, \thread
|
|
ld_d 0, THREAD_FPR0, \thread
|
|
ld_d 1, THREAD_FPR1, \thread
|
|
ld_d 1, THREAD_FPR1, \thread
|
|
@@ -452,9 +460,6 @@
|
|
insert_w \wd, 2
|
|
insert_w \wd, 2
|
|
insert_w \wd, 3
|
|
insert_w \wd, 3
|
|
#endif
|
|
#endif
|
|
- .if 31-\wd
|
|
|
|
- msa_init_upper (\wd+1)
|
|
|
|
- .endif
|
|
|
|
.endm
|
|
.endm
|
|
|
|
|
|
.macro msa_init_all_upper
|
|
.macro msa_init_all_upper
|
|
@@ -463,6 +468,37 @@
|
|
SET_HARDFLOAT
|
|
SET_HARDFLOAT
|
|
not $1, zero
|
|
not $1, zero
|
|
msa_init_upper 0
|
|
msa_init_upper 0
|
|
|
|
+ msa_init_upper 1
|
|
|
|
+ msa_init_upper 2
|
|
|
|
+ msa_init_upper 3
|
|
|
|
+ msa_init_upper 4
|
|
|
|
+ msa_init_upper 5
|
|
|
|
+ msa_init_upper 6
|
|
|
|
+ msa_init_upper 7
|
|
|
|
+ msa_init_upper 8
|
|
|
|
+ msa_init_upper 9
|
|
|
|
+ msa_init_upper 10
|
|
|
|
+ msa_init_upper 11
|
|
|
|
+ msa_init_upper 12
|
|
|
|
+ msa_init_upper 13
|
|
|
|
+ msa_init_upper 14
|
|
|
|
+ msa_init_upper 15
|
|
|
|
+ msa_init_upper 16
|
|
|
|
+ msa_init_upper 17
|
|
|
|
+ msa_init_upper 18
|
|
|
|
+ msa_init_upper 19
|
|
|
|
+ msa_init_upper 20
|
|
|
|
+ msa_init_upper 21
|
|
|
|
+ msa_init_upper 22
|
|
|
|
+ msa_init_upper 23
|
|
|
|
+ msa_init_upper 24
|
|
|
|
+ msa_init_upper 25
|
|
|
|
+ msa_init_upper 26
|
|
|
|
+ msa_init_upper 27
|
|
|
|
+ msa_init_upper 28
|
|
|
|
+ msa_init_upper 29
|
|
|
|
+ msa_init_upper 30
|
|
|
|
+ msa_init_upper 31
|
|
.set pop
|
|
.set pop
|
|
.endm
|
|
.endm
|
|
|
|
|