|
@@ -18,7 +18,7 @@
|
|
* The algorithm for the leading and trailing quadwords remains the same,
|
|
* The algorithm for the leading and trailing quadwords remains the same,
|
|
* however the loop has been unrolled to enable better memory throughput,
|
|
* however the loop has been unrolled to enable better memory throughput,
|
|
* and the code has been replicated for each of the entry points: __memset
|
|
* and the code has been replicated for each of the entry points: __memset
|
|
- * and __memsetw to permit better scheduling to eliminate the stalling
|
|
|
|
|
|
+ * and __memset16 to permit better scheduling to eliminate the stalling
|
|
* encountered during the mask replication.
|
|
* encountered during the mask replication.
|
|
* A future enhancement might be to put in a byte store loop for really
|
|
* A future enhancement might be to put in a byte store loop for really
|
|
* small (say < 32 bytes) memset()s. Whether or not that change would be
|
|
* small (say < 32 bytes) memset()s. Whether or not that change would be
|
|
@@ -34,7 +34,7 @@
|
|
.globl memset
|
|
.globl memset
|
|
.globl __memset
|
|
.globl __memset
|
|
.globl ___memset
|
|
.globl ___memset
|
|
- .globl __memsetw
|
|
|
|
|
|
+ .globl __memset16
|
|
.globl __constant_c_memset
|
|
.globl __constant_c_memset
|
|
|
|
|
|
.ent ___memset
|
|
.ent ___memset
|
|
@@ -415,9 +415,9 @@ end:
|
|
* to mask stalls. Note that entry point names also had to change
|
|
* to mask stalls. Note that entry point names also had to change
|
|
*/
|
|
*/
|
|
.align 5
|
|
.align 5
|
|
- .ent __memsetw
|
|
|
|
|
|
+ .ent __memset16
|
|
|
|
|
|
-__memsetw:
|
|
|
|
|
|
+__memset16:
|
|
.frame $30,0,$26,0
|
|
.frame $30,0,$26,0
|
|
.prologue 0
|
|
.prologue 0
|
|
|
|
|
|
@@ -596,8 +596,8 @@ end_w:
|
|
nop
|
|
nop
|
|
ret $31,($26),1 # L0 :
|
|
ret $31,($26),1 # L0 :
|
|
|
|
|
|
- .end __memsetw
|
|
|
|
- EXPORT_SYMBOL(__memsetw)
|
|
|
|
|
|
+ .end __memset16
|
|
|
|
+ EXPORT_SYMBOL(__memset16)
|
|
|
|
|
|
memset = ___memset
|
|
memset = ___memset
|
|
__memset = ___memset
|
|
__memset = ___memset
|