memset.S 2.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115
  1. /* SPDX-License-Identifier: GPL-2.0-only */
  2. /*
  3. * Copyright (C) 2013 Regents of the University of California
  4. */
  5. #include <linux/linkage.h>
  6. #include <asm/asm.h>
  7. /* void *memset(void *, int, size_t) */
  8. SYM_FUNC_START(__memset)
  9. move t0, a0 /* Preserve return value */
  10. /* Defer to byte-oriented fill for small sizes */
  11. sltiu a3, a2, 16
  12. bnez a3, 4f
  13. /*
  14. * Round to nearest XLEN-aligned address
  15. * greater than or equal to start address
  16. */
  17. addi a3, t0, SZREG-1
  18. andi a3, a3, ~(SZREG-1)
  19. beq a3, t0, 2f /* Skip if already aligned */
  20. /* Handle initial misalignment */
  21. sub a4, a3, t0
  22. 1:
  23. sb a1, 0(t0)
  24. addi t0, t0, 1
  25. bltu t0, a3, 1b
  26. sub a2, a2, a4 /* Update count */
  27. 2: /* Duff's device with 32 XLEN stores per iteration */
  28. /* Broadcast value into all bytes */
  29. andi a1, a1, 0xff
  30. slli a3, a1, 8
  31. or a1, a3, a1
  32. slli a3, a1, 16
  33. or a1, a3, a1
  34. #ifdef CONFIG_64BIT
  35. slli a3, a1, 32
  36. or a1, a3, a1
  37. #endif
  38. /* Calculate end address */
  39. andi a4, a2, ~(SZREG-1)
  40. add a3, t0, a4
  41. andi a4, a4, 31*SZREG /* Calculate remainder */
  42. beqz a4, 3f /* Shortcut if no remainder */
  43. neg a4, a4
  44. addi a4, a4, 32*SZREG /* Calculate initial offset */
  45. /* Adjust start address with offset */
  46. sub t0, t0, a4
  47. /* Jump into loop body */
  48. /* Assumes 32-bit instruction lengths */
  49. la a5, 3f
  50. #ifdef CONFIG_64BIT
  51. srli a4, a4, 1
  52. #endif
  53. add a5, a5, a4
  54. jr a5
  55. 3:
  56. REG_S a1, 0(t0)
  57. REG_S a1, SZREG(t0)
  58. REG_S a1, 2*SZREG(t0)
  59. REG_S a1, 3*SZREG(t0)
  60. REG_S a1, 4*SZREG(t0)
  61. REG_S a1, 5*SZREG(t0)
  62. REG_S a1, 6*SZREG(t0)
  63. REG_S a1, 7*SZREG(t0)
  64. REG_S a1, 8*SZREG(t0)
  65. REG_S a1, 9*SZREG(t0)
  66. REG_S a1, 10*SZREG(t0)
  67. REG_S a1, 11*SZREG(t0)
  68. REG_S a1, 12*SZREG(t0)
  69. REG_S a1, 13*SZREG(t0)
  70. REG_S a1, 14*SZREG(t0)
  71. REG_S a1, 15*SZREG(t0)
  72. REG_S a1, 16*SZREG(t0)
  73. REG_S a1, 17*SZREG(t0)
  74. REG_S a1, 18*SZREG(t0)
  75. REG_S a1, 19*SZREG(t0)
  76. REG_S a1, 20*SZREG(t0)
  77. REG_S a1, 21*SZREG(t0)
  78. REG_S a1, 22*SZREG(t0)
  79. REG_S a1, 23*SZREG(t0)
  80. REG_S a1, 24*SZREG(t0)
  81. REG_S a1, 25*SZREG(t0)
  82. REG_S a1, 26*SZREG(t0)
  83. REG_S a1, 27*SZREG(t0)
  84. REG_S a1, 28*SZREG(t0)
  85. REG_S a1, 29*SZREG(t0)
  86. REG_S a1, 30*SZREG(t0)
  87. REG_S a1, 31*SZREG(t0)
  88. addi t0, t0, 32*SZREG
  89. bltu t0, a3, 3b
  90. andi a2, a2, SZREG-1 /* Update count */
  91. 4:
  92. /* Handle trailing misalignment */
  93. beqz a2, 6f
  94. add a3, t0, a2
  95. 5:
  96. sb a1, 0(t0)
  97. addi t0, t0, 1
  98. bltu t0, a3, 5b
  99. 6:
  100. ret
  101. SYM_FUNC_END(__memset)
  102. SYM_FUNC_ALIAS_WEAK(memset, __memset)
  103. SYM_FUNC_ALIAS(__pi_memset, __memset)
  104. SYM_FUNC_ALIAS(__pi___memset, __memset)