string_64.S 2.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179
  1. /* SPDX-License-Identifier: GPL-2.0-or-later */
  2. /*
  3. *
  4. * Copyright (C) IBM Corporation, 2012
  5. *
  6. * Author: Anton Blanchard <anton@au.ibm.com>
  7. */
  8. #include <asm/ppc_asm.h>
  9. #include <asm/linkage.h>
  10. #include <asm/asm-offsets.h>
  11. #include <asm/export.h>
  12. /**
  13. * __arch_clear_user: - Zero a block of memory in user space, with less checking.
  14. * @to: Destination address, in user space.
  15. * @n: Number of bytes to zero.
  16. *
  17. * Zero a block of memory in user space. Caller must check
  18. * the specified block with access_ok() before calling this function.
  19. *
  20. * Returns number of bytes that could not be cleared.
  21. * On success, this will be zero.
  22. */
  /*
   * Fault-annotation helpers.
   *
   * Each macro drops a numeric local label (100, 200 or 300) at the current
   * location and hands that label, together with a fixup target, to EX_TABLE.
   * They are written as a prefix on the same line as a store to the
   * destination buffer (e.g. "err1; stb r0,0(r3)"), so the label marks that
   * store.
   *
   * NOTE(review): EX_TABLE is defined outside this file. Presumably it
   * records a (faulting instruction, fixup address) pair in the exception
   * table and emits nothing into the current section -- confirm against its
   * definition.
   */
  /* err1: pair the next instruction with .Ldo_err1 (restart address in r8). */
  23. .macro err1
  24. 100:
  25. EX_TABLE(100b,.Ldo_err1)
  26. .endm
  /* err2: pair the next instruction with .Ldo_err2 (restart from current r3). */
  27. .macro err2
  28. 200:
  29. EX_TABLE(200b,.Ldo_err2)
  30. .endm
  /* err3: pair the next instruction with .Ldo_err3 (give up, return r4). */
  31. .macro err3
  32. 300:
  33. EX_TABLE(300b,.Ldo_err3)
  34. .endm
  /*
   * Fixup targets named by the err1/err2/err3 macros. The three labels are
   * fall-through entry points into one sequence:
   *
   *   .Ldo_err1  r3 = r8, i.e. go back to the restart address the main
   *              routine saved in r8 before the err1-tagged stores.
   *   .Ldo_err2  retry byte by byte: store r0 (set to 0 by the main routine)
   *              at r3, advancing r3 and decrementing r4, for r4 iterations.
   *   .Ldo_err3  return r4 in r3, the count of bytes still not cleared.
   *
   * The byte store is itself tagged err3, so a fault inside the retry loop
   * leaves the loop with r4 holding the bytes not yet written. If the loop
   * runs to completion r4 has reached 0 and the fall-through returns 0.
   *
   * Expects on entry: r4 = bytes remaining counted from r3 (err2) or from
   * r8 (err1).
   */
  35. .Ldo_err1:
  36. mr r3,r8
  37. .Ldo_err2:
  /* ctr = bytes remaining; one loop iteration per byte. */
  38. mtctr r4
  39. 1:
  40. err3; stb r0,0(r3)
  41. addi r3,r3,1
  42. addi r4,r4,-1
  43. bdnz 1b
  44. .Ldo_err3:
  /* Return value: number of bytes that could not be cleared. */
  45. mr r3,r4
  46. blr
  /*
   * __arch_clear_user: store zeros over r4 bytes starting at r3.
   *
   * Register use, as read from the code below:
   *   r3   in: destination address, advanced as bytes are cleared;
   *        out: 0 on the normal exit (the fixup code returns the number of
   *        bytes left instead)
   *   r4   in: byte count; reduced as regions are cleared
   *   r0   constant zero, the value every store writes
   *   r8   restart address used by .Ldo_err1 for err1-tagged instructions
   *   r5, r6, r7, r9, r10  scratch
   *   cr7  low four bits of an alignment or length value, tested bit by bit
   *        (bit 0 = 8, bit 1 = 4, bit 2 = 2, bit 3 = 1)
   *   ctr  loop counter
   *
   * Paths: fewer than 32 bytes -> .Lshort_clear; 32..512 bytes after
   * alignment -> .Lmedium_clear; more than 512 -> .Llong_clear (dcbz).
   *
   * NOTE(review): _GLOBAL_TOC, LOAD_REG_ADDR and EXPORT_SYMBOL come from the
   * included headers; their expansions are not visible here.
   */
  47. _GLOBAL_TOC(__arch_clear_user)
  48. cmpdi r4,32
  /* r6 = -dest: its low bits are the distance to the next aligned boundary. */
  49. neg r6,r3
  50. li r0,0
  /* Fewer than 32 bytes in total: skip alignment, go straight to the tail. */
  51. blt .Lshort_clear
  /* Remember the start so an err1 fault below restarts from here. */
  52. mr r8,r3
  /* cr7 = low 4 bits of -dest; r6 = low 3 bits = bytes needed to reach 8-byte alignment. */
  53. mtocrf 0x01,r6
  54. clrldi r6,r6,(64-3)
  55. /* Get the destination 8 byte aligned */
  56. bf cr7*4+3,1f
  57. err1; stb r0,0(r3)
  58. addi r3,r3,1
  59. 1: bf cr7*4+2,2f
  60. err1; sth r0,0(r3)
  61. addi r3,r3,2
  62. 2: bf cr7*4+1,3f
  63. err1; stw r0,0(r3)
  64. addi r3,r3,4
  /* Account for the alignment bytes just written. */
  65. 3: sub r4,r4,r6
  /* Pick a strategy: cr0 holds the compare with 32, cr1 the compare with 512. */
  66. cmpdi r4,32
  67. cmpdi cr1,r4,512
  68. blt .Lshort_clear
  69. bgt cr1,.Llong_clear
  70. .Lmedium_clear:
  /* ctr = number of whole 32-byte chunks (callers arrive with r4 >= 32). */
  71. srdi r6,r4,5
  72. mtctr r6
  73. /* Do 32 byte chunks */
  /*
   * r3 and r4 are updated together every iteration, so an err2 fault can
   * resume byte-wise from the current r3 with r4 bytes outstanding.
   */
  74. 4:
  75. err2; std r0,0(r3)
  76. err2; std r0,8(r3)
  77. err2; std r0,16(r3)
  78. err2; std r0,24(r3)
  79. addi r3,r3,32
  80. addi r4,r4,-32
  81. bdnz 4b
  82. .Lshort_clear:
  83. /* up to 31 bytes to go */
  84. cmpdi r4,16
  85. blt 6f
  86. err2; std r0,0(r3)
  87. err2; std r0,8(r3)
  88. addi r3,r3,16
  89. addi r4,r4,-16
  90. /* Up to 15 bytes to go */
  /*
   * Save the tail start in r8 for err1 fixups, reduce r4 to its low 4 bits
   * and copy them into cr7; then store 8, 4, 2 and 1 bytes for each bit set.
   * r4 is not decremented here, so a fault restarts the whole tail from r8.
   */
  91. 6: mr r8,r3
  92. clrldi r4,r4,(64-4)
  93. mtocrf 0x01,r4
  94. bf cr7*4+0,7f
  95. err1; std r0,0(r3)
  96. addi r3,r3,8
  97. 7: bf cr7*4+1,8f
  98. err1; stw r0,0(r3)
  99. addi r3,r3,4
  100. 8: bf cr7*4+2,9f
  101. err1; sth r0,0(r3)
  102. addi r3,r3,2
  103. 9: bf cr7*4+3,10f
  104. err1; stb r0,0(r3)
  /* Everything cleared: return 0. */
  105. 10: li r3,0
  106. blr
  107. .Llong_clear:
  /* r5 = address of ppc64_caches, read below for the cache block geometry. */
  108. LOAD_REG_ADDR(r5, ppc64_caches)
  /*
   * cr7 still holds the low 4 bits of the negated original address (the
   * compares above only wrote cr0 and cr1). Bit 0 is the 8s bit: when set,
   * the now 8-byte-aligned pointer needs one more doubleword to reach
   * 16-byte alignment.
   */
  109. bf cr7*4+0,11f
  110. err2; std r0,0(r3)
  111. addi r3,r3,8
  112. addi r4,r4,-8
  113. /* Destination is 16 byte aligned, need to get it cache block aligned */
  /*
   * r7 and r9 are loaded from the DCACHEL1LOGBLOCKSIZE and DCACHEL1BLOCKSIZE
   * offsets; going by those names, r7 = log2(block size) and r9 = block size
   * in bytes -- offsets are defined outside this file.
   */
  114. 11: lwz r7,DCACHEL1LOGBLOCKSIZE(r5)
  115. lwz r9,DCACHEL1BLOCKSIZE(r5)
  116. /*
  117. * With worst case alignment the long clear loop takes a minimum
  118. * of 1 byte less than 2 cachelines.
  119. */
  /* Threshold actually tested: fall back to the 32-byte loop if r4 < 4 * r9. */
  120. sldi r10,r9,2
  121. cmpd r4,r10
  122. blt .Lmedium_clear
  /* r10 = block size - 1 (mask); r5 = bytes from r3 up to the next block boundary. */
  123. neg r6,r3
  124. addi r10,r9,-1
  125. and. r5,r6,r10
  /* Already block aligned: skip the lead-in stores. */
  126. beq 13f
  /*
   * Lead-in: clear r5 bytes, 16 at a time. r4 is only reduced after the loop,
   * so an err1 fault restarts from r8 with the count that was valid there.
   */
  127. srdi r6,r5,4
  128. mtctr r6
  129. mr r8,r3
  130. 12:
  131. err1; std r0,0(r3)
  132. err1; std r0,8(r3)
  133. addi r3,r3,16
  134. bdnz 12b
  135. sub r4,r4,r5
  /*
   * Main loop: ctr = r4 >> r7 whole cache blocks, each zeroed with one dcbz.
   * r8 marks the loop start and r4 is left untouched until the loop ends,
   * again so an err1 fault can restart from r8.
   */
  136. 13: srd r6,r4,r7
  137. mtctr r6
  138. mr r8,r3
  139. 14:
  140. err1; dcbz 0,r3
  141. add r3,r3,r9
  142. bdnz 14b
  /* r4 = bytes left over after the whole blocks (r4 mod block size). */
  143. and r4,r4,r10
  /* Finish the remainder with the medium or short path. */
  144. cmpdi r4,32
  145. blt .Lshort_clear
  146. b .Lmedium_clear
  147. EXPORT_SYMBOL(__arch_clear_user)