NGpage.S 3.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139
  1. /* SPDX-License-Identifier: GPL-2.0 */
  2. /* NGpage.S: Niagara optimized clear and copy page.
  3. *
  4. * Copyright (C) 2006 (davem@davemloft.net)
  5. */
  6. #include <asm/asi.h>
  7. #include <asm/page.h>
  8. .text /* everything below is emitted into the text section */
  9. .align 32 /* start NGcopy_user_page on a 32-byte boundary */
  10. /* This is heavily simplified from the sun4u variants
  11. * because Niagara does not have any D-cache aliasing issues
  12. * and also we don't need to use the FPU in order to implement
  13. * an optimal page copy/clear.
  14. */
  15. NGcopy_user_page: /* %o0=dest, %o1=src, %o2=vaddr. Copy PAGE_SIZE bytes from src to dest, 128 bytes per loop pass. vaddr is never read. On return %g3 and %g7 are overwritten and the %o0 and %o1 of the caller have each advanced by PAGE_SIZE. */
  16. save %sp, -192, %sp /* open a new register window with a 192-byte frame: the incoming %o0 and %o1 are now %i0 and %i1, and %o2-%o5 plus %l2-%l5 are free to use as copy buffers */
  17. rd %asi, %g3 /* keep the incoming %asi value in %g3 so it can be put back before returning */
  18. wr %g0, ASI_BLK_INIT_QUAD_LDD_P, %asi /* every ldda and stxa below goes through this ASI */
  19. set PAGE_SIZE, %g7 /* %g7 = bytes still to copy */
  20. prefetch [%i1 + 0x00], #one_read /* before the loop: prefetch source offsets 0x00 and 0x40, which the first pass reads */
  21. prefetch [%i1 + 0x40], #one_read
  22. 1: prefetch [%i1 + 0x80], #one_read /* loop top: prefetch offsets 0x80 and 0xc0, which the next pass will read */
  23. prefetch [%i1 + 0xc0], #one_read /* on the final pass these two prefetches address bytes just past the source page */
  24. ldda [%i1 + 0x00] %asi, %o2 /* each ldda fills an even and odd register pair with 16 bytes: %o2 and %o3 = source bytes 0x00-0x0f */
  25. ldda [%i1 + 0x10] %asi, %o4 /* %o4 and %o5 = source bytes 0x10-0x1f */
  26. ldda [%i1 + 0x20] %asi, %l2 /* %l2 and %l3 = source bytes 0x20-0x2f */
  27. ldda [%i1 + 0x30] %asi, %l4 /* %l4 and %l5 = source bytes 0x30-0x3f */
  28. stxa %o2, [%i0 + 0x00] %asi /* write the eight buffered registers as eight 8-byte stores to destination bytes 0x00-0x3f. NOTE(review): stores through a block-init ASI presumably have ordering rules within a cache line - keep the ascending order unless the CPU manual says otherwise */
  29. stxa %o3, [%i0 + 0x08] %asi
  30. stxa %o4, [%i0 + 0x10] %asi
  31. stxa %o5, [%i0 + 0x18] %asi
  32. stxa %l2, [%i0 + 0x20] %asi
  33. stxa %l3, [%i0 + 0x28] %asi
  34. stxa %l4, [%i0 + 0x30] %asi
  35. stxa %l5, [%i0 + 0x38] %asi
  36. ldda [%i1 + 0x40] %asi, %o2 /* second half of the chunk: reload the same eight registers with source bytes 0x40-0x7f */
  37. ldda [%i1 + 0x50] %asi, %o4
  38. ldda [%i1 + 0x60] %asi, %l2
  39. ldda [%i1 + 0x70] %asi, %l4
  40. stxa %o2, [%i0 + 0x40] %asi /* and store them to destination bytes 0x40-0x7f */
  41. stxa %o3, [%i0 + 0x48] %asi
  42. stxa %o4, [%i0 + 0x50] %asi
  43. stxa %o5, [%i0 + 0x58] %asi
  44. stxa %l2, [%i0 + 0x60] %asi
  45. stxa %l3, [%i0 + 0x68] %asi
  46. stxa %l4, [%i0 + 0x70] %asi
  47. stxa %l5, [%i0 + 0x78] %asi
  48. add %i1, 128, %i1 /* advance the source pointer by one chunk */
  49. subcc %g7, 128, %g7 /* bytes remaining -= 128, setting the condition codes tested by the branch */
  50. bne,pt %xcc, 1b /* loop until the remaining count reaches zero */
  51. add %i0, 128, %i0 /* branch delay slot: advance the destination pointer, executed on every pass including the last */
  52. wr %g3, 0x0, %asi /* put back the %asi value saved on entry */
  53. membar #Sync /* barrier before returning. NOTE(review): presumably required so the block-init stores are complete and visible - confirm against the Niagara documentation */
  54. ret /* return to the caller */
  55. restore /* delay slot of ret: pop the register window opened by save */
  56. .align 32 /* start the clear routine on a 32-byte boundary */
  57. .globl NGclear_page
  58. .globl NGclear_user_page
  59. NGclear_page: /* %o0=dest. Zero PAGE_SIZE bytes at dest, 256 bytes per loop pass. Leaf routine: no register window is opened. Overwrites %g3, %g7, %o0 and the condition codes. */
  60. NGclear_user_page: /* %o0=dest, %o1=vaddr. Same code as NGclear_page - both labels mark the same address and vaddr is never read. */
  61. rd %asi, %g3 /* keep the incoming %asi value in %g3 so it can be put back before returning */
  62. wr %g0, ASI_BLK_INIT_QUAD_LDD_P, %asi /* every stxa below goes through this ASI */
  63. set PAGE_SIZE, %g7 /* %g7 = bytes still to clear */
  64. 1: stxa %g0, [%o0 + 0x00] %asi /* loop top: 32 stores of %g0 (always zero), 8 bytes each, covering offsets 0x00-0xff. NOTE(review): stores through a block-init ASI presumably have ordering rules within a cache line - keep the ascending order unless the CPU manual says otherwise */
  65. stxa %g0, [%o0 + 0x08] %asi
  66. stxa %g0, [%o0 + 0x10] %asi
  67. stxa %g0, [%o0 + 0x18] %asi
  68. stxa %g0, [%o0 + 0x20] %asi
  69. stxa %g0, [%o0 + 0x28] %asi
  70. stxa %g0, [%o0 + 0x30] %asi
  71. stxa %g0, [%o0 + 0x38] %asi
  72. stxa %g0, [%o0 + 0x40] %asi
  73. stxa %g0, [%o0 + 0x48] %asi
  74. stxa %g0, [%o0 + 0x50] %asi
  75. stxa %g0, [%o0 + 0x58] %asi
  76. stxa %g0, [%o0 + 0x60] %asi
  77. stxa %g0, [%o0 + 0x68] %asi
  78. stxa %g0, [%o0 + 0x70] %asi
  79. stxa %g0, [%o0 + 0x78] %asi
  80. stxa %g0, [%o0 + 0x80] %asi /* second 128 bytes of the 256-byte chunk */
  81. stxa %g0, [%o0 + 0x88] %asi
  82. stxa %g0, [%o0 + 0x90] %asi
  83. stxa %g0, [%o0 + 0x98] %asi
  84. stxa %g0, [%o0 + 0xa0] %asi
  85. stxa %g0, [%o0 + 0xa8] %asi
  86. stxa %g0, [%o0 + 0xb0] %asi
  87. stxa %g0, [%o0 + 0xb8] %asi
  88. stxa %g0, [%o0 + 0xc0] %asi
  89. stxa %g0, [%o0 + 0xc8] %asi
  90. stxa %g0, [%o0 + 0xd0] %asi
  91. stxa %g0, [%o0 + 0xd8] %asi
  92. stxa %g0, [%o0 + 0xe0] %asi
  93. stxa %g0, [%o0 + 0xe8] %asi
  94. stxa %g0, [%o0 + 0xf0] %asi
  95. stxa %g0, [%o0 + 0xf8] %asi
  96. subcc %g7, 256, %g7 /* bytes remaining -= 256, setting the condition codes tested by the branch */
  97. bne,pt %xcc, 1b /* loop until the remaining count reaches zero */
  98. add %o0, 256, %o0 /* branch delay slot: advance the destination pointer, executed on every pass including the last */
  99. wr %g3, 0x0, %asi /* put back the %asi value saved on entry */
  100. membar #Sync /* barrier before returning. NOTE(review): presumably required so the block-init stores are complete and visible - confirm against the Niagara documentation */
  101. retl /* leaf return, no register window to pop */
  102. nop /* delay slot of retl */
  103. #define BRANCH_ALWAYS 0x10680000 /* SPARC V9 instruction word for ba,pt %xcc with an all-zero 19-bit displacement field */
  104. #define NOP 0x01000000 /* instruction word for nop, which is sethi 0 into %g0 */
  105. #define NG_DO_PATCH(OLD, NEW) /* overwrite the first two instruction words at OLD with a branch-always to NEW followed by a nop. Clobbers %g1, %g2 and %g3. */ \
  106. sethi %hi(NEW), %g1; /* %g1 = address of NEW, assembled from its %hi and %lo parts */ \
  107. or %g1, %lo(NEW), %g1; \
  108. sethi %hi(OLD), %g2; /* %g2 = address of OLD, the code being patched */ \
  109. or %g2, %lo(OLD), %g2; \
  110. sub %g1, %g2, %g1; /* %g1 = byte displacement from OLD to NEW */ \
  111. sethi %hi(BRANCH_ALWAYS), %g3; /* begin building the branch instruction word in %g3 */ \
  112. sll %g1, 11, %g1; /* shift left by 11, then 32-bit logical shift right by 13: this keeps bits 2-20 of the byte displacement ... */ \
  113. srl %g1, 11 + 2, %g1; /* ... leaving the displacement in instruction words truncated to the 19 bits the branch can hold */ \
  114. or %g3, %lo(BRANCH_ALWAYS), %g3; /* %g3 = complete BRANCH_ALWAYS template */ \
  115. or %g3, %g1, %g3; /* merge the 19-bit displacement into the template */ \
  116. stw %g3, [%g2]; /* first instruction word of OLD becomes the branch to NEW */ \
  117. sethi %hi(NOP), %g3; /* %g3 = NOP instruction word */ \
  118. or %g3, %lo(NOP), %g3; \
  119. stw %g3, [%g2 + 0x4]; /* second word of OLD, the delay slot of the new branch, becomes a nop */ \
  120. flush %g2; /* make instruction fetch see the rewritten code. NOTE(review): flush is only specified to cover the doubleword containing %g2, so this presumably relies on OLD being 8-byte aligned - confirm */
  121. .globl niagara_patch_pageops /* exported so code outside this file can call it */
  122. .type niagara_patch_pageops,#function
  123. niagara_patch_pageops: /* Takes no arguments. Rewrites the entry of copy_user_page, _clear_page and clear_user_page (all defined outside this file) so that each branches to its NG counterpart above. Leaf routine, clobbers %g1, %g2 and %g3. NOTE(review): presumably called once at boot when a Niagara CPU is detected - confirm with the caller. */
  124. NG_DO_PATCH(copy_user_page, NGcopy_user_page)
  125. NG_DO_PATCH(_clear_page, NGclear_page)
  126. NG_DO_PATCH(clear_user_page, NGclear_user_page)
  127. retl /* leaf return */
  128. nop /* delay slot of retl */
  129. .size niagara_patch_pageops,.-niagara_patch_pageops