init_caches.S 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288
  1. /*
  2. * init_caches.S
  3. *
  4. * Common Cache initialization
  5. */
  6. /*
  7. Copyright (c) 2007-2018, MIPS Tech, LLC and/or its affiliated group companies or licensors
  8. All rights reserved.
  9. Redistribution and use in source and binary forms, with or without modification, are
  10. permitted provided that the following conditions are met:
  11. 1. Redistributions of source code must retain the above copyright notice, this list of
  12. conditions and the following disclaimer.
  13. 2. Redistributions in binary form must reproduce the above copyright notice, this list
  14. of conditions and the following disclaimer in the documentation and/or other materials
  15. provided with the distribution.
  16. 3. Neither the name of the copyright holder nor the names of its contributors may be
  17. used to endorse or promote products derived from this software without specific prior
  18. written permission.
  19. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY
  20. EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  21. OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
  22. SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  23. SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT
  24. OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  25. HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
  26. OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  27. SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  28. */
  29. #include <mips/asm.h>
  30. #include <mips/regdef.h> // #defines for GPRs
  31. #include <mips/m32c0.h> // #defines for CP0 registers
  32. #include <core_config.h> // #defines for ILINE_SIZE, DLINE_SIZE and HCI
  33. #define LINE_SIZE $3
  34. #define BYTES_PER_LOOP $2
  35. #define SET_SIZE $4
  36. #define ASSOC $5
  37. #define CONFIG_1 $6
  38. #define END_ADDR $7
  39. #define TOTAL_BYTES $12
  40. #define CURRENT_ADDR $13
  41. #define TEMP1 $14
  42. #define TEMP2 $15
  43. #define LINES_PER_ITER 8 // number of cache instructions per loop
  44. /**************************************************************************************
  45. **************************************************************************************/
  46. LEAF(init_icache)
  47. // Can be skipped if Config7[HCI] set
  48. mfc0 TEMP1, C0_CONFIG, 7 // Read CP0 Config7
  49. ext TEMP1, TEMP1, HCI, 1 // extract HCI
  50. bne TEMP1, zero, done_icache
  51. // Determine how big the I$ is
  52. mfc0 CONFIG_1, C0_CONFIG1 // read C0_Config1
  53. // Isolate I$ Line Size
  54. ext LINE_SIZE, CONFIG_1, CFG1_ILSHIFT, 3 // extract IL
  55. // Skip ahead if No I$
  56. beq LINE_SIZE, zero, done_icache
  57. li TEMP1, 2
  58. sllv LINE_SIZE, TEMP1, LINE_SIZE // Now have true I$ line size in bytes
  59. ext SET_SIZE, CONFIG_1, CFG1_ISSHIFT, 3 // extract IS
  60. li TEMP1, 64
  61. sllv SET_SIZE, TEMP1, SET_SIZE // I$ Sets per way
  62. // Config1IA == I$ Assoc - 1
  63. ext ASSOC, CONFIG_1, CFG1_IASHIFT, 3 // extract IA
  64. addiu ASSOC, ASSOC, 1
  65. li TEMP1, (LINES_PER_ITER)
  66. mul SET_SIZE, SET_SIZE, ASSOC // Total number of sets
  67. mul TOTAL_BYTES, SET_SIZE, LINE_SIZE // Total number of bytes
  68. mul BYTES_PER_LOOP, LINE_SIZE, TEMP1 // Total bytes per loop
  69. // Set the starting address at the beginning of kgeg0 (0x80000000) which will corresponds to
  70. // way 0 index 0 of the cache and position so starting address is in the
  71. // middle of the first bytes per loop because the code will use + and - offsets
  72. li CURRENT_ADDR, 0x0000000080000000
  73. srl TEMP1, BYTES_PER_LOOP, 1
  74. addu CURRENT_ADDR, TEMP1, CURRENT_ADDR
  75. addu END_ADDR, CURRENT_ADDR, TOTAL_BYTES // make ending address
  76. subu END_ADDR, END_ADDR, BYTES_PER_LOOP // -1
  77. // Clear TagLo/TagHi registers
  78. mtc0 zero, C0_TAGLO // write C0_ITagLo
  79. mtc0 zero, C0_TAGHI // Note: not all implementations will have a tag Hi but writes will be ignored if not present
  80. ehb
  81. // due to offset field restrictions code assumes line size will not be more that 128 bytes for a r5 or less core
  82. // or not more than 64 bytes for a r6 and greater core
  83. next_icache_tag:
  84. // Index Store Tag Cache Op
  85. // Will invalidate the tag entry, clear the lock bit, and clear the LRF bit
  86. cache 0x8, (ILINE_SIZE*-2)(CURRENT_ADDR)
  87. cache 0x8, (ILINE_SIZE*-1)(CURRENT_ADDR)
  88. cache 0x8, (ILINE_SIZE*0)(CURRENT_ADDR)
  89. cache 0x8, (ILINE_SIZE*1)(CURRENT_ADDR)
  90. cache 0x8, (ILINE_SIZE*-4)(CURRENT_ADDR)
  91. cache 0x8, (ILINE_SIZE*-3)(CURRENT_ADDR)
  92. cache 0x8, (ILINE_SIZE*2)(CURRENT_ADDR)
  93. cache 0x8, (ILINE_SIZE*3)(CURRENT_ADDR)
  94. addu CURRENT_ADDR, BYTES_PER_LOOP // Get next starting line address
  95. bge END_ADDR, CURRENT_ADDR, next_icache_tag // Done yet?
  96. done_icache:
  97. jalr zero, ra
  98. END(init_icache)
  99. /**************************************************************************************
  100. * init_dcache invalidates all data cache entries
  101. **************************************************************************************/
  102. LEAF(init_dcache)
  103. // Can be skipped if Config7[HCI] set
  104. mfc0 TEMP1, C0_CONFIG, 7 // Read CP0 Config7
  105. ext TEMP1, TEMP1, HCI, 1 // extract HCI
  106. bne TEMP1, zero, done_dcache
  107. mfc0 CONFIG_1, C0_CONFIG1 // read C0_Config1
  108. // Isolate D$ Line Size
  109. ext LINE_SIZE, CONFIG_1, CFG1_DLSHIFT, 3 // extract DL
  110. // Skip ahead if No D$
  111. beq LINE_SIZE, zero, done_dcache
  112. li TEMP1, 2
  113. sllv LINE_SIZE, TEMP1, LINE_SIZE // Now have true D$ line size in bytes
  114. ext SET_SIZE, CONFIG_1, CFG1_DSSHIFT, 3 // extract DS
  115. li TEMP1, 64
  116. sllv SET_SIZE, TEMP1, SET_SIZE // D$ Sets per way
  117. // Config1DA == D$ Assoc - 1
  118. ext ASSOC, CONFIG_1, CFG1_DASHIFT, 3 // extract DA
  119. addiu ASSOC, 1
  120. li TEMP1, (LINES_PER_ITER)
  121. mul SET_SIZE, SET_SIZE, ASSOC // Total number of sets
  122. mul TOTAL_BYTES, SET_SIZE, LINE_SIZE // Total number of bytes
  123. mul BYTES_PER_LOOP, LINE_SIZE, TEMP1 // Total bytes per loop
  124. // Set the starting address at the beginning of kgeg0 (0x80000000) which will corresponds to
  125. // way 0 index 0 of the cache and position so starting address is in the
  126. // middle of the first bytes per loop because the code will use + and - offsets
  127. lui CURRENT_ADDR, 0x8000
  128. srl TEMP1, BYTES_PER_LOOP, 1
  129. addu CURRENT_ADDR, TEMP1, CURRENT_ADDR
  130. addu END_ADDR, CURRENT_ADDR, TOTAL_BYTES // make ending address
  131. subu END_ADDR, END_ADDR, BYTES_PER_LOOP // -1
  132. // Clear TagLo/TagHi registers
  133. mtc0 zero, C0_TAGLO, 2 // write C0_DTagLo
  134. mtc0 zero, C0_TAGHI, 2 // Note: not all implementations will have a tag Hi but writes will be ignored if not present
  135. ehb
  136. // due to offset field restrictions code assumes line size will not be more that 128 bytes for a r5 or less core
  137. // or not more than 64 bytes for a r6 and greater core
  138. next_dcache_tag:
  139. // Index Store Tag Cache Op
  140. // Will invalidate the tag entry, clear the lock bit, and clear the LRF bit
  141. cache 0x9, (DLINE_SIZE*-2)(CURRENT_ADDR)
  142. cache 0x9, (DLINE_SIZE*-1)(CURRENT_ADDR)
  143. cache 0x9, (DLINE_SIZE*0)(CURRENT_ADDR)
  144. cache 0x9, (DLINE_SIZE*1)(CURRENT_ADDR)
  145. cache 0x9, (DLINE_SIZE*-4)(CURRENT_ADDR)
  146. cache 0x9, (DLINE_SIZE*-3)(CURRENT_ADDR)
  147. cache 0x9, (DLINE_SIZE*2)(CURRENT_ADDR)
  148. cache 0x9, (DLINE_SIZE*3)(CURRENT_ADDR)
  149. addu CURRENT_ADDR, BYTES_PER_LOOP // Get next starting line address
  150. bge END_ADDR, CURRENT_ADDR, next_dcache_tag // Done yet?
  151. done_dcache:
  152. jalr zero, ra
  153. END(init_dcache)
  154. LEAF(change_k0_cca)
  155. // NOTE! This code must be executed in KSEG1 (not KSGE0 uncached)
  156. // Set CCA for kseg0 to cacheable
  157. mfc0 TEMP1, C0_CONFIG // read C0_Config
  158. li TEMP2, 3 // CCA for all others
  159. beqz r11_is_cps, set_kseg0_cca
  160. li TEMP2, 5 // CCA for coherent cores (fall through)
  161. set_kseg0_cca:
  162. ins TEMP1, TEMP2, 0, 3 // insert K0
  163. mtc0 TEMP1, C0_CONFIG // write C0_Config
  164. jalr.hb zero, ra
  165. END(change_k0_cca)
  166. LEAF(flush_dcache)
  167. mfc0 CONFIG_1, C0_CONFIG1 // read C0_Config1
  168. // Isolate D$ Line Size
  169. ext LINE_SIZE, CONFIG_1, CFG1_DLSHIFT, 3 // extract DL
  170. // Skip ahead if No D$
  171. beq LINE_SIZE, zero, done_flush_dcache
  172. li TEMP1, 2
  173. sllv LINE_SIZE, TEMP1, LINE_SIZE // Now have true D$ line size in bytes
  174. ext SET_SIZE, CONFIG_1, CFG1_DSSHIFT, 3 // extract DS
  175. li TEMP1, 64
  176. sllv SET_SIZE, TEMP1, SET_SIZE // D$ Sets per way
  177. // Config1DA == D$ Assoc - 1
  178. ext ASSOC, CONFIG_1, CFG1_DASHIFT, 3 // extract DA
  179. addiu ASSOC, 1
  180. li TEMP1, (LINES_PER_ITER)
  181. mul SET_SIZE, SET_SIZE, ASSOC // Total number of sets
  182. mul TOTAL_BYTES, SET_SIZE, LINE_SIZE // Total number of bytes
  183. mul BYTES_PER_LOOP, LINE_SIZE, TEMP1 // Total bytes per loop
  184. lui CURRENT_ADDR, 0x8000 // Get a KSeg0 address for cacheops
  185. srl TEMP1, BYTES_PER_LOOP, 1
  186. addu CURRENT_ADDR, TEMP1, CURRENT_ADDR
  187. addu END_ADDR, CURRENT_ADDR, TOTAL_BYTES // make ending address
  188. subu END_ADDR, END_ADDR, BYTES_PER_LOOP // -1
  189. // Clear TagLo/TagHi registers
  190. mtc0 zero, C0_TAGLO, 2 // write C0_DTagLo
  191. mtc0 zero, C0_TAGHI, 2 // Note: not all implementations will have a tag Hi but writes will be ignored if not present
  192. ehb
  193. // due to offset field restrictions code assumes line size will not be more that 128 bytes for a r5 or less core
  194. // or not more than 64 bytes for a r6 and greater core
  195. fnext_dcache_tag:
  196. // Index writeback invalidate Cache Op
  197. // Will invalidate the tag entry, clear the lock bit, and clear the LRF bit
  198. cache 0x1, (DLINE_SIZE*-2)(CURRENT_ADDR)
  199. cache 0x1, (DLINE_SIZE*-1)(CURRENT_ADDR)
  200. cache 0x1, (DLINE_SIZE*0)(CURRENT_ADDR)
  201. cache 0x1, (DLINE_SIZE*1)(CURRENT_ADDR)
  202. cache 0x1, (DLINE_SIZE*-4)(CURRENT_ADDR)
  203. cache 0x1, (DLINE_SIZE*-3)(CURRENT_ADDR)
  204. cache 0x1, (DLINE_SIZE*2)(CURRENT_ADDR)
  205. cache 0x1, (DLINE_SIZE*3)(CURRENT_ADDR)
  206. addu CURRENT_ADDR, BYTES_PER_LOOP // Get next starting line address
  207. bge END_ADDR, CURRENT_ADDR, fnext_dcache_tag // Done yet?
  208. done_flush_dcache:
  209. sync
  210. jalr zero, ra
  211. END(flush_dcache)
  212. #undef LINE_SIZE
  213. #undef BYTES_PER_LOOP
  214. #undef SET_SIZE
  215. #undef ASSOC
  216. #undef CONFIG_1
  217. #undef END_ADDR
  218. #undef TOTAL_BYTES
  219. #undef CURRENT_ADDR
  220. #undef TEMP1
  221. #undef TEMP2