// SPDX-License-Identifier: GPL-2.0-only
/*
 * This kernel test validates architecture page table helpers and
 * accessors and helps in verifying their continued compliance with
 * expected generic MM semantics.
 *
 * Copyright (C) 2019 ARM Ltd.
 *
 * Author: Anshuman Khandual <anshuman.khandual@arm.com>
 */
#define pr_fmt(fmt) "debug_vm_pgtable: [%-25s]: " fmt, __func__

#include <linux/gfp.h>
#include <linux/highmem.h>
#include <linux/hugetlb.h>
#include <linux/kernel.h>
#include <linux/kconfig.h>
#include <linux/memblock.h>
#include <linux/mm.h>
#include <linux/mman.h>
#include <linux/mm_types.h>
#include <linux/module.h>
#include <linux/pfn_t.h>
#include <linux/printk.h>
#include <linux/pgtable.h>
#include <linux/random.h>
#include <linux/spinlock.h>
#include <linux/swap.h>
#include <linux/swapops.h>
#include <linux/start_kernel.h>
#include <linux/sched/mm.h>
#include <linux/io.h>
#include <linux/vmalloc.h>

#include <asm/cacheflush.h>
#include <asm/pgalloc.h>
#include <asm/tlbflush.h>

/*
 * Please refer to Documentation/mm/arch_pgtable_helpers.rst for the semantics
 * expectations that are being validated here. All future changes in here
 * or in the documentation need to be kept in sync.
 */
#define RANDOM_NZVALUE	GENMASK(7, 0)

struct pgtable_debug_args {
	struct mm_struct	*mm;
	struct vm_area_struct	*vma;

	pgd_t			*pgdp;
	p4d_t			*p4dp;
	pud_t			*pudp;
	pmd_t			*pmdp;
	pte_t			*ptep;

	p4d_t			*start_p4dp;
	pud_t			*start_pudp;
	pmd_t			*start_pmdp;
	pgtable_t		start_ptep;

	unsigned long		vaddr;
	pgprot_t		page_prot;
	pgprot_t		page_prot_none;

	bool			is_contiguous_page;
	unsigned long		pud_pfn;
	unsigned long		pmd_pfn;
	unsigned long		pte_pfn;

	unsigned long		fixed_alignment;
	unsigned long		fixed_pgd_pfn;
	unsigned long		fixed_p4d_pfn;
	unsigned long		fixed_pud_pfn;
	unsigned long		fixed_pmd_pfn;
	unsigned long		fixed_pte_pfn;
};
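
/*
 * Exercise the pure pte_t transformation helpers (young, dirty and
 * write bits) on an entry built from a fixed pfn and the protection
 * derived from @idx, checking that each setter is observable through
 * its accessor and is undone by its inverse.
 */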
static void __init pte_basic_tests(struct pgtable_debug_args *args, int idx)
{
	pgprot_t prot = vm_get_page_prot(idx);
	pte_t pte = pfn_pte(args->fixed_pte_pfn, prot);
	unsigned long val = idx, *ptr = &val;

	pr_debug("Validating PTE basic (%pGv)\n", ptr);

	/*
	 * This test needs to be executed after the given page table entry
	 * is created with pfn_pte() to make sure that vm_get_page_prot(idx)
	 * does not have the dirty bit enabled from the beginning. This is
	 * important for platforms like arm64 where (!PTE_RDONLY) indicates
	 * the dirty bit being set.
	 */
	WARN_ON(pte_dirty(pte_wrprotect(pte)));

	WARN_ON(!pte_same(pte, pte));
	WARN_ON(!pte_young(pte_mkyoung(pte_mkold(pte))));
	WARN_ON(!pte_dirty(pte_mkdirty(pte_mkclean(pte))));
	WARN_ON(!pte_write(pte_mkwrite(pte_wrprotect(pte), args->vma)));
	WARN_ON(pte_young(pte_mkold(pte_mkyoung(pte))));
	WARN_ON(pte_dirty(pte_mkclean(pte_mkdirty(pte))));
	WARN_ON(pte_write(pte_wrprotect(pte_mkwrite(pte, args->vma))));
	WARN_ON(pte_dirty(pte_wrprotect(pte_mkclean(pte))));
	WARN_ON(!pte_dirty(pte_wrprotect(pte_mkdirty(pte))));
}
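
/*
 * Exercise the pte helpers that operate on a live page table slot:
 * set_pte_at(), ptep_set_wrprotect(), ptep_get_and_clear(),
 * ptep_set_access_flags() and ptep_test_and_clear_young(). Unlike
 * the basic tests, this needs a mapped ptep and an allocated page.
 */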
static void __init pte_advanced_tests(struct pgtable_debug_args *args)
{
	struct page *page;
	pte_t pte;

	/*
	 * Architectures optimize set_pte_at() by avoiding a TLB flush.
	 * This requires that set_pte_at() is not used to update an
	 * existing pte entry. Clear the pte before we do set_pte_at().
	 *
	 * flush_dcache_page() is called after set_pte_at() to clear
	 * PG_arch_1 for the page on ARM64. The page flag isn't cleared
	 * when it's released and the page allocation check will fail when
	 * the page is allocated again. For architectures other than ARM64,
	 * the unexpected overhead of cache flushing is acceptable.
	 */
	page = (args->pte_pfn != ULONG_MAX) ? pfn_to_page(args->pte_pfn) : NULL;
	if (!page)
		return;

	pr_debug("Validating PTE advanced\n");
	if (WARN_ON(!args->ptep))
		return;

	pte = pfn_pte(args->pte_pfn, args->page_prot);
	set_pte_at(args->mm, args->vaddr, args->ptep, pte);
	flush_dcache_page(page);
	ptep_set_wrprotect(args->mm, args->vaddr, args->ptep);
	pte = ptep_get(args->ptep);
	WARN_ON(pte_write(pte));
	ptep_get_and_clear(args->mm, args->vaddr, args->ptep);
	pte = ptep_get(args->ptep);
	WARN_ON(!pte_none(pte));

	pte = pfn_pte(args->pte_pfn, args->page_prot);
	pte = pte_wrprotect(pte);
	pte = pte_mkclean(pte);
	set_pte_at(args->mm, args->vaddr, args->ptep, pte);
	flush_dcache_page(page);
	pte = pte_mkwrite(pte, args->vma);
	pte = pte_mkdirty(pte);
	ptep_set_access_flags(args->vma, args->vaddr, args->ptep, pte, 1);
	pte = ptep_get(args->ptep);
	WARN_ON(!(pte_write(pte) && pte_dirty(pte)));
	ptep_get_and_clear_full(args->mm, args->vaddr, args->ptep, 1);
	pte = ptep_get(args->ptep);
	WARN_ON(!pte_none(pte));

	pte = pfn_pte(args->pte_pfn, args->page_prot);
	pte = pte_mkyoung(pte);
	set_pte_at(args->mm, args->vaddr, args->ptep, pte);
	flush_dcache_page(page);
	ptep_test_and_clear_young(args->vma, args->vaddr, args->ptep);
	pte = ptep_get(args->ptep);
	WARN_ON(pte_young(pte));

	ptep_get_and_clear_full(args->mm, args->vaddr, args->ptep, 1);
}

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
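/*
 * PMD level analogue of pte_basic_tests(): validate the pmd_t
 * transformation helpers, and verify that a huge (leaf) entry
 * qualifies as pmd_bad() since it does not point to a lower level
 * page table.
 */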
static void __init pmd_basic_tests(struct pgtable_debug_args *args, int idx)
{
	pgprot_t prot = vm_get_page_prot(idx);
	unsigned long val = idx, *ptr = &val;
	pmd_t pmd;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD basic (%pGv)\n", ptr);
	pmd = pfn_pmd(args->fixed_pmd_pfn, prot);

	/*
	 * This test needs to be executed after the given page table entry
	 * is created with pfn_pmd() to make sure that vm_get_page_prot(idx)
	 * does not have the dirty bit enabled from the beginning. This is
	 * important for platforms like arm64 where (!PTE_RDONLY) indicates
	 * the dirty bit being set.
	 */
	WARN_ON(pmd_dirty(pmd_wrprotect(pmd)));

	WARN_ON(!pmd_same(pmd, pmd));
	WARN_ON(!pmd_young(pmd_mkyoung(pmd_mkold(pmd))));
	WARN_ON(!pmd_dirty(pmd_mkdirty(pmd_mkclean(pmd))));
	WARN_ON(!pmd_write(pmd_mkwrite(pmd_wrprotect(pmd), args->vma)));
	WARN_ON(pmd_young(pmd_mkold(pmd_mkyoung(pmd))));
	WARN_ON(pmd_dirty(pmd_mkclean(pmd_mkdirty(pmd))));
	WARN_ON(pmd_write(pmd_wrprotect(pmd_mkwrite(pmd, args->vma))));
	WARN_ON(pmd_dirty(pmd_wrprotect(pmd_mkclean(pmd))));
	WARN_ON(!pmd_dirty(pmd_wrprotect(pmd_mkdirty(pmd))));

	/*
	 * A huge page does not point to the next level page table
	 * entry. Hence this must qualify as pmd_bad().
	 */
	WARN_ON(!pmd_bad(pmd_mkhuge(pmd)));
}
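
/*
 * Exercise the pmd helpers against a live pmd slot, mirroring
 * pte_advanced_tests(): set_pmd_at(), pmdp_set_wrprotect(),
 * pmdp_huge_get_and_clear(), pmdp_set_access_flags() and
 * pmdp_test_and_clear_young(), with a page table deposited for
 * the duration of the test.
 */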
static void __init pmd_advanced_tests(struct pgtable_debug_args *args)
{
	struct page *page;
	pmd_t pmd;
	unsigned long vaddr = args->vaddr;

	if (!has_transparent_hugepage())
		return;

	page = (args->pmd_pfn != ULONG_MAX) ? pfn_to_page(args->pmd_pfn) : NULL;
	if (!page)
		return;

	/*
	 * flush_dcache_page() is called after set_pmd_at() to clear
	 * PG_arch_1 for the page on ARM64. The page flag isn't cleared
	 * when it's released and the page allocation check will fail when
	 * the page is allocated again. For architectures other than ARM64,
	 * the unexpected overhead of cache flushing is acceptable.
	 */
	pr_debug("Validating PMD advanced\n");
	/* Align the address wrt HPAGE_PMD_SIZE */
	vaddr &= HPAGE_PMD_MASK;

	pgtable_trans_huge_deposit(args->mm, args->pmdp, args->start_ptep);

	pmd = pfn_pmd(args->pmd_pfn, args->page_prot);
	set_pmd_at(args->mm, vaddr, args->pmdp, pmd);
	flush_dcache_page(page);
	pmdp_set_wrprotect(args->mm, vaddr, args->pmdp);
	pmd = pmdp_get(args->pmdp);
	WARN_ON(pmd_write(pmd));
	pmdp_huge_get_and_clear(args->mm, vaddr, args->pmdp);
	pmd = pmdp_get(args->pmdp);
	WARN_ON(!pmd_none(pmd));

	pmd = pfn_pmd(args->pmd_pfn, args->page_prot);
	pmd = pmd_wrprotect(pmd);
	pmd = pmd_mkclean(pmd);
	set_pmd_at(args->mm, vaddr, args->pmdp, pmd);
	flush_dcache_page(page);
	pmd = pmd_mkwrite(pmd, args->vma);
	pmd = pmd_mkdirty(pmd);
	pmdp_set_access_flags(args->vma, vaddr, args->pmdp, pmd, 1);
	pmd = pmdp_get(args->pmdp);
	WARN_ON(!(pmd_write(pmd) && pmd_dirty(pmd)));
	pmdp_huge_get_and_clear_full(args->vma, vaddr, args->pmdp, 1);
	pmd = pmdp_get(args->pmdp);
	WARN_ON(!pmd_none(pmd));

	pmd = pmd_mkhuge(pfn_pmd(args->pmd_pfn, args->page_prot));
	pmd = pmd_mkyoung(pmd);
	set_pmd_at(args->mm, vaddr, args->pmdp, pmd);
	flush_dcache_page(page);
	pmdp_test_and_clear_young(args->vma, vaddr, args->pmdp);
	pmd = pmdp_get(args->pmdp);
	WARN_ON(pmd_young(pmd));

	/* Clear the pte entries */
	pmdp_huge_get_and_clear(args->mm, vaddr, args->pmdp);
	pgtable_trans_huge_withdraw(args->mm, args->pmdp);
}

static void __init pmd_leaf_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD leaf\n");
	pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);

	/*
	 * PMD based THP is a leaf entry.
	 */
	pmd = pmd_mkhuge(pmd);
	WARN_ON(!pmd_leaf(pmd));
}

#ifdef CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD
static void __init pud_basic_tests(struct pgtable_debug_args *args, int idx)
{
	pgprot_t prot = vm_get_page_prot(idx);
	unsigned long val = idx, *ptr = &val;
	pud_t pud;

	if (!has_transparent_pud_hugepage())
		return;

	pr_debug("Validating PUD basic (%pGv)\n", ptr);
	pud = pfn_pud(args->fixed_pud_pfn, prot);

	/*
	 * This test needs to be executed after the given page table entry
	 * is created with pfn_pud() to make sure that vm_get_page_prot(idx)
	 * does not have the dirty bit enabled from the beginning. This is
	 * important for platforms like arm64 where (!PTE_RDONLY) indicates
	 * the dirty bit being set.
	 */
	WARN_ON(pud_dirty(pud_wrprotect(pud)));

	WARN_ON(!pud_same(pud, pud));
	WARN_ON(!pud_young(pud_mkyoung(pud_mkold(pud))));
	WARN_ON(!pud_dirty(pud_mkdirty(pud_mkclean(pud))));
	WARN_ON(pud_dirty(pud_mkclean(pud_mkdirty(pud))));
	WARN_ON(!pud_write(pud_mkwrite(pud_wrprotect(pud))));
	WARN_ON(pud_write(pud_wrprotect(pud_mkwrite(pud))));
	WARN_ON(pud_young(pud_mkold(pud_mkyoung(pud))));
	WARN_ON(pud_dirty(pud_wrprotect(pud_mkclean(pud))));
	WARN_ON(!pud_dirty(pud_wrprotect(pud_mkdirty(pud))));

	if (mm_pmd_folded(args->mm))
		return;

	/*
	 * A huge page does not point to the next level page table
	 * entry. Hence this must qualify as pud_bad().
	 */
	WARN_ON(!pud_bad(pud_mkhuge(pud)));
}
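
/*
 * PUD level analogue of pmd_advanced_tests(): exercise set_pud_at(),
 * pudp_set_wrprotect(), pudp_huge_get_and_clear(),
 * pudp_set_access_flags() and pudp_test_and_clear_young() against a
 * live pud slot.
 */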
static void __init pud_advanced_tests(struct pgtable_debug_args *args)
{
	struct page *page;
	unsigned long vaddr = args->vaddr;
	pud_t pud;

	if (!has_transparent_pud_hugepage())
		return;

	page = (args->pud_pfn != ULONG_MAX) ? pfn_to_page(args->pud_pfn) : NULL;
	if (!page)
		return;

	/*
	 * flush_dcache_page() is called after set_pud_at() to clear
	 * PG_arch_1 for the page on ARM64. The page flag isn't cleared
	 * when it's released and the page allocation check will fail when
	 * the page is allocated again. For architectures other than ARM64,
	 * the unexpected overhead of cache flushing is acceptable.
	 */
	pr_debug("Validating PUD advanced\n");
	/* Align the address wrt HPAGE_PUD_SIZE */
	vaddr &= HPAGE_PUD_MASK;

	pud = pfn_pud(args->pud_pfn, args->page_prot);
	/*
	 * Some architectures have debug checks to make sure
	 * huge pud mappings are only found with devmap entries.
	 * For now, test only with devmap entries.
	 */
	pud = pud_mkdevmap(pud);
	set_pud_at(args->mm, vaddr, args->pudp, pud);
	flush_dcache_page(page);
	pudp_set_wrprotect(args->mm, vaddr, args->pudp);
	pud = pudp_get(args->pudp);
	WARN_ON(pud_write(pud));

#ifndef __PAGETABLE_PMD_FOLDED
	pudp_huge_get_and_clear(args->mm, vaddr, args->pudp);
	pud = pudp_get(args->pudp);
	WARN_ON(!pud_none(pud));
#endif /* __PAGETABLE_PMD_FOLDED */
	pud = pfn_pud(args->pud_pfn, args->page_prot);
	pud = pud_mkdevmap(pud);
	pud = pud_wrprotect(pud);
	pud = pud_mkclean(pud);
	set_pud_at(args->mm, vaddr, args->pudp, pud);
	flush_dcache_page(page);
	pud = pud_mkwrite(pud);
	pud = pud_mkdirty(pud);
	pudp_set_access_flags(args->vma, vaddr, args->pudp, pud, 1);
	pud = pudp_get(args->pudp);
	WARN_ON(!(pud_write(pud) && pud_dirty(pud)));

#ifndef __PAGETABLE_PMD_FOLDED
	pudp_huge_get_and_clear_full(args->vma, vaddr, args->pudp, 1);
	pud = pudp_get(args->pudp);
	WARN_ON(!pud_none(pud));
#endif /* __PAGETABLE_PMD_FOLDED */

	pud = pfn_pud(args->pud_pfn, args->page_prot);
	pud = pud_mkdevmap(pud);
	pud = pud_mkyoung(pud);
	set_pud_at(args->mm, vaddr, args->pudp, pud);
	flush_dcache_page(page);
	pudp_test_and_clear_young(args->vma, vaddr, args->pudp);
	pud = pudp_get(args->pudp);
	WARN_ON(pud_young(pud));

	pudp_huge_get_and_clear(args->mm, vaddr, args->pudp);
}

static void __init pud_leaf_tests(struct pgtable_debug_args *args)
{
	pud_t pud;

	if (!has_transparent_pud_hugepage())
		return;

	pr_debug("Validating PUD leaf\n");
	pud = pfn_pud(args->fixed_pud_pfn, args->page_prot);

	/*
	 * PUD based THP is a leaf entry.
	 */
	pud = pud_mkhuge(pud);
	WARN_ON(!pud_leaf(pud));
}
#else /* !CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
static void __init pud_basic_tests(struct pgtable_debug_args *args, int idx) { }
static void __init pud_advanced_tests(struct pgtable_debug_args *args) { }
static void __init pud_leaf_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
#else /* !CONFIG_TRANSPARENT_HUGEPAGE */
static void __init pmd_basic_tests(struct pgtable_debug_args *args, int idx) { }
static void __init pud_basic_tests(struct pgtable_debug_args *args, int idx) { }
static void __init pmd_advanced_tests(struct pgtable_debug_args *args) { }
static void __init pud_advanced_tests(struct pgtable_debug_args *args) { }
static void __init pmd_leaf_tests(struct pgtable_debug_args *args) { }
static void __init pud_leaf_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */

#ifdef CONFIG_HAVE_ARCH_HUGE_VMAP
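/*
 * Validate the huge vmap interface: pxd_set_huge() must install a
 * huge leaf entry and pxd_clear_huge() must remove it again, leaving
 * the slot empty. These tests are skipped unless the architecture
 * supports huge vmap at that level and init_fixed_pfns() found a
 * suitably aligned physical range.
 */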
static void __init pmd_huge_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	if (!arch_vmap_pmd_supported(args->page_prot) ||
	    args->fixed_alignment < PMD_SIZE)
		return;

	pr_debug("Validating PMD huge\n");
	/*
	 * X86 defined pmd_set_huge() verifies that the given
	 * PMD is not a populated non-leaf entry.
	 */
	WRITE_ONCE(*args->pmdp, __pmd(0));
	WARN_ON(!pmd_set_huge(args->pmdp, __pfn_to_phys(args->fixed_pmd_pfn), args->page_prot));
	WARN_ON(!pmd_clear_huge(args->pmdp));
	pmd = pmdp_get(args->pmdp);
	WARN_ON(!pmd_none(pmd));
}

static void __init pud_huge_tests(struct pgtable_debug_args *args)
{
	pud_t pud;

	if (!arch_vmap_pud_supported(args->page_prot) ||
	    args->fixed_alignment < PUD_SIZE)
		return;

	pr_debug("Validating PUD huge\n");
	/*
	 * X86 defined pud_set_huge() verifies that the given
	 * PUD is not a populated non-leaf entry.
	 */
	WRITE_ONCE(*args->pudp, __pud(0));
	WARN_ON(!pud_set_huge(args->pudp, __pfn_to_phys(args->fixed_pud_pfn), args->page_prot));
	WARN_ON(!pud_clear_huge(args->pudp));
	pud = pudp_get(args->pudp);
	WARN_ON(!pud_none(pud));
}
#else /* !CONFIG_HAVE_ARCH_HUGE_VMAP */
static void __init pmd_huge_tests(struct pgtable_debug_args *args) { }
static void __init pud_huge_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_HAVE_ARCH_HUGE_VMAP */
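
/*
 * P4D and PGD level tests are limited to pxd_same() on a random
 * non-zero value, as these levels have no helpers that construct
 * entries from a protection value and a pfn.
 */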
static void __init p4d_basic_tests(struct pgtable_debug_args *args)
{
	p4d_t p4d;

	pr_debug("Validating P4D basic\n");
	memset(&p4d, RANDOM_NZVALUE, sizeof(p4d_t));
	WARN_ON(!p4d_same(p4d, p4d));
}

static void __init pgd_basic_tests(struct pgtable_debug_args *args)
{
	pgd_t pgd;

	pr_debug("Validating PGD basic\n");
	memset(&pgd, RANDOM_NZVALUE, sizeof(pgd_t));
	WARN_ON(!pgd_same(pgd, pgd));
}

#ifndef __PAGETABLE_PUD_FOLDED
static void __init pud_clear_tests(struct pgtable_debug_args *args)
{
	pud_t pud = pudp_get(args->pudp);

	if (mm_pmd_folded(args->mm))
		return;

	pr_debug("Validating PUD clear\n");
	WARN_ON(pud_none(pud));
	pud_clear(args->pudp);
	pud = pudp_get(args->pudp);
	WARN_ON(!pud_none(pud));
}

static void __init pud_populate_tests(struct pgtable_debug_args *args)
{
	pud_t pud;

	if (mm_pmd_folded(args->mm))
		return;

	pr_debug("Validating PUD populate\n");
	/*
	 * This entry points to the next level page table page.
	 * Hence this must not qualify as pud_bad().
	 */
	pud_populate(args->mm, args->pudp, args->start_pmdp);
	pud = pudp_get(args->pudp);
	WARN_ON(pud_bad(pud));
}
#else /* !__PAGETABLE_PUD_FOLDED */
static void __init pud_clear_tests(struct pgtable_debug_args *args) { }
static void __init pud_populate_tests(struct pgtable_debug_args *args) { }
#endif /* __PAGETABLE_PUD_FOLDED */

#ifndef __PAGETABLE_P4D_FOLDED
static void __init p4d_clear_tests(struct pgtable_debug_args *args)
{
	p4d_t p4d = p4dp_get(args->p4dp);

	if (mm_pud_folded(args->mm))
		return;

	pr_debug("Validating P4D clear\n");
	WARN_ON(p4d_none(p4d));
	p4d_clear(args->p4dp);
	p4d = p4dp_get(args->p4dp);
	WARN_ON(!p4d_none(p4d));
}

static void __init p4d_populate_tests(struct pgtable_debug_args *args)
{
	p4d_t p4d;

	if (mm_pud_folded(args->mm))
		return;

	pr_debug("Validating P4D populate\n");
	/*
	 * This entry points to the next level page table page.
	 * Hence this must not qualify as p4d_bad().
	 */
	pud_clear(args->pudp);
	p4d_clear(args->p4dp);
	p4d_populate(args->mm, args->p4dp, args->start_pudp);
	p4d = p4dp_get(args->p4dp);
	WARN_ON(p4d_bad(p4d));
}

static void __init pgd_clear_tests(struct pgtable_debug_args *args)
{
	pgd_t pgd = pgdp_get(args->pgdp);

	if (mm_p4d_folded(args->mm))
		return;

	pr_debug("Validating PGD clear\n");
	WARN_ON(pgd_none(pgd));
	pgd_clear(args->pgdp);
	pgd = pgdp_get(args->pgdp);
	WARN_ON(!pgd_none(pgd));
}

static void __init pgd_populate_tests(struct pgtable_debug_args *args)
{
	pgd_t pgd;

	if (mm_p4d_folded(args->mm))
		return;

	pr_debug("Validating PGD populate\n");
	/*
	 * This entry points to the next level page table page.
	 * Hence this must not qualify as pgd_bad().
	 */
	p4d_clear(args->p4dp);
	pgd_clear(args->pgdp);
	pgd_populate(args->mm, args->pgdp, args->start_p4dp);
	pgd = pgdp_get(args->pgdp);
	WARN_ON(pgd_bad(pgd));
}
#else /* !__PAGETABLE_P4D_FOLDED */
static void __init p4d_clear_tests(struct pgtable_debug_args *args) { }
static void __init pgd_clear_tests(struct pgtable_debug_args *args) { }
static void __init p4d_populate_tests(struct pgtable_debug_args *args) { }
static void __init pgd_populate_tests(struct pgtable_debug_args *args) { }
#endif /* __PAGETABLE_P4D_FOLDED */
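
/*
 * Verify that ptep_clear() wipes a previously installed pte and
 * leaves a pte_none() slot behind.
 */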
static void __init pte_clear_tests(struct pgtable_debug_args *args)
{
	struct page *page;
	pte_t pte = pfn_pte(args->pte_pfn, args->page_prot);

	page = (args->pte_pfn != ULONG_MAX) ? pfn_to_page(args->pte_pfn) : NULL;
	if (!page)
		return;

	/*
	 * flush_dcache_page() is called after set_pte_at() to clear
	 * PG_arch_1 for the page on ARM64. The page flag isn't cleared
	 * when it's released and the page allocation check will fail when
	 * the page is allocated again. For architectures other than ARM64,
	 * the unexpected overhead of cache flushing is acceptable.
	 */
	pr_debug("Validating PTE clear\n");
	if (WARN_ON(!args->ptep))
		return;

	set_pte_at(args->mm, args->vaddr, args->ptep, pte);
	WARN_ON(pte_none(pte));
	flush_dcache_page(page);
	barrier();
	ptep_clear(args->mm, args->vaddr, args->ptep);
	pte = ptep_get(args->ptep);
	WARN_ON(!pte_none(pte));
}

static void __init pmd_clear_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd = pmdp_get(args->pmdp);

	pr_debug("Validating PMD clear\n");
	WARN_ON(pmd_none(pmd));
	pmd_clear(args->pmdp);
	pmd = pmdp_get(args->pmdp);
	WARN_ON(!pmd_none(pmd));
}

static void __init pmd_populate_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	pr_debug("Validating PMD populate\n");
	/*
	 * This entry points to the next level page table page.
	 * Hence this must not qualify as pmd_bad().
	 */
	pmd_populate(args->mm, args->pmdp, args->start_ptep);
	pmd = pmdp_get(args->pmdp);
	WARN_ON(pmd_bad(pmd));
}

static void __init pte_special_tests(struct pgtable_debug_args *args)
{
	pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);

	if (!IS_ENABLED(CONFIG_ARCH_HAS_PTE_SPECIAL))
		return;

	pr_debug("Validating PTE special\n");
	WARN_ON(!pte_special(pte_mkspecial(pte)));
}

static void __init pte_protnone_tests(struct pgtable_debug_args *args)
{
	pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot_none);

	if (!IS_ENABLED(CONFIG_NUMA_BALANCING))
		return;

	pr_debug("Validating PTE protnone\n");
	WARN_ON(!pte_protnone(pte));
	WARN_ON(!pte_present(pte));
}

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
static void __init pmd_protnone_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	if (!IS_ENABLED(CONFIG_NUMA_BALANCING))
		return;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD protnone\n");
	pmd = pmd_mkhuge(pfn_pmd(args->fixed_pmd_pfn, args->page_prot_none));
	WARN_ON(!pmd_protnone(pmd));
	WARN_ON(!pmd_present(pmd));
}
#else /* !CONFIG_TRANSPARENT_HUGEPAGE */
static void __init pmd_protnone_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */

#ifdef CONFIG_ARCH_HAS_PTE_DEVMAP
static void __init pte_devmap_tests(struct pgtable_debug_args *args)
{
	pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);

	pr_debug("Validating PTE devmap\n");
	WARN_ON(!pte_devmap(pte_mkdevmap(pte)));
}

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
static void __init pmd_devmap_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD devmap\n");
	pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
	WARN_ON(!pmd_devmap(pmd_mkdevmap(pmd)));
}

#ifdef CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD
static void __init pud_devmap_tests(struct pgtable_debug_args *args)
{
	pud_t pud;

	if (!has_transparent_pud_hugepage())
		return;

	pr_debug("Validating PUD devmap\n");
	pud = pfn_pud(args->fixed_pud_pfn, args->page_prot);
	WARN_ON(!pud_devmap(pud_mkdevmap(pud)));
}
#else /* !CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
static void __init pud_devmap_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
#else /* CONFIG_TRANSPARENT_HUGEPAGE */
static void __init pmd_devmap_tests(struct pgtable_debug_args *args) { }
static void __init pud_devmap_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */
#else /* !CONFIG_ARCH_HAS_PTE_DEVMAP */
static void __init pte_devmap_tests(struct pgtable_debug_args *args) { }
static void __init pmd_devmap_tests(struct pgtable_debug_args *args) { }
static void __init pud_devmap_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_ARCH_HAS_PTE_DEVMAP */

static void __init pte_soft_dirty_tests(struct pgtable_debug_args *args)
{
	pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);

	if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY))
		return;

	pr_debug("Validating PTE soft dirty\n");
	WARN_ON(!pte_soft_dirty(pte_mksoft_dirty(pte)));
	WARN_ON(pte_soft_dirty(pte_clear_soft_dirty(pte)));
}

static void __init pte_swap_soft_dirty_tests(struct pgtable_debug_args *args)
{
	pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);

	if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY))
		return;

	pr_debug("Validating PTE swap soft dirty\n");
	WARN_ON(!pte_swp_soft_dirty(pte_swp_mksoft_dirty(pte)));
	WARN_ON(pte_swp_soft_dirty(pte_swp_clear_soft_dirty(pte)));
}

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
static void __init pmd_soft_dirty_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY))
		return;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD soft dirty\n");
	pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
	WARN_ON(!pmd_soft_dirty(pmd_mksoft_dirty(pmd)));
	WARN_ON(pmd_soft_dirty(pmd_clear_soft_dirty(pmd)));
}

static void __init pmd_swap_soft_dirty_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY) ||
	    !IS_ENABLED(CONFIG_ARCH_ENABLE_THP_MIGRATION))
		return;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD swap soft dirty\n");
	pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
	WARN_ON(!pmd_swp_soft_dirty(pmd_swp_mksoft_dirty(pmd)));
	WARN_ON(pmd_swp_soft_dirty(pmd_swp_clear_soft_dirty(pmd)));
}
#else /* !CONFIG_TRANSPARENT_HUGEPAGE */
static void __init pmd_soft_dirty_tests(struct pgtable_debug_args *args) { }
static void __init pmd_swap_soft_dirty_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */
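
/*
 * Build a maximal swap entry (all type and offset bits set), round
 * trip it through a pte, and verify that pte_swp_mkexclusive() and
 * pte_swp_clear_exclusive() toggle only the exclusive marker without
 * corrupting the encoded swap entry.
 */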
static void __init pte_swap_exclusive_tests(struct pgtable_debug_args *args)
{
	unsigned long max_swap_offset;
	swp_entry_t entry, entry2;
	pte_t pte;

	pr_debug("Validating PTE swap exclusive\n");

	/* See generic_max_swapfile_size(): probe the maximum offset */
	max_swap_offset = swp_offset(pte_to_swp_entry(swp_entry_to_pte(swp_entry(0, ~0UL))));

	/* Create a swp entry with all possible bits set */
	entry = swp_entry((1 << MAX_SWAPFILES_SHIFT) - 1, max_swap_offset);

	pte = swp_entry_to_pte(entry);
	WARN_ON(pte_swp_exclusive(pte));
	WARN_ON(!is_swap_pte(pte));
	entry2 = pte_to_swp_entry(pte);
	WARN_ON(memcmp(&entry, &entry2, sizeof(entry)));

	pte = pte_swp_mkexclusive(pte);
	WARN_ON(!pte_swp_exclusive(pte));
	WARN_ON(!is_swap_pte(pte));
	WARN_ON(pte_swp_soft_dirty(pte));
	entry2 = pte_to_swp_entry(pte);
	WARN_ON(memcmp(&entry, &entry2, sizeof(entry)));

	pte = pte_swp_clear_exclusive(pte);
	WARN_ON(pte_swp_exclusive(pte));
	WARN_ON(!is_swap_pte(pte));
	entry2 = pte_to_swp_entry(pte);
	WARN_ON(memcmp(&entry, &entry2, sizeof(entry)));
}

static void __init pte_swap_tests(struct pgtable_debug_args *args)
{
	swp_entry_t swp;
	pte_t pte;

	pr_debug("Validating PTE swap\n");
	pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);
	swp = __pte_to_swp_entry(pte);
	pte = __swp_entry_to_pte(swp);
	WARN_ON(args->fixed_pte_pfn != pte_pfn(pte));
}

#ifdef CONFIG_ARCH_ENABLE_THP_MIGRATION
static void __init pmd_swap_tests(struct pgtable_debug_args *args)
{
	swp_entry_t swp;
	pmd_t pmd;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD swap\n");
	pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
	swp = __pmd_to_swp_entry(pmd);
	pmd = __swp_entry_to_pmd(swp);
	WARN_ON(args->fixed_pmd_pfn != pmd_pfn(pmd));
}
#else /* !CONFIG_ARCH_ENABLE_THP_MIGRATION */
static void __init pmd_swap_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_ARCH_ENABLE_THP_MIGRATION */

static void __init swap_migration_tests(struct pgtable_debug_args *args)
{
	struct page *page;
	swp_entry_t swp;

	if (!IS_ENABLED(CONFIG_MIGRATION))
		return;

	/*
	 * swap_migration_tests() requires a dedicated page as it needs to
	 * be locked before creating a migration entry from it. Locking the
	 * page that actually maps kernel text ('start_kernel') can be really
	 * problematic. Let's use the allocated page explicitly for this
	 * purpose.
	 */
	page = (args->pte_pfn != ULONG_MAX) ? pfn_to_page(args->pte_pfn) : NULL;
	if (!page)
		return;

	pr_debug("Validating swap migration\n");

	/*
	 * make_[readable|writable]_migration_entry() expects the given page
	 * to be locked, otherwise it stumbles upon a BUG_ON().
	 */
	__SetPageLocked(page);
	swp = make_writable_migration_entry(page_to_pfn(page));
	WARN_ON(!is_migration_entry(swp));
	WARN_ON(!is_writable_migration_entry(swp));

	swp = make_readable_migration_entry(swp_offset(swp));
	WARN_ON(!is_migration_entry(swp));
	WARN_ON(is_writable_migration_entry(swp));

	swp = make_readable_migration_entry(page_to_pfn(page));
	WARN_ON(!is_migration_entry(swp));
	WARN_ON(is_writable_migration_entry(swp));
	__ClearPageLocked(page);
}

#ifdef CONFIG_HUGETLB_PAGE
static void __init hugetlb_basic_tests(struct pgtable_debug_args *args)
{
	struct page *page;
	pte_t pte;

	pr_debug("Validating HugeTLB basic\n");
	/*
	 * Accessing the page associated with the pfn is safe here,
	 * as it was previously derived from a real kernel symbol.
	 */
	page = pfn_to_page(args->fixed_pmd_pfn);
	pte = mk_huge_pte(page, args->page_prot);

	WARN_ON(!huge_pte_dirty(huge_pte_mkdirty(pte)));
	WARN_ON(!huge_pte_write(huge_pte_mkwrite(huge_pte_wrprotect(pte))));
	WARN_ON(huge_pte_write(huge_pte_wrprotect(huge_pte_mkwrite(pte))));

#ifdef CONFIG_ARCH_WANT_GENERAL_HUGETLB
	pte = pfn_pte(args->fixed_pmd_pfn, args->page_prot);

	WARN_ON(!pte_huge(arch_make_huge_pte(pte, PMD_SHIFT, VM_ACCESS_FLAGS)));
#endif /* CONFIG_ARCH_WANT_GENERAL_HUGETLB */
}
#else /* !CONFIG_HUGETLB_PAGE */
static void __init hugetlb_basic_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_HUGETLB_PAGE */

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
static void __init pmd_thp_tests(struct pgtable_debug_args *args)
{
	pmd_t pmd;

	if (!has_transparent_hugepage())
		return;

	pr_debug("Validating PMD based THP\n");
	/*
	 * pmd_trans_huge() and pmd_present() must return true after
	 * MMU invalidation with pmd_mkinvalid(). This behavior is an
	 * optimization for transparent huge page. pmd_trans_huge() must
	 * be true if pmd_page() returns a valid THP to avoid taking the
	 * pmd_lock when others walk over non transhuge pmds (i.e. there
	 * are no THP allocated). Especially when splitting a THP and
	 * removing the present bit from the pmd, pmd_trans_huge() still
	 * needs to return true. pmd_present() should be true whenever
	 * pmd_trans_huge() returns true.
	 */
	pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
	WARN_ON(!pmd_trans_huge(pmd_mkhuge(pmd)));

#ifndef __HAVE_ARCH_PMDP_INVALIDATE
	WARN_ON(!pmd_trans_huge(pmd_mkinvalid(pmd_mkhuge(pmd))));
	WARN_ON(!pmd_present(pmd_mkinvalid(pmd_mkhuge(pmd))));
	WARN_ON(!pmd_leaf(pmd_mkinvalid(pmd_mkhuge(pmd))));
#endif /* __HAVE_ARCH_PMDP_INVALIDATE */
}

#ifdef CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD
static void __init pud_thp_tests(struct pgtable_debug_args *args)
{
	pud_t pud;

	if (!has_transparent_pud_hugepage())
		return;

	pr_debug("Validating PUD based THP\n");
	pud = pfn_pud(args->fixed_pud_pfn, args->page_prot);
	WARN_ON(!pud_trans_huge(pud_mkhuge(pud)));

	/*
	 * pud_mkinvalid() has been dropped for now. Re-enable these
	 * tests when it comes back with a modified pud_present().
	 *
	 * WARN_ON(!pud_trans_huge(pud_mkinvalid(pud_mkhuge(pud))));
	 * WARN_ON(!pud_present(pud_mkinvalid(pud_mkhuge(pud))));
	 */
}
#else /* !CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
static void __init pud_thp_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
#else /* !CONFIG_TRANSPARENT_HUGEPAGE */
static void __init pmd_thp_tests(struct pgtable_debug_args *args) { }
static void __init pud_thp_tests(struct pgtable_debug_args *args) { }
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */
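
/*
 * Pick a random, page aligned address within the user virtual
 * address range. Nothing is ever mapped there; the tests only need
 * a plausible user address to key the page table walks.
 */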
static unsigned long __init get_random_vaddr(void)
{
	unsigned long random_vaddr, random_pages, total_user_pages;

	total_user_pages = (TASK_SIZE - FIRST_USER_ADDRESS) / PAGE_SIZE;

	random_pages = get_random_long() % total_user_pages;
	random_vaddr = FIRST_USER_ADDRESS + random_pages * PAGE_SIZE;

	return random_vaddr;
}

static void __init destroy_args(struct pgtable_debug_args *args)
{
	struct page *page = NULL;

	/* Free (huge) page */
	if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
	    has_transparent_pud_hugepage() &&
	    args->pud_pfn != ULONG_MAX) {
		if (args->is_contiguous_page) {
			free_contig_range(args->pud_pfn,
					  (1 << (HPAGE_PUD_SHIFT - PAGE_SHIFT)));
		} else {
			page = pfn_to_page(args->pud_pfn);
			__free_pages(page, HPAGE_PUD_SHIFT - PAGE_SHIFT);
		}

		args->pud_pfn = ULONG_MAX;
		args->pmd_pfn = ULONG_MAX;
		args->pte_pfn = ULONG_MAX;
	}

	if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
	    has_transparent_hugepage() &&
	    args->pmd_pfn != ULONG_MAX) {
		if (args->is_contiguous_page) {
			free_contig_range(args->pmd_pfn, (1 << HPAGE_PMD_ORDER));
		} else {
			page = pfn_to_page(args->pmd_pfn);
			__free_pages(page, HPAGE_PMD_ORDER);
		}

		args->pmd_pfn = ULONG_MAX;
		args->pte_pfn = ULONG_MAX;
	}

	if (args->pte_pfn != ULONG_MAX) {
		page = pfn_to_page(args->pte_pfn);
		__free_page(page);

		args->pte_pfn = ULONG_MAX;
	}

	/* Free page table entries */
	if (args->start_ptep) {
		pte_free(args->mm, args->start_ptep);
		mm_dec_nr_ptes(args->mm);
	}

	if (args->start_pmdp) {
		pmd_free(args->mm, args->start_pmdp);
		mm_dec_nr_pmds(args->mm);
	}

	if (args->start_pudp) {
		pud_free(args->mm, args->start_pudp);
		mm_dec_nr_puds(args->mm);
	}

	if (args->start_p4dp)
		p4d_free(args->mm, args->start_p4dp);

	/* Free vma and mm struct */
	if (args->vma)
		vm_area_free(args->vma);

	if (args->mm)
		mmdrop(args->mm);
}
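
/*
 * Allocate the backing page(s) for a huge mapping. Orders beyond
 * MAX_PAGE_ORDER can only be satisfied by alloc_contig_pages()
 * (with CONFIG_CONTIG_ALLOC); anything else comes from the buddy
 * allocator via alloc_pages().
 */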
static struct page * __init
debug_vm_pgtable_alloc_huge_page(struct pgtable_debug_args *args, int order)
{
	struct page *page = NULL;

#ifdef CONFIG_CONTIG_ALLOC
	if (order > MAX_PAGE_ORDER) {
		page = alloc_contig_pages((1 << order), GFP_KERNEL,
					  first_online_node, NULL);
		if (page) {
			args->is_contiguous_page = true;
			return page;
		}
	}
#endif

	if (order <= MAX_PAGE_ORDER)
		page = alloc_pages(GFP_KERNEL, order);

	return page;
}

/*
 * Check if a physical memory range described by <pstart, pend> contains
 * an area that is of size psize, and aligned to psize.
 *
 * Don't use address 0, an all-zeroes physical address might mask bugs, and
 * it's not used on x86.
 */
static void __init phys_align_check(phys_addr_t pstart,
				    phys_addr_t pend, unsigned long psize,
				    phys_addr_t *physp, unsigned long *alignp)
{
	phys_addr_t aligned_start, aligned_end;

	if (pstart == 0)
		pstart = PAGE_SIZE;

	aligned_start = ALIGN(pstart, psize);
	aligned_end = aligned_start + psize;

	if (aligned_end > aligned_start && aligned_end <= pend) {
		*alignp = psize;
		*physp = aligned_start;
	}
}

static void __init init_fixed_pfns(struct pgtable_debug_args *args)
{
	u64 idx;
	phys_addr_t phys, pstart, pend;

	/*
	 * Initialize the fixed pfns. To do this, try to find a
	 * valid physical range, preferably aligned to PUD_SIZE,
	 * but settling for aligned to PMD_SIZE as a fallback. If
	 * neither of those is found, use the physical address of
	 * the start_kernel symbol.
	 *
	 * The memory doesn't need to be allocated, it just needs to exist
	 * as usable memory. It won't be touched.
	 *
	 * The alignment is recorded, and can be checked to see if we
	 * can run the tests that require an actual valid physical
	 * address range on some architectures ({pmd,pud}_huge_test
	 * on x86).
	 */

	phys = __pa_symbol(&start_kernel);
	args->fixed_alignment = PAGE_SIZE;

	for_each_mem_range(idx, &pstart, &pend) {
		/* First check for a PUD-aligned area */
		phys_align_check(pstart, pend, PUD_SIZE, &phys,
				 &args->fixed_alignment);

		/* If a PUD-aligned area is found, we're done */
		if (args->fixed_alignment == PUD_SIZE)
			break;

		/*
		 * If no PMD-aligned area found yet, check for one,
		 * but continue the loop to look for a PUD-aligned area.
		 */
		if (args->fixed_alignment < PMD_SIZE)
			phys_align_check(pstart, pend, PMD_SIZE, &phys,
					 &args->fixed_alignment);
	}

	args->fixed_pgd_pfn = __phys_to_pfn(phys & PGDIR_MASK);
	args->fixed_p4d_pfn = __phys_to_pfn(phys & P4D_MASK);
	args->fixed_pud_pfn = __phys_to_pfn(phys & PUD_MASK);
	args->fixed_pmd_pfn = __phys_to_pfn(phys & PMD_MASK);
	args->fixed_pte_pfn = __phys_to_pfn(phys & PAGE_MASK);
	WARN_ON(!pfn_valid(args->fixed_pte_pfn));
}

static int __init init_args(struct pgtable_debug_args *args)
{
	struct page *page = NULL;
	int ret = 0;

	/*
	 * Initialize the debugging data.
	 *
	 * vm_get_page_prot(VM_NONE) or vm_get_page_prot(VM_SHARED|VM_NONE)
	 * will help create page table entries with PROT_NONE permission as
	 * required for pxx_protnone_tests().
	 */
	memset(args, 0, sizeof(*args));
	args->vaddr = get_random_vaddr();
	args->page_prot = vm_get_page_prot(VM_ACCESS_FLAGS);
	args->page_prot_none = vm_get_page_prot(VM_NONE);
	args->is_contiguous_page = false;
	args->pud_pfn = ULONG_MAX;
	args->pmd_pfn = ULONG_MAX;
	args->pte_pfn = ULONG_MAX;
	args->fixed_pgd_pfn = ULONG_MAX;
	args->fixed_p4d_pfn = ULONG_MAX;
	args->fixed_pud_pfn = ULONG_MAX;
	args->fixed_pmd_pfn = ULONG_MAX;
	args->fixed_pte_pfn = ULONG_MAX;

	/* Allocate mm and vma */
	args->mm = mm_alloc();
	if (!args->mm) {
		pr_err("Failed to allocate mm struct\n");
		ret = -ENOMEM;
		goto error;
	}

	args->vma = vm_area_alloc(args->mm);
	if (!args->vma) {
		pr_err("Failed to allocate vma\n");
		ret = -ENOMEM;
		goto error;
	}

	/*
	 * Allocate page table entries. They will be modified in the tests.
	 * Let's save the page table entries so that they can be released
	 * when the tests are completed.
	 */
	args->pgdp = pgd_offset(args->mm, args->vaddr);
	args->p4dp = p4d_alloc(args->mm, args->pgdp, args->vaddr);
	if (!args->p4dp) {
		pr_err("Failed to allocate p4d entries\n");
		ret = -ENOMEM;
		goto error;
	}
	args->start_p4dp = p4d_offset(args->pgdp, 0UL);
	WARN_ON(!args->start_p4dp);

	args->pudp = pud_alloc(args->mm, args->p4dp, args->vaddr);
	if (!args->pudp) {
		pr_err("Failed to allocate pud entries\n");
		ret = -ENOMEM;
		goto error;
	}
	args->start_pudp = pud_offset(args->p4dp, 0UL);
	WARN_ON(!args->start_pudp);

	args->pmdp = pmd_alloc(args->mm, args->pudp, args->vaddr);
	if (!args->pmdp) {
		pr_err("Failed to allocate pmd entries\n");
		ret = -ENOMEM;
		goto error;
	}
	args->start_pmdp = pmd_offset(args->pudp, 0UL);
	WARN_ON(!args->start_pmdp);

	if (pte_alloc(args->mm, args->pmdp)) {
		pr_err("Failed to allocate pte entries\n");
		ret = -ENOMEM;
		goto error;
	}
	args->start_ptep = pmd_pgtable(pmdp_get(args->pmdp));
	WARN_ON(!args->start_ptep);

	init_fixed_pfns(args);

	/*
	 * Allocate (huge) pages because some of the tests need to access
	 * the data in the pages. The corresponding tests will be skipped
	 * if we fail to allocate (huge) pages.
	 */
	if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
	    has_transparent_pud_hugepage()) {
		page = debug_vm_pgtable_alloc_huge_page(args,
				HPAGE_PUD_SHIFT - PAGE_SHIFT);
		if (page) {
			args->pud_pfn = page_to_pfn(page);
			args->pmd_pfn = args->pud_pfn;
			args->pte_pfn = args->pud_pfn;
			return 0;
		}
	}

	if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
	    has_transparent_hugepage()) {
		page = debug_vm_pgtable_alloc_huge_page(args, HPAGE_PMD_ORDER);
		if (page) {
			args->pmd_pfn = page_to_pfn(page);
			args->pte_pfn = args->pmd_pfn;
			return 0;
		}
	}

	page = alloc_page(GFP_KERNEL);
	if (page)
		args->pte_pfn = page_to_pfn(page);

	return 0;

error:
	destroy_args(args);
	return ret;
}
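
/*
 * Module entry point: set up the debug arguments, run the basic
 * transformation tests across every possible vm_flags combination,
 * run the remaining stateless tests, and finally run the page table
 * modifying tests under the appropriate page table locks before
 * tearing everything down.
 */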
static int __init debug_vm_pgtable(void)
{
	struct pgtable_debug_args args;
	spinlock_t *ptl = NULL;
	int idx, ret;

	pr_info("Validating architecture page table helpers\n");
	ret = init_args(&args);
	if (ret)
		return ret;

	/*
	 * Iterate over each possible vm_flags to make sure that all
	 * the basic page table transformation validations just hold
	 * true irrespective of the starting protection value for a
	 * given page table entry.
	 *
	 * Protection based vm_flags combinations are always linear
	 * and increasing i.e. starting from VM_NONE and going up to
	 * (VM_SHARED | READ | WRITE | EXEC).
	 */
#define VM_FLAGS_START	(VM_NONE)
#define VM_FLAGS_END	(VM_SHARED | VM_EXEC | VM_WRITE | VM_READ)

	for (idx = VM_FLAGS_START; idx <= VM_FLAGS_END; idx++) {
		pte_basic_tests(&args, idx);
		pmd_basic_tests(&args, idx);
		pud_basic_tests(&args, idx);
	}

	/*
	 * Both P4D and PGD level tests are very basic and do not
	 * involve creating page table entries from the protection
	 * value and the given pfn. Hence just keep them out from
	 * the above iteration for now to save some test execution
	 * time.
	 */
	p4d_basic_tests(&args);
	pgd_basic_tests(&args);

	pmd_leaf_tests(&args);
	pud_leaf_tests(&args);

	pte_special_tests(&args);
	pte_protnone_tests(&args);
	pmd_protnone_tests(&args);

	pte_devmap_tests(&args);
	pmd_devmap_tests(&args);
	pud_devmap_tests(&args);

	pte_soft_dirty_tests(&args);
	pmd_soft_dirty_tests(&args);
	pte_swap_soft_dirty_tests(&args);
	pmd_swap_soft_dirty_tests(&args);

	pte_swap_exclusive_tests(&args);

	pte_swap_tests(&args);
	pmd_swap_tests(&args);

	swap_migration_tests(&args);

	pmd_thp_tests(&args);
	pud_thp_tests(&args);

	hugetlb_basic_tests(&args);

	/*
	 * Page table modifying tests. They need to hold
	 * the proper page table lock.
	 */

	args.ptep = pte_offset_map_lock(args.mm, args.pmdp, args.vaddr, &ptl);
	pte_clear_tests(&args);
	pte_advanced_tests(&args);
	if (args.ptep)
		pte_unmap_unlock(args.ptep, ptl);

	ptl = pmd_lock(args.mm, args.pmdp);
	pmd_clear_tests(&args);
	pmd_advanced_tests(&args);
	pmd_huge_tests(&args);
	pmd_populate_tests(&args);
	spin_unlock(ptl);

	ptl = pud_lock(args.mm, args.pudp);
	pud_clear_tests(&args);
	pud_advanced_tests(&args);
	pud_huge_tests(&args);
	pud_populate_tests(&args);
	spin_unlock(ptl);

	spin_lock(&(args.mm->page_table_lock));
	p4d_clear_tests(&args);
	pgd_clear_tests(&args);
	p4d_populate_tests(&args);
	pgd_populate_tests(&args);
	spin_unlock(&(args.mm->page_table_lock));

	destroy_args(&args);
	return 0;
}
late_initcall(debug_vm_pgtable);