debug_vm_pgtable.c 40 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * This kernel test validates architecture page table helpers and
  4. * accessors and helps in verifying their continued compliance with
  5. * expected generic MM semantics.
  6. *
  7. * Copyright (C) 2019 ARM Ltd.
  8. *
  9. * Author: Anshuman Khandual <anshuman.khandual@arm.com>
  10. */
  11. #define pr_fmt(fmt) "debug_vm_pgtable: [%-25s]: " fmt, __func__
  12. #include <linux/gfp.h>
  13. #include <linux/highmem.h>
  14. #include <linux/hugetlb.h>
  15. #include <linux/kernel.h>
  16. #include <linux/kconfig.h>
  17. #include <linux/memblock.h>
  18. #include <linux/mm.h>
  19. #include <linux/mman.h>
  20. #include <linux/mm_types.h>
  21. #include <linux/module.h>
  22. #include <linux/pfn_t.h>
  23. #include <linux/printk.h>
  24. #include <linux/pgtable.h>
  25. #include <linux/random.h>
  26. #include <linux/spinlock.h>
  27. #include <linux/swap.h>
  28. #include <linux/swapops.h>
  29. #include <linux/start_kernel.h>
  30. #include <linux/sched/mm.h>
  31. #include <linux/io.h>
  32. #include <linux/vmalloc.h>
  33. #include <asm/cacheflush.h>
  34. #include <asm/pgalloc.h>
  35. #include <asm/tlbflush.h>
  36. /*
  37. * Please refer Documentation/mm/arch_pgtable_helpers.rst for the semantics
  38. * expectations that are being validated here. All future changes in here
  39. * or the documentation need to be in sync.
  40. */
  41. #define RANDOM_NZVALUE GENMASK(7, 0)
  42. struct pgtable_debug_args {
  43. struct mm_struct *mm;
  44. struct vm_area_struct *vma;
  45. pgd_t *pgdp;
  46. p4d_t *p4dp;
  47. pud_t *pudp;
  48. pmd_t *pmdp;
  49. pte_t *ptep;
  50. p4d_t *start_p4dp;
  51. pud_t *start_pudp;
  52. pmd_t *start_pmdp;
  53. pgtable_t start_ptep;
  54. unsigned long vaddr;
  55. pgprot_t page_prot;
  56. pgprot_t page_prot_none;
  57. bool is_contiguous_page;
  58. unsigned long pud_pfn;
  59. unsigned long pmd_pfn;
  60. unsigned long pte_pfn;
  61. unsigned long fixed_alignment;
  62. unsigned long fixed_pgd_pfn;
  63. unsigned long fixed_p4d_pfn;
  64. unsigned long fixed_pud_pfn;
  65. unsigned long fixed_pmd_pfn;
  66. unsigned long fixed_pte_pfn;
  67. };
  68. static void __init pte_basic_tests(struct pgtable_debug_args *args, int idx)
  69. {
  70. pgprot_t prot = vm_get_page_prot(idx);
  71. pte_t pte = pfn_pte(args->fixed_pte_pfn, prot);
  72. unsigned long val = idx, *ptr = &val;
  73. pr_debug("Validating PTE basic (%pGv)\n", ptr);
  74. /*
  75. * This test needs to be executed after the given page table entry
  76. * is created with pfn_pte() to make sure that vm_get_page_prot(idx)
  77. * does not have the dirty bit enabled from the beginning. This is
  78. * important for platforms like arm64 where (!PTE_RDONLY) indicate
  79. * dirty bit being set.
  80. */
  81. WARN_ON(pte_dirty(pte_wrprotect(pte)));
  82. WARN_ON(!pte_same(pte, pte));
  83. WARN_ON(!pte_young(pte_mkyoung(pte_mkold(pte))));
  84. WARN_ON(!pte_dirty(pte_mkdirty(pte_mkclean(pte))));
  85. WARN_ON(!pte_write(pte_mkwrite(pte_wrprotect(pte), args->vma)));
  86. WARN_ON(pte_young(pte_mkold(pte_mkyoung(pte))));
  87. WARN_ON(pte_dirty(pte_mkclean(pte_mkdirty(pte))));
  88. WARN_ON(pte_write(pte_wrprotect(pte_mkwrite(pte, args->vma))));
  89. WARN_ON(pte_dirty(pte_wrprotect(pte_mkclean(pte))));
  90. WARN_ON(!pte_dirty(pte_wrprotect(pte_mkdirty(pte))));
  91. }
  92. static void __init pte_advanced_tests(struct pgtable_debug_args *args)
  93. {
  94. struct page *page;
  95. pte_t pte;
  96. /*
  97. * Architectures optimize set_pte_at by avoiding TLB flush.
  98. * This requires set_pte_at to be not used to update an
  99. * existing pte entry. Clear pte before we do set_pte_at
  100. *
  101. * flush_dcache_page() is called after set_pte_at() to clear
  102. * PG_arch_1 for the page on ARM64. The page flag isn't cleared
  103. * when it's released and page allocation check will fail when
  104. * the page is allocated again. For architectures other than ARM64,
  105. * the unexpected overhead of cache flushing is acceptable.
  106. */
  107. page = (args->pte_pfn != ULONG_MAX) ? pfn_to_page(args->pte_pfn) : NULL;
  108. if (!page)
  109. return;
  110. pr_debug("Validating PTE advanced\n");
  111. if (WARN_ON(!args->ptep))
  112. return;
  113. pte = pfn_pte(args->pte_pfn, args->page_prot);
  114. set_pte_at(args->mm, args->vaddr, args->ptep, pte);
  115. flush_dcache_page(page);
  116. ptep_set_wrprotect(args->mm, args->vaddr, args->ptep);
  117. pte = ptep_get(args->ptep);
  118. WARN_ON(pte_write(pte));
  119. ptep_get_and_clear(args->mm, args->vaddr, args->ptep);
  120. pte = ptep_get(args->ptep);
  121. WARN_ON(!pte_none(pte));
  122. pte = pfn_pte(args->pte_pfn, args->page_prot);
  123. pte = pte_wrprotect(pte);
  124. pte = pte_mkclean(pte);
  125. set_pte_at(args->mm, args->vaddr, args->ptep, pte);
  126. flush_dcache_page(page);
  127. pte = pte_mkwrite(pte, args->vma);
  128. pte = pte_mkdirty(pte);
  129. ptep_set_access_flags(args->vma, args->vaddr, args->ptep, pte, 1);
  130. pte = ptep_get(args->ptep);
  131. WARN_ON(!(pte_write(pte) && pte_dirty(pte)));
  132. ptep_get_and_clear_full(args->mm, args->vaddr, args->ptep, 1);
  133. pte = ptep_get(args->ptep);
  134. WARN_ON(!pte_none(pte));
  135. pte = pfn_pte(args->pte_pfn, args->page_prot);
  136. pte = pte_mkyoung(pte);
  137. set_pte_at(args->mm, args->vaddr, args->ptep, pte);
  138. flush_dcache_page(page);
  139. ptep_test_and_clear_young(args->vma, args->vaddr, args->ptep);
  140. pte = ptep_get(args->ptep);
  141. WARN_ON(pte_young(pte));
  142. ptep_get_and_clear_full(args->mm, args->vaddr, args->ptep, 1);
  143. }
  144. #ifdef CONFIG_TRANSPARENT_HUGEPAGE
  145. static void __init pmd_basic_tests(struct pgtable_debug_args *args, int idx)
  146. {
  147. pgprot_t prot = vm_get_page_prot(idx);
  148. unsigned long val = idx, *ptr = &val;
  149. pmd_t pmd;
  150. if (!has_transparent_hugepage())
  151. return;
  152. pr_debug("Validating PMD basic (%pGv)\n", ptr);
  153. pmd = pfn_pmd(args->fixed_pmd_pfn, prot);
  154. /*
  155. * This test needs to be executed after the given page table entry
  156. * is created with pfn_pmd() to make sure that vm_get_page_prot(idx)
  157. * does not have the dirty bit enabled from the beginning. This is
  158. * important for platforms like arm64 where (!PTE_RDONLY) indicate
  159. * dirty bit being set.
  160. */
  161. WARN_ON(pmd_dirty(pmd_wrprotect(pmd)));
  162. WARN_ON(!pmd_same(pmd, pmd));
  163. WARN_ON(!pmd_young(pmd_mkyoung(pmd_mkold(pmd))));
  164. WARN_ON(!pmd_dirty(pmd_mkdirty(pmd_mkclean(pmd))));
  165. WARN_ON(!pmd_write(pmd_mkwrite(pmd_wrprotect(pmd), args->vma)));
  166. WARN_ON(pmd_young(pmd_mkold(pmd_mkyoung(pmd))));
  167. WARN_ON(pmd_dirty(pmd_mkclean(pmd_mkdirty(pmd))));
  168. WARN_ON(pmd_write(pmd_wrprotect(pmd_mkwrite(pmd, args->vma))));
  169. WARN_ON(pmd_dirty(pmd_wrprotect(pmd_mkclean(pmd))));
  170. WARN_ON(!pmd_dirty(pmd_wrprotect(pmd_mkdirty(pmd))));
  171. /*
  172. * A huge page does not point to next level page table
  173. * entry. Hence this must qualify as pmd_bad().
  174. */
  175. WARN_ON(!pmd_bad(pmd_mkhuge(pmd)));
  176. }
  177. static void __init pmd_advanced_tests(struct pgtable_debug_args *args)
  178. {
  179. struct page *page;
  180. pmd_t pmd;
  181. unsigned long vaddr = args->vaddr;
  182. if (!has_transparent_hugepage())
  183. return;
  184. page = (args->pmd_pfn != ULONG_MAX) ? pfn_to_page(args->pmd_pfn) : NULL;
  185. if (!page)
  186. return;
  187. /*
  188. * flush_dcache_page() is called after set_pmd_at() to clear
  189. * PG_arch_1 for the page on ARM64. The page flag isn't cleared
  190. * when it's released and page allocation check will fail when
  191. * the page is allocated again. For architectures other than ARM64,
  192. * the unexpected overhead of cache flushing is acceptable.
  193. */
  194. pr_debug("Validating PMD advanced\n");
  195. /* Align the address wrt HPAGE_PMD_SIZE */
  196. vaddr &= HPAGE_PMD_MASK;
  197. pgtable_trans_huge_deposit(args->mm, args->pmdp, args->start_ptep);
  198. pmd = pfn_pmd(args->pmd_pfn, args->page_prot);
  199. set_pmd_at(args->mm, vaddr, args->pmdp, pmd);
  200. flush_dcache_page(page);
  201. pmdp_set_wrprotect(args->mm, vaddr, args->pmdp);
  202. pmd = pmdp_get(args->pmdp);
  203. WARN_ON(pmd_write(pmd));
  204. pmdp_huge_get_and_clear(args->mm, vaddr, args->pmdp);
  205. pmd = pmdp_get(args->pmdp);
  206. WARN_ON(!pmd_none(pmd));
  207. pmd = pfn_pmd(args->pmd_pfn, args->page_prot);
  208. pmd = pmd_wrprotect(pmd);
  209. pmd = pmd_mkclean(pmd);
  210. set_pmd_at(args->mm, vaddr, args->pmdp, pmd);
  211. flush_dcache_page(page);
  212. pmd = pmd_mkwrite(pmd, args->vma);
  213. pmd = pmd_mkdirty(pmd);
  214. pmdp_set_access_flags(args->vma, vaddr, args->pmdp, pmd, 1);
  215. pmd = pmdp_get(args->pmdp);
  216. WARN_ON(!(pmd_write(pmd) && pmd_dirty(pmd)));
  217. pmdp_huge_get_and_clear_full(args->vma, vaddr, args->pmdp, 1);
  218. pmd = pmdp_get(args->pmdp);
  219. WARN_ON(!pmd_none(pmd));
  220. pmd = pmd_mkhuge(pfn_pmd(args->pmd_pfn, args->page_prot));
  221. pmd = pmd_mkyoung(pmd);
  222. set_pmd_at(args->mm, vaddr, args->pmdp, pmd);
  223. flush_dcache_page(page);
  224. pmdp_test_and_clear_young(args->vma, vaddr, args->pmdp);
  225. pmd = pmdp_get(args->pmdp);
  226. WARN_ON(pmd_young(pmd));
  227. /* Clear the pte entries */
  228. pmdp_huge_get_and_clear(args->mm, vaddr, args->pmdp);
  229. pgtable_trans_huge_withdraw(args->mm, args->pmdp);
  230. }
  231. static void __init pmd_leaf_tests(struct pgtable_debug_args *args)
  232. {
  233. pmd_t pmd;
  234. if (!has_transparent_hugepage())
  235. return;
  236. pr_debug("Validating PMD leaf\n");
  237. pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
  238. /*
  239. * PMD based THP is a leaf entry.
  240. */
  241. pmd = pmd_mkhuge(pmd);
  242. WARN_ON(!pmd_leaf(pmd));
  243. }
  244. #ifdef CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD
  245. static void __init pud_basic_tests(struct pgtable_debug_args *args, int idx)
  246. {
  247. pgprot_t prot = vm_get_page_prot(idx);
  248. unsigned long val = idx, *ptr = &val;
  249. pud_t pud;
  250. if (!has_transparent_pud_hugepage())
  251. return;
  252. pr_debug("Validating PUD basic (%pGv)\n", ptr);
  253. pud = pfn_pud(args->fixed_pud_pfn, prot);
  254. /*
  255. * This test needs to be executed after the given page table entry
  256. * is created with pfn_pud() to make sure that vm_get_page_prot(idx)
  257. * does not have the dirty bit enabled from the beginning. This is
  258. * important for platforms like arm64 where (!PTE_RDONLY) indicate
  259. * dirty bit being set.
  260. */
  261. WARN_ON(pud_dirty(pud_wrprotect(pud)));
  262. WARN_ON(!pud_same(pud, pud));
  263. WARN_ON(!pud_young(pud_mkyoung(pud_mkold(pud))));
  264. WARN_ON(!pud_dirty(pud_mkdirty(pud_mkclean(pud))));
  265. WARN_ON(pud_dirty(pud_mkclean(pud_mkdirty(pud))));
  266. WARN_ON(!pud_write(pud_mkwrite(pud_wrprotect(pud))));
  267. WARN_ON(pud_write(pud_wrprotect(pud_mkwrite(pud))));
  268. WARN_ON(pud_young(pud_mkold(pud_mkyoung(pud))));
  269. WARN_ON(pud_dirty(pud_wrprotect(pud_mkclean(pud))));
  270. WARN_ON(!pud_dirty(pud_wrprotect(pud_mkdirty(pud))));
  271. if (mm_pmd_folded(args->mm))
  272. return;
  273. /*
  274. * A huge page does not point to next level page table
  275. * entry. Hence this must qualify as pud_bad().
  276. */
  277. WARN_ON(!pud_bad(pud_mkhuge(pud)));
  278. }
  279. static void __init pud_advanced_tests(struct pgtable_debug_args *args)
  280. {
  281. struct page *page;
  282. unsigned long vaddr = args->vaddr;
  283. pud_t pud;
  284. if (!has_transparent_pud_hugepage())
  285. return;
  286. page = (args->pud_pfn != ULONG_MAX) ? pfn_to_page(args->pud_pfn) : NULL;
  287. if (!page)
  288. return;
  289. /*
  290. * flush_dcache_page() is called after set_pud_at() to clear
  291. * PG_arch_1 for the page on ARM64. The page flag isn't cleared
  292. * when it's released and page allocation check will fail when
  293. * the page is allocated again. For architectures other than ARM64,
  294. * the unexpected overhead of cache flushing is acceptable.
  295. */
  296. pr_debug("Validating PUD advanced\n");
  297. /* Align the address wrt HPAGE_PUD_SIZE */
  298. vaddr &= HPAGE_PUD_MASK;
  299. pud = pfn_pud(args->pud_pfn, args->page_prot);
  300. /*
  301. * Some architectures have debug checks to make sure
  302. * huge pud mapping are only found with devmap entries
  303. * For now test with only devmap entries.
  304. */
  305. pud = pud_mkdevmap(pud);
  306. set_pud_at(args->mm, vaddr, args->pudp, pud);
  307. flush_dcache_page(page);
  308. pudp_set_wrprotect(args->mm, vaddr, args->pudp);
  309. pud = pudp_get(args->pudp);
  310. WARN_ON(pud_write(pud));
  311. #ifndef __PAGETABLE_PMD_FOLDED
  312. pudp_huge_get_and_clear(args->mm, vaddr, args->pudp);
  313. pud = pudp_get(args->pudp);
  314. WARN_ON(!pud_none(pud));
  315. #endif /* __PAGETABLE_PMD_FOLDED */
  316. pud = pfn_pud(args->pud_pfn, args->page_prot);
  317. pud = pud_mkdevmap(pud);
  318. pud = pud_wrprotect(pud);
  319. pud = pud_mkclean(pud);
  320. set_pud_at(args->mm, vaddr, args->pudp, pud);
  321. flush_dcache_page(page);
  322. pud = pud_mkwrite(pud);
  323. pud = pud_mkdirty(pud);
  324. pudp_set_access_flags(args->vma, vaddr, args->pudp, pud, 1);
  325. pud = pudp_get(args->pudp);
  326. WARN_ON(!(pud_write(pud) && pud_dirty(pud)));
  327. #ifndef __PAGETABLE_PMD_FOLDED
  328. pudp_huge_get_and_clear_full(args->vma, vaddr, args->pudp, 1);
  329. pud = pudp_get(args->pudp);
  330. WARN_ON(!pud_none(pud));
  331. #endif /* __PAGETABLE_PMD_FOLDED */
  332. pud = pfn_pud(args->pud_pfn, args->page_prot);
  333. pud = pud_mkdevmap(pud);
  334. pud = pud_mkyoung(pud);
  335. set_pud_at(args->mm, vaddr, args->pudp, pud);
  336. flush_dcache_page(page);
  337. pudp_test_and_clear_young(args->vma, vaddr, args->pudp);
  338. pud = pudp_get(args->pudp);
  339. WARN_ON(pud_young(pud));
  340. pudp_huge_get_and_clear(args->mm, vaddr, args->pudp);
  341. }
  342. static void __init pud_leaf_tests(struct pgtable_debug_args *args)
  343. {
  344. pud_t pud;
  345. if (!has_transparent_pud_hugepage())
  346. return;
  347. pr_debug("Validating PUD leaf\n");
  348. pud = pfn_pud(args->fixed_pud_pfn, args->page_prot);
  349. /*
  350. * PUD based THP is a leaf entry.
  351. */
  352. pud = pud_mkhuge(pud);
  353. WARN_ON(!pud_leaf(pud));
  354. }
  355. #else /* !CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
  356. static void __init pud_basic_tests(struct pgtable_debug_args *args, int idx) { }
  357. static void __init pud_advanced_tests(struct pgtable_debug_args *args) { }
  358. static void __init pud_leaf_tests(struct pgtable_debug_args *args) { }
  359. #endif /* CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
  360. #else /* !CONFIG_TRANSPARENT_HUGEPAGE */
  361. static void __init pmd_basic_tests(struct pgtable_debug_args *args, int idx) { }
  362. static void __init pud_basic_tests(struct pgtable_debug_args *args, int idx) { }
  363. static void __init pmd_advanced_tests(struct pgtable_debug_args *args) { }
  364. static void __init pud_advanced_tests(struct pgtable_debug_args *args) { }
  365. static void __init pmd_leaf_tests(struct pgtable_debug_args *args) { }
  366. static void __init pud_leaf_tests(struct pgtable_debug_args *args) { }
  367. #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
  368. #ifdef CONFIG_HAVE_ARCH_HUGE_VMAP
  369. static void __init pmd_huge_tests(struct pgtable_debug_args *args)
  370. {
  371. pmd_t pmd;
  372. if (!arch_vmap_pmd_supported(args->page_prot) ||
  373. args->fixed_alignment < PMD_SIZE)
  374. return;
  375. pr_debug("Validating PMD huge\n");
  376. /*
  377. * X86 defined pmd_set_huge() verifies that the given
  378. * PMD is not a populated non-leaf entry.
  379. */
  380. WRITE_ONCE(*args->pmdp, __pmd(0));
  381. WARN_ON(!pmd_set_huge(args->pmdp, __pfn_to_phys(args->fixed_pmd_pfn), args->page_prot));
  382. WARN_ON(!pmd_clear_huge(args->pmdp));
  383. pmd = pmdp_get(args->pmdp);
  384. WARN_ON(!pmd_none(pmd));
  385. }
  386. static void __init pud_huge_tests(struct pgtable_debug_args *args)
  387. {
  388. pud_t pud;
  389. if (!arch_vmap_pud_supported(args->page_prot) ||
  390. args->fixed_alignment < PUD_SIZE)
  391. return;
  392. pr_debug("Validating PUD huge\n");
  393. /*
  394. * X86 defined pud_set_huge() verifies that the given
  395. * PUD is not a populated non-leaf entry.
  396. */
  397. WRITE_ONCE(*args->pudp, __pud(0));
  398. WARN_ON(!pud_set_huge(args->pudp, __pfn_to_phys(args->fixed_pud_pfn), args->page_prot));
  399. WARN_ON(!pud_clear_huge(args->pudp));
  400. pud = pudp_get(args->pudp);
  401. WARN_ON(!pud_none(pud));
  402. }
  403. #else /* !CONFIG_HAVE_ARCH_HUGE_VMAP */
  404. static void __init pmd_huge_tests(struct pgtable_debug_args *args) { }
  405. static void __init pud_huge_tests(struct pgtable_debug_args *args) { }
  406. #endif /* CONFIG_HAVE_ARCH_HUGE_VMAP */
  407. static void __init p4d_basic_tests(struct pgtable_debug_args *args)
  408. {
  409. p4d_t p4d;
  410. pr_debug("Validating P4D basic\n");
  411. memset(&p4d, RANDOM_NZVALUE, sizeof(p4d_t));
  412. WARN_ON(!p4d_same(p4d, p4d));
  413. }
  414. static void __init pgd_basic_tests(struct pgtable_debug_args *args)
  415. {
  416. pgd_t pgd;
  417. pr_debug("Validating PGD basic\n");
  418. memset(&pgd, RANDOM_NZVALUE, sizeof(pgd_t));
  419. WARN_ON(!pgd_same(pgd, pgd));
  420. }
  421. #ifndef __PAGETABLE_PUD_FOLDED
  422. static void __init pud_clear_tests(struct pgtable_debug_args *args)
  423. {
  424. pud_t pud = pudp_get(args->pudp);
  425. if (mm_pmd_folded(args->mm))
  426. return;
  427. pr_debug("Validating PUD clear\n");
  428. WARN_ON(pud_none(pud));
  429. pud_clear(args->pudp);
  430. pud = pudp_get(args->pudp);
  431. WARN_ON(!pud_none(pud));
  432. }
  433. static void __init pud_populate_tests(struct pgtable_debug_args *args)
  434. {
  435. pud_t pud;
  436. if (mm_pmd_folded(args->mm))
  437. return;
  438. pr_debug("Validating PUD populate\n");
  439. /*
  440. * This entry points to next level page table page.
  441. * Hence this must not qualify as pud_bad().
  442. */
  443. pud_populate(args->mm, args->pudp, args->start_pmdp);
  444. pud = pudp_get(args->pudp);
  445. WARN_ON(pud_bad(pud));
  446. }
  447. #else /* !__PAGETABLE_PUD_FOLDED */
  448. static void __init pud_clear_tests(struct pgtable_debug_args *args) { }
  449. static void __init pud_populate_tests(struct pgtable_debug_args *args) { }
  450. #endif /* PAGETABLE_PUD_FOLDED */
  451. #ifndef __PAGETABLE_P4D_FOLDED
  452. static void __init p4d_clear_tests(struct pgtable_debug_args *args)
  453. {
  454. p4d_t p4d = p4dp_get(args->p4dp);
  455. if (mm_pud_folded(args->mm))
  456. return;
  457. pr_debug("Validating P4D clear\n");
  458. WARN_ON(p4d_none(p4d));
  459. p4d_clear(args->p4dp);
  460. p4d = p4dp_get(args->p4dp);
  461. WARN_ON(!p4d_none(p4d));
  462. }
  463. static void __init p4d_populate_tests(struct pgtable_debug_args *args)
  464. {
  465. p4d_t p4d;
  466. if (mm_pud_folded(args->mm))
  467. return;
  468. pr_debug("Validating P4D populate\n");
  469. /*
  470. * This entry points to next level page table page.
  471. * Hence this must not qualify as p4d_bad().
  472. */
  473. pud_clear(args->pudp);
  474. p4d_clear(args->p4dp);
  475. p4d_populate(args->mm, args->p4dp, args->start_pudp);
  476. p4d = p4dp_get(args->p4dp);
  477. WARN_ON(p4d_bad(p4d));
  478. }
  479. static void __init pgd_clear_tests(struct pgtable_debug_args *args)
  480. {
  481. pgd_t pgd = pgdp_get(args->pgdp);
  482. if (mm_p4d_folded(args->mm))
  483. return;
  484. pr_debug("Validating PGD clear\n");
  485. WARN_ON(pgd_none(pgd));
  486. pgd_clear(args->pgdp);
  487. pgd = pgdp_get(args->pgdp);
  488. WARN_ON(!pgd_none(pgd));
  489. }
  490. static void __init pgd_populate_tests(struct pgtable_debug_args *args)
  491. {
  492. pgd_t pgd;
  493. if (mm_p4d_folded(args->mm))
  494. return;
  495. pr_debug("Validating PGD populate\n");
  496. /*
  497. * This entry points to next level page table page.
  498. * Hence this must not qualify as pgd_bad().
  499. */
  500. p4d_clear(args->p4dp);
  501. pgd_clear(args->pgdp);
  502. pgd_populate(args->mm, args->pgdp, args->start_p4dp);
  503. pgd = pgdp_get(args->pgdp);
  504. WARN_ON(pgd_bad(pgd));
  505. }
  506. #else /* !__PAGETABLE_P4D_FOLDED */
  507. static void __init p4d_clear_tests(struct pgtable_debug_args *args) { }
  508. static void __init pgd_clear_tests(struct pgtable_debug_args *args) { }
  509. static void __init p4d_populate_tests(struct pgtable_debug_args *args) { }
  510. static void __init pgd_populate_tests(struct pgtable_debug_args *args) { }
  511. #endif /* PAGETABLE_P4D_FOLDED */
  512. static void __init pte_clear_tests(struct pgtable_debug_args *args)
  513. {
  514. struct page *page;
  515. pte_t pte = pfn_pte(args->pte_pfn, args->page_prot);
  516. page = (args->pte_pfn != ULONG_MAX) ? pfn_to_page(args->pte_pfn) : NULL;
  517. if (!page)
  518. return;
  519. /*
  520. * flush_dcache_page() is called after set_pte_at() to clear
  521. * PG_arch_1 for the page on ARM64. The page flag isn't cleared
  522. * when it's released and page allocation check will fail when
  523. * the page is allocated again. For architectures other than ARM64,
  524. * the unexpected overhead of cache flushing is acceptable.
  525. */
  526. pr_debug("Validating PTE clear\n");
  527. if (WARN_ON(!args->ptep))
  528. return;
  529. set_pte_at(args->mm, args->vaddr, args->ptep, pte);
  530. WARN_ON(pte_none(pte));
  531. flush_dcache_page(page);
  532. barrier();
  533. ptep_clear(args->mm, args->vaddr, args->ptep);
  534. pte = ptep_get(args->ptep);
  535. WARN_ON(!pte_none(pte));
  536. }
  537. static void __init pmd_clear_tests(struct pgtable_debug_args *args)
  538. {
  539. pmd_t pmd = pmdp_get(args->pmdp);
  540. pr_debug("Validating PMD clear\n");
  541. WARN_ON(pmd_none(pmd));
  542. pmd_clear(args->pmdp);
  543. pmd = pmdp_get(args->pmdp);
  544. WARN_ON(!pmd_none(pmd));
  545. }
  546. static void __init pmd_populate_tests(struct pgtable_debug_args *args)
  547. {
  548. pmd_t pmd;
  549. pr_debug("Validating PMD populate\n");
  550. /*
  551. * This entry points to next level page table page.
  552. * Hence this must not qualify as pmd_bad().
  553. */
  554. pmd_populate(args->mm, args->pmdp, args->start_ptep);
  555. pmd = pmdp_get(args->pmdp);
  556. WARN_ON(pmd_bad(pmd));
  557. }
  558. static void __init pte_special_tests(struct pgtable_debug_args *args)
  559. {
  560. pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);
  561. if (!IS_ENABLED(CONFIG_ARCH_HAS_PTE_SPECIAL))
  562. return;
  563. pr_debug("Validating PTE special\n");
  564. WARN_ON(!pte_special(pte_mkspecial(pte)));
  565. }
  566. static void __init pte_protnone_tests(struct pgtable_debug_args *args)
  567. {
  568. pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot_none);
  569. if (!IS_ENABLED(CONFIG_NUMA_BALANCING))
  570. return;
  571. pr_debug("Validating PTE protnone\n");
  572. WARN_ON(!pte_protnone(pte));
  573. WARN_ON(!pte_present(pte));
  574. }
  575. #ifdef CONFIG_TRANSPARENT_HUGEPAGE
  576. static void __init pmd_protnone_tests(struct pgtable_debug_args *args)
  577. {
  578. pmd_t pmd;
  579. if (!IS_ENABLED(CONFIG_NUMA_BALANCING))
  580. return;
  581. if (!has_transparent_hugepage())
  582. return;
  583. pr_debug("Validating PMD protnone\n");
  584. pmd = pmd_mkhuge(pfn_pmd(args->fixed_pmd_pfn, args->page_prot_none));
  585. WARN_ON(!pmd_protnone(pmd));
  586. WARN_ON(!pmd_present(pmd));
  587. }
  588. #else /* !CONFIG_TRANSPARENT_HUGEPAGE */
  589. static void __init pmd_protnone_tests(struct pgtable_debug_args *args) { }
  590. #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
  591. #ifdef CONFIG_ARCH_HAS_PTE_DEVMAP
  592. static void __init pte_devmap_tests(struct pgtable_debug_args *args)
  593. {
  594. pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);
  595. pr_debug("Validating PTE devmap\n");
  596. WARN_ON(!pte_devmap(pte_mkdevmap(pte)));
  597. }
  598. #ifdef CONFIG_TRANSPARENT_HUGEPAGE
  599. static void __init pmd_devmap_tests(struct pgtable_debug_args *args)
  600. {
  601. pmd_t pmd;
  602. if (!has_transparent_hugepage())
  603. return;
  604. pr_debug("Validating PMD devmap\n");
  605. pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
  606. WARN_ON(!pmd_devmap(pmd_mkdevmap(pmd)));
  607. }
  608. #ifdef CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD
  609. static void __init pud_devmap_tests(struct pgtable_debug_args *args)
  610. {
  611. pud_t pud;
  612. if (!has_transparent_pud_hugepage())
  613. return;
  614. pr_debug("Validating PUD devmap\n");
  615. pud = pfn_pud(args->fixed_pud_pfn, args->page_prot);
  616. WARN_ON(!pud_devmap(pud_mkdevmap(pud)));
  617. }
  618. #else /* !CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
  619. static void __init pud_devmap_tests(struct pgtable_debug_args *args) { }
  620. #endif /* CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
  621. #else /* CONFIG_TRANSPARENT_HUGEPAGE */
  622. static void __init pmd_devmap_tests(struct pgtable_debug_args *args) { }
  623. static void __init pud_devmap_tests(struct pgtable_debug_args *args) { }
  624. #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
  625. #else
  626. static void __init pte_devmap_tests(struct pgtable_debug_args *args) { }
  627. static void __init pmd_devmap_tests(struct pgtable_debug_args *args) { }
  628. static void __init pud_devmap_tests(struct pgtable_debug_args *args) { }
  629. #endif /* CONFIG_ARCH_HAS_PTE_DEVMAP */
  630. static void __init pte_soft_dirty_tests(struct pgtable_debug_args *args)
  631. {
  632. pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);
  633. if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY))
  634. return;
  635. pr_debug("Validating PTE soft dirty\n");
  636. WARN_ON(!pte_soft_dirty(pte_mksoft_dirty(pte)));
  637. WARN_ON(pte_soft_dirty(pte_clear_soft_dirty(pte)));
  638. }
  639. static void __init pte_swap_soft_dirty_tests(struct pgtable_debug_args *args)
  640. {
  641. pte_t pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);
  642. if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY))
  643. return;
  644. pr_debug("Validating PTE swap soft dirty\n");
  645. WARN_ON(!pte_swp_soft_dirty(pte_swp_mksoft_dirty(pte)));
  646. WARN_ON(pte_swp_soft_dirty(pte_swp_clear_soft_dirty(pte)));
  647. }
  648. #ifdef CONFIG_TRANSPARENT_HUGEPAGE
  649. static void __init pmd_soft_dirty_tests(struct pgtable_debug_args *args)
  650. {
  651. pmd_t pmd;
  652. if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY))
  653. return;
  654. if (!has_transparent_hugepage())
  655. return;
  656. pr_debug("Validating PMD soft dirty\n");
  657. pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
  658. WARN_ON(!pmd_soft_dirty(pmd_mksoft_dirty(pmd)));
  659. WARN_ON(pmd_soft_dirty(pmd_clear_soft_dirty(pmd)));
  660. }
  661. static void __init pmd_swap_soft_dirty_tests(struct pgtable_debug_args *args)
  662. {
  663. pmd_t pmd;
  664. if (!IS_ENABLED(CONFIG_MEM_SOFT_DIRTY) ||
  665. !IS_ENABLED(CONFIG_ARCH_ENABLE_THP_MIGRATION))
  666. return;
  667. if (!has_transparent_hugepage())
  668. return;
  669. pr_debug("Validating PMD swap soft dirty\n");
  670. pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
  671. WARN_ON(!pmd_swp_soft_dirty(pmd_swp_mksoft_dirty(pmd)));
  672. WARN_ON(pmd_swp_soft_dirty(pmd_swp_clear_soft_dirty(pmd)));
  673. }
  674. #else /* !CONFIG_TRANSPARENT_HUGEPAGE */
  675. static void __init pmd_soft_dirty_tests(struct pgtable_debug_args *args) { }
  676. static void __init pmd_swap_soft_dirty_tests(struct pgtable_debug_args *args) { }
  677. #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
  678. static void __init pte_swap_exclusive_tests(struct pgtable_debug_args *args)
  679. {
  680. unsigned long max_swap_offset;
  681. swp_entry_t entry, entry2;
  682. pte_t pte;
  683. pr_debug("Validating PTE swap exclusive\n");
  684. /* See generic_max_swapfile_size(): probe the maximum offset */
  685. max_swap_offset = swp_offset(pte_to_swp_entry(swp_entry_to_pte(swp_entry(0, ~0UL))));
  686. /* Create a swp entry with all possible bits set */
  687. entry = swp_entry((1 << MAX_SWAPFILES_SHIFT) - 1, max_swap_offset);
  688. pte = swp_entry_to_pte(entry);
  689. WARN_ON(pte_swp_exclusive(pte));
  690. WARN_ON(!is_swap_pte(pte));
  691. entry2 = pte_to_swp_entry(pte);
  692. WARN_ON(memcmp(&entry, &entry2, sizeof(entry)));
  693. pte = pte_swp_mkexclusive(pte);
  694. WARN_ON(!pte_swp_exclusive(pte));
  695. WARN_ON(!is_swap_pte(pte));
  696. WARN_ON(pte_swp_soft_dirty(pte));
  697. entry2 = pte_to_swp_entry(pte);
  698. WARN_ON(memcmp(&entry, &entry2, sizeof(entry)));
  699. pte = pte_swp_clear_exclusive(pte);
  700. WARN_ON(pte_swp_exclusive(pte));
  701. WARN_ON(!is_swap_pte(pte));
  702. entry2 = pte_to_swp_entry(pte);
  703. WARN_ON(memcmp(&entry, &entry2, sizeof(entry)));
  704. }
  705. static void __init pte_swap_tests(struct pgtable_debug_args *args)
  706. {
  707. swp_entry_t swp;
  708. pte_t pte;
  709. pr_debug("Validating PTE swap\n");
  710. pte = pfn_pte(args->fixed_pte_pfn, args->page_prot);
  711. swp = __pte_to_swp_entry(pte);
  712. pte = __swp_entry_to_pte(swp);
  713. WARN_ON(args->fixed_pte_pfn != pte_pfn(pte));
  714. }
  715. #ifdef CONFIG_ARCH_ENABLE_THP_MIGRATION
  716. static void __init pmd_swap_tests(struct pgtable_debug_args *args)
  717. {
  718. swp_entry_t swp;
  719. pmd_t pmd;
  720. if (!has_transparent_hugepage())
  721. return;
  722. pr_debug("Validating PMD swap\n");
  723. pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
  724. swp = __pmd_to_swp_entry(pmd);
  725. pmd = __swp_entry_to_pmd(swp);
  726. WARN_ON(args->fixed_pmd_pfn != pmd_pfn(pmd));
  727. }
  728. #else /* !CONFIG_ARCH_ENABLE_THP_MIGRATION */
  729. static void __init pmd_swap_tests(struct pgtable_debug_args *args) { }
  730. #endif /* CONFIG_ARCH_ENABLE_THP_MIGRATION */
  731. static void __init swap_migration_tests(struct pgtable_debug_args *args)
  732. {
  733. struct page *page;
  734. swp_entry_t swp;
  735. if (!IS_ENABLED(CONFIG_MIGRATION))
  736. return;
  737. /*
  738. * swap_migration_tests() requires a dedicated page as it needs to
  739. * be locked before creating a migration entry from it. Locking the
  740. * page that actually maps kernel text ('start_kernel') can be real
  741. * problematic. Lets use the allocated page explicitly for this
  742. * purpose.
  743. */
  744. page = (args->pte_pfn != ULONG_MAX) ? pfn_to_page(args->pte_pfn) : NULL;
  745. if (!page)
  746. return;
  747. pr_debug("Validating swap migration\n");
  748. /*
  749. * make_[readable|writable]_migration_entry() expects given page to
  750. * be locked, otherwise it stumbles upon a BUG_ON().
  751. */
  752. __SetPageLocked(page);
  753. swp = make_writable_migration_entry(page_to_pfn(page));
  754. WARN_ON(!is_migration_entry(swp));
  755. WARN_ON(!is_writable_migration_entry(swp));
  756. swp = make_readable_migration_entry(swp_offset(swp));
  757. WARN_ON(!is_migration_entry(swp));
  758. WARN_ON(is_writable_migration_entry(swp));
  759. swp = make_readable_migration_entry(page_to_pfn(page));
  760. WARN_ON(!is_migration_entry(swp));
  761. WARN_ON(is_writable_migration_entry(swp));
  762. __ClearPageLocked(page);
  763. }
  764. #ifdef CONFIG_HUGETLB_PAGE
  765. static void __init hugetlb_basic_tests(struct pgtable_debug_args *args)
  766. {
  767. struct page *page;
  768. pte_t pte;
  769. pr_debug("Validating HugeTLB basic\n");
  770. /*
  771. * Accessing the page associated with the pfn is safe here,
  772. * as it was previously derived from a real kernel symbol.
  773. */
  774. page = pfn_to_page(args->fixed_pmd_pfn);
  775. pte = mk_huge_pte(page, args->page_prot);
  776. WARN_ON(!huge_pte_dirty(huge_pte_mkdirty(pte)));
  777. WARN_ON(!huge_pte_write(huge_pte_mkwrite(huge_pte_wrprotect(pte))));
  778. WARN_ON(huge_pte_write(huge_pte_wrprotect(huge_pte_mkwrite(pte))));
  779. #ifdef CONFIG_ARCH_WANT_GENERAL_HUGETLB
  780. pte = pfn_pte(args->fixed_pmd_pfn, args->page_prot);
  781. WARN_ON(!pte_huge(arch_make_huge_pte(pte, PMD_SHIFT, VM_ACCESS_FLAGS)));
  782. #endif /* CONFIG_ARCH_WANT_GENERAL_HUGETLB */
  783. }
  784. #else /* !CONFIG_HUGETLB_PAGE */
  785. static void __init hugetlb_basic_tests(struct pgtable_debug_args *args) { }
  786. #endif /* CONFIG_HUGETLB_PAGE */
  787. #ifdef CONFIG_TRANSPARENT_HUGEPAGE
  788. static void __init pmd_thp_tests(struct pgtable_debug_args *args)
  789. {
  790. pmd_t pmd;
  791. if (!has_transparent_hugepage())
  792. return;
  793. pr_debug("Validating PMD based THP\n");
  794. /*
  795. * pmd_trans_huge() and pmd_present() must return positive after
  796. * MMU invalidation with pmd_mkinvalid(). This behavior is an
  797. * optimization for transparent huge page. pmd_trans_huge() must
  798. * be true if pmd_page() returns a valid THP to avoid taking the
  799. * pmd_lock when others walk over non transhuge pmds (i.e. there
  800. * are no THP allocated). Especially when splitting a THP and
  801. * removing the present bit from the pmd, pmd_trans_huge() still
  802. * needs to return true. pmd_present() should be true whenever
  803. * pmd_trans_huge() returns true.
  804. */
  805. pmd = pfn_pmd(args->fixed_pmd_pfn, args->page_prot);
  806. WARN_ON(!pmd_trans_huge(pmd_mkhuge(pmd)));
  807. #ifndef __HAVE_ARCH_PMDP_INVALIDATE
  808. WARN_ON(!pmd_trans_huge(pmd_mkinvalid(pmd_mkhuge(pmd))));
  809. WARN_ON(!pmd_present(pmd_mkinvalid(pmd_mkhuge(pmd))));
  810. WARN_ON(!pmd_leaf(pmd_mkinvalid(pmd_mkhuge(pmd))));
  811. #endif /* __HAVE_ARCH_PMDP_INVALIDATE */
  812. }
  813. #ifdef CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD
  814. static void __init pud_thp_tests(struct pgtable_debug_args *args)
  815. {
  816. pud_t pud;
  817. if (!has_transparent_pud_hugepage())
  818. return;
  819. pr_debug("Validating PUD based THP\n");
  820. pud = pfn_pud(args->fixed_pud_pfn, args->page_prot);
  821. WARN_ON(!pud_trans_huge(pud_mkhuge(pud)));
  822. /*
  823. * pud_mkinvalid() has been dropped for now. Enable back
  824. * these tests when it comes back with a modified pud_present().
  825. *
  826. * WARN_ON(!pud_trans_huge(pud_mkinvalid(pud_mkhuge(pud))));
  827. * WARN_ON(!pud_present(pud_mkinvalid(pud_mkhuge(pud))));
  828. */
  829. }
  830. #else /* !CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
  831. static void __init pud_thp_tests(struct pgtable_debug_args *args) { }
  832. #endif /* CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD */
  833. #else /* !CONFIG_TRANSPARENT_HUGEPAGE */
  834. static void __init pmd_thp_tests(struct pgtable_debug_args *args) { }
  835. static void __init pud_thp_tests(struct pgtable_debug_args *args) { }
  836. #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
  837. static unsigned long __init get_random_vaddr(void)
  838. {
  839. unsigned long random_vaddr, random_pages, total_user_pages;
  840. total_user_pages = (TASK_SIZE - FIRST_USER_ADDRESS) / PAGE_SIZE;
  841. random_pages = get_random_long() % total_user_pages;
  842. random_vaddr = FIRST_USER_ADDRESS + random_pages * PAGE_SIZE;
  843. return random_vaddr;
  844. }
  845. static void __init destroy_args(struct pgtable_debug_args *args)
  846. {
  847. struct page *page = NULL;
  848. /* Free (huge) page */
  849. if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
  850. has_transparent_pud_hugepage() &&
  851. args->pud_pfn != ULONG_MAX) {
  852. if (args->is_contiguous_page) {
  853. free_contig_range(args->pud_pfn,
  854. (1 << (HPAGE_PUD_SHIFT - PAGE_SHIFT)));
  855. } else {
  856. page = pfn_to_page(args->pud_pfn);
  857. __free_pages(page, HPAGE_PUD_SHIFT - PAGE_SHIFT);
  858. }
  859. args->pud_pfn = ULONG_MAX;
  860. args->pmd_pfn = ULONG_MAX;
  861. args->pte_pfn = ULONG_MAX;
  862. }
  863. if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
  864. has_transparent_hugepage() &&
  865. args->pmd_pfn != ULONG_MAX) {
  866. if (args->is_contiguous_page) {
  867. free_contig_range(args->pmd_pfn, (1 << HPAGE_PMD_ORDER));
  868. } else {
  869. page = pfn_to_page(args->pmd_pfn);
  870. __free_pages(page, HPAGE_PMD_ORDER);
  871. }
  872. args->pmd_pfn = ULONG_MAX;
  873. args->pte_pfn = ULONG_MAX;
  874. }
  875. if (args->pte_pfn != ULONG_MAX) {
  876. page = pfn_to_page(args->pte_pfn);
  877. __free_page(page);
  878. args->pte_pfn = ULONG_MAX;
  879. }
  880. /* Free page table entries */
  881. if (args->start_ptep) {
  882. pmd_clear(args->pmdp);
  883. pte_free(args->mm, args->start_ptep);
  884. mm_dec_nr_ptes(args->mm);
  885. }
  886. if (args->start_pmdp) {
  887. pud_clear(args->pudp);
  888. pmd_free(args->mm, args->start_pmdp);
  889. mm_dec_nr_pmds(args->mm);
  890. }
  891. if (args->start_pudp) {
  892. p4d_clear(args->p4dp);
  893. pud_free(args->mm, args->start_pudp);
  894. mm_dec_nr_puds(args->mm);
  895. }
  896. if (args->start_p4dp) {
  897. pgd_clear(args->pgdp);
  898. p4d_free(args->mm, args->start_p4dp);
  899. }
  900. /* Free vma and mm struct */
  901. if (args->vma)
  902. vm_area_free(args->vma);
  903. if (args->mm)
  904. mmput(args->mm);
  905. }
  906. static struct page * __init
  907. debug_vm_pgtable_alloc_huge_page(struct pgtable_debug_args *args, int order)
  908. {
  909. struct page *page = NULL;
  910. #ifdef CONFIG_CONTIG_ALLOC
  911. if (order > MAX_PAGE_ORDER) {
  912. page = alloc_contig_pages((1 << order), GFP_KERNEL,
  913. first_online_node, NULL);
  914. if (page) {
  915. args->is_contiguous_page = true;
  916. return page;
  917. }
  918. }
  919. #endif
  920. if (order <= MAX_PAGE_ORDER)
  921. page = alloc_pages(GFP_KERNEL, order);
  922. return page;
  923. }
  924. /*
  925. * Check if a physical memory range described by <pstart, pend> contains
  926. * an area that is of size psize, and aligned to psize.
  927. *
  928. * Don't use address 0, an all-zeroes physical address might mask bugs, and
  929. * it's not used on x86.
  930. */
  931. static void __init phys_align_check(phys_addr_t pstart,
  932. phys_addr_t pend, unsigned long psize,
  933. phys_addr_t *physp, unsigned long *alignp)
  934. {
  935. phys_addr_t aligned_start, aligned_end;
  936. if (pstart == 0)
  937. pstart = PAGE_SIZE;
  938. aligned_start = ALIGN(pstart, psize);
  939. aligned_end = aligned_start + psize;
  940. if (aligned_end > aligned_start && aligned_end <= pend) {
  941. *alignp = psize;
  942. *physp = aligned_start;
  943. }
  944. }
  945. static void __init init_fixed_pfns(struct pgtable_debug_args *args)
  946. {
  947. u64 idx;
  948. phys_addr_t phys, pstart, pend;
  949. /*
  950. * Initialize the fixed pfns. To do this, try to find a
  951. * valid physical range, preferably aligned to PUD_SIZE,
  952. * but settling for aligned to PMD_SIZE as a fallback. If
  953. * neither of those is found, use the physical address of
  954. * the start_kernel symbol.
  955. *
  956. * The memory doesn't need to be allocated, it just needs to exist
  957. * as usable memory. It won't be touched.
  958. *
  959. * The alignment is recorded, and can be checked to see if we
  960. * can run the tests that require an actual valid physical
  961. * address range on some architectures ({pmd,pud}_huge_test
  962. * on x86).
  963. */
  964. phys = __pa_symbol(&start_kernel);
  965. args->fixed_alignment = PAGE_SIZE;
  966. for_each_mem_range(idx, &pstart, &pend) {
  967. /* First check for a PUD-aligned area */
  968. phys_align_check(pstart, pend, PUD_SIZE, &phys,
  969. &args->fixed_alignment);
  970. /* If a PUD-aligned area is found, we're done */
  971. if (args->fixed_alignment == PUD_SIZE)
  972. break;
  973. /*
  974. * If no PMD-aligned area found yet, check for one,
  975. * but continue the loop to look for a PUD-aligned area.
  976. */
  977. if (args->fixed_alignment < PMD_SIZE)
  978. phys_align_check(pstart, pend, PMD_SIZE, &phys,
  979. &args->fixed_alignment);
  980. }
  981. args->fixed_pgd_pfn = __phys_to_pfn(phys & PGDIR_MASK);
  982. args->fixed_p4d_pfn = __phys_to_pfn(phys & P4D_MASK);
  983. args->fixed_pud_pfn = __phys_to_pfn(phys & PUD_MASK);
  984. args->fixed_pmd_pfn = __phys_to_pfn(phys & PMD_MASK);
  985. args->fixed_pte_pfn = __phys_to_pfn(phys & PAGE_MASK);
  986. WARN_ON(!pfn_valid(args->fixed_pte_pfn));
  987. }
  988. static int __init init_args(struct pgtable_debug_args *args)
  989. {
  990. struct page *page = NULL;
  991. int ret = 0;
  992. /*
  993. * Initialize the debugging data.
  994. *
  995. * vm_get_page_prot(VM_NONE) or vm_get_page_prot(VM_SHARED|VM_NONE)
  996. * will help create page table entries with PROT_NONE permission as
  997. * required for pxx_protnone_tests().
  998. */
  999. memset(args, 0, sizeof(*args));
  1000. args->vaddr = get_random_vaddr();
  1001. args->page_prot = vm_get_page_prot(VM_ACCESS_FLAGS);
  1002. args->page_prot_none = vm_get_page_prot(VM_NONE);
  1003. args->is_contiguous_page = false;
  1004. args->pud_pfn = ULONG_MAX;
  1005. args->pmd_pfn = ULONG_MAX;
  1006. args->pte_pfn = ULONG_MAX;
  1007. args->fixed_pgd_pfn = ULONG_MAX;
  1008. args->fixed_p4d_pfn = ULONG_MAX;
  1009. args->fixed_pud_pfn = ULONG_MAX;
  1010. args->fixed_pmd_pfn = ULONG_MAX;
  1011. args->fixed_pte_pfn = ULONG_MAX;
  1012. /* Allocate mm and vma */
  1013. args->mm = mm_alloc();
  1014. if (!args->mm) {
  1015. pr_err("Failed to allocate mm struct\n");
  1016. ret = -ENOMEM;
  1017. goto error;
  1018. }
  1019. args->vma = vm_area_alloc(args->mm);
  1020. if (!args->vma) {
  1021. pr_err("Failed to allocate vma\n");
  1022. ret = -ENOMEM;
  1023. goto error;
  1024. }
  1025. /*
  1026. * Allocate page table entries. They will be modified in the tests.
  1027. * Lets save the page table entries so that they can be released
  1028. * when the tests are completed.
  1029. */
  1030. args->pgdp = pgd_offset(args->mm, args->vaddr);
  1031. args->p4dp = p4d_alloc(args->mm, args->pgdp, args->vaddr);
  1032. if (!args->p4dp) {
  1033. pr_err("Failed to allocate p4d entries\n");
  1034. ret = -ENOMEM;
  1035. goto error;
  1036. }
  1037. args->start_p4dp = p4d_offset(args->pgdp, 0UL);
  1038. WARN_ON(!args->start_p4dp);
  1039. args->pudp = pud_alloc(args->mm, args->p4dp, args->vaddr);
  1040. if (!args->pudp) {
  1041. pr_err("Failed to allocate pud entries\n");
  1042. ret = -ENOMEM;
  1043. goto error;
  1044. }
  1045. args->start_pudp = pud_offset(args->p4dp, 0UL);
  1046. WARN_ON(!args->start_pudp);
  1047. args->pmdp = pmd_alloc(args->mm, args->pudp, args->vaddr);
  1048. if (!args->pmdp) {
  1049. pr_err("Failed to allocate pmd entries\n");
  1050. ret = -ENOMEM;
  1051. goto error;
  1052. }
  1053. args->start_pmdp = pmd_offset(args->pudp, 0UL);
  1054. WARN_ON(!args->start_pmdp);
  1055. if (pte_alloc(args->mm, args->pmdp)) {
  1056. pr_err("Failed to allocate pte entries\n");
  1057. ret = -ENOMEM;
  1058. goto error;
  1059. }
  1060. args->start_ptep = pmd_pgtable(pmdp_get(args->pmdp));
  1061. WARN_ON(!args->start_ptep);
  1062. init_fixed_pfns(args);
  1063. /*
  1064. * Allocate (huge) pages because some of the tests need to access
  1065. * the data in the pages. The corresponding tests will be skipped
  1066. * if we fail to allocate (huge) pages.
  1067. */
  1068. if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
  1069. has_transparent_pud_hugepage()) {
  1070. page = debug_vm_pgtable_alloc_huge_page(args,
  1071. HPAGE_PUD_SHIFT - PAGE_SHIFT);
  1072. if (page) {
  1073. args->pud_pfn = page_to_pfn(page);
  1074. args->pmd_pfn = args->pud_pfn;
  1075. args->pte_pfn = args->pud_pfn;
  1076. return 0;
  1077. }
  1078. }
  1079. if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE) &&
  1080. has_transparent_hugepage()) {
  1081. page = debug_vm_pgtable_alloc_huge_page(args, HPAGE_PMD_ORDER);
  1082. if (page) {
  1083. args->pmd_pfn = page_to_pfn(page);
  1084. args->pte_pfn = args->pmd_pfn;
  1085. return 0;
  1086. }
  1087. }
  1088. page = alloc_page(GFP_KERNEL);
  1089. if (page)
  1090. args->pte_pfn = page_to_pfn(page);
  1091. return 0;
  1092. error:
  1093. destroy_args(args);
  1094. return ret;
  1095. }
  1096. static int __init debug_vm_pgtable(void)
  1097. {
  1098. struct pgtable_debug_args args;
  1099. spinlock_t *ptl = NULL;
  1100. int idx, ret;
  1101. pr_info("Validating architecture page table helpers\n");
  1102. ret = init_args(&args);
  1103. if (ret)
  1104. return ret;
  1105. /*
  1106. * Iterate over each possible vm_flags to make sure that all
  1107. * the basic page table transformation validations just hold
  1108. * true irrespective of the starting protection value for a
  1109. * given page table entry.
  1110. *
  1111. * Protection based vm_flags combinations are always linear
  1112. * and increasing i.e starting from VM_NONE and going up to
  1113. * (VM_SHARED | READ | WRITE | EXEC).
  1114. */
  1115. #define VM_FLAGS_START (VM_NONE)
  1116. #define VM_FLAGS_END (VM_SHARED | VM_EXEC | VM_WRITE | VM_READ)
  1117. for (idx = VM_FLAGS_START; idx <= VM_FLAGS_END; idx++) {
  1118. pte_basic_tests(&args, idx);
  1119. pmd_basic_tests(&args, idx);
  1120. pud_basic_tests(&args, idx);
  1121. }
  1122. /*
  1123. * Both P4D and PGD level tests are very basic which do not
  1124. * involve creating page table entries from the protection
  1125. * value and the given pfn. Hence just keep them out from
  1126. * the above iteration for now to save some test execution
  1127. * time.
  1128. */
  1129. p4d_basic_tests(&args);
  1130. pgd_basic_tests(&args);
  1131. pmd_leaf_tests(&args);
  1132. pud_leaf_tests(&args);
  1133. pte_special_tests(&args);
  1134. pte_protnone_tests(&args);
  1135. pmd_protnone_tests(&args);
  1136. pte_devmap_tests(&args);
  1137. pmd_devmap_tests(&args);
  1138. pud_devmap_tests(&args);
  1139. pte_soft_dirty_tests(&args);
  1140. pmd_soft_dirty_tests(&args);
  1141. pte_swap_soft_dirty_tests(&args);
  1142. pmd_swap_soft_dirty_tests(&args);
  1143. pte_swap_exclusive_tests(&args);
  1144. pte_swap_tests(&args);
  1145. pmd_swap_tests(&args);
  1146. swap_migration_tests(&args);
  1147. pmd_thp_tests(&args);
  1148. pud_thp_tests(&args);
  1149. hugetlb_basic_tests(&args);
  1150. /*
  1151. * Page table modifying tests. They need to hold
  1152. * proper page table lock.
  1153. */
  1154. args.ptep = pte_offset_map_lock(args.mm, args.pmdp, args.vaddr, &ptl);
  1155. pte_clear_tests(&args);
  1156. pte_advanced_tests(&args);
  1157. if (args.ptep)
  1158. pte_unmap_unlock(args.ptep, ptl);
  1159. ptl = pmd_lock(args.mm, args.pmdp);
  1160. pmd_clear_tests(&args);
  1161. pmd_advanced_tests(&args);
  1162. pmd_huge_tests(&args);
  1163. pmd_populate_tests(&args);
  1164. spin_unlock(ptl);
  1165. ptl = pud_lock(args.mm, args.pudp);
  1166. pud_clear_tests(&args);
  1167. pud_advanced_tests(&args);
  1168. pud_huge_tests(&args);
  1169. pud_populate_tests(&args);
  1170. spin_unlock(ptl);
  1171. spin_lock(&(args.mm->page_table_lock));
  1172. p4d_clear_tests(&args);
  1173. pgd_clear_tests(&args);
  1174. p4d_populate_tests(&args);
  1175. pgd_populate_tests(&args);
  1176. spin_unlock(&(args.mm->page_table_lock));
  1177. destroy_args(&args);
  1178. return 0;
  1179. }
  1180. late_initcall(debug_vm_pgtable);