// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright IBM Corp. 2011
 */
#include <linux/hugetlb.h>
#include <linux/proc_fs.h>
#include <linux/vmalloc.h>
#include <linux/mm.h>
#include <asm/cacheflush.h>
#include <asm/facility.h>
#include <asm/pgalloc.h>
#include <asm/kfence.h>
#include <asm/page.h>
#include <asm/asm.h>
#include <asm/set_memory.h>
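
/*
 * Set storage keys within a 1MB frame using the SSKE instruction with the
 * multiple-block control bit set; SSKE returns the address of the next
 * 4KB block to be processed, so the caller can loop until the frame
 * boundary is reached.
 */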
static inline unsigned long sske_frame(unsigned long addr, unsigned char skey)
{
	asm volatile(".insn rrf,0xb22b0000,%[skey],%[addr],1,0"
		     : [addr] "+a" (addr) : [skey] "d" (skey));
	return addr;
}

void __storage_key_init_range(unsigned long start, unsigned long end)
{
	unsigned long boundary, size;

	while (start < end) {
		if (MACHINE_HAS_EDAT1) {
			/* set storage keys for a 1MB frame */
			size = 1UL << 20;
			boundary = (start + size) & ~(size - 1);
			if (boundary <= end) {
				do {
					start = sske_frame(start, PAGE_DEFAULT_KEY);
				} while (start < boundary);
				continue;
			}
		}
		page_set_storage_key(start, PAGE_DEFAULT_KEY, 1);
		start += PAGE_SIZE;
	}
}

#ifdef CONFIG_PROC_FS
atomic_long_t __bootdata_preserved(direct_pages_count[PG_DIRECT_MAP_MAX]);

void arch_report_meminfo(struct seq_file *m)
{
	seq_printf(m, "DirectMap4k:    %8lu kB\n",
		   atomic_long_read(&direct_pages_count[PG_DIRECT_MAP_4K]) << 2);
	seq_printf(m, "DirectMap1M:    %8lu kB\n",
		   atomic_long_read(&direct_pages_count[PG_DIRECT_MAP_1M]) << 10);
	seq_printf(m, "DirectMap2G:    %8lu kB\n",
		   atomic_long_read(&direct_pages_count[PG_DIRECT_MAP_2G]) << 21);
}
#endif /* CONFIG_PROC_FS */
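
/*
 * Replace a live page table entry with a new value, using the best
 * instruction the machine provides: CRDTE (compare and replace DAT table
 * entry) if EDAT2 is available, CSPG (compare and swap and purge on the
 * full 8-byte entry) if IDTE is available, and plain CSP on the lower
 * word of the entry otherwise.
 */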
static void pgt_set(unsigned long *old, unsigned long new, unsigned long addr,
		    unsigned long dtt)
{
	unsigned long *table, mask;

	mask = 0;
	if (MACHINE_HAS_EDAT2) {
		switch (dtt) {
		case CRDTE_DTT_REGION3:
			mask = ~(PTRS_PER_PUD * sizeof(pud_t) - 1);
			break;
		case CRDTE_DTT_SEGMENT:
			mask = ~(PTRS_PER_PMD * sizeof(pmd_t) - 1);
			break;
		case CRDTE_DTT_PAGE:
			mask = ~(PTRS_PER_PTE * sizeof(pte_t) - 1);
			break;
		}
		table = (unsigned long *)((unsigned long)old & mask);
		crdte(*old, new, table, dtt, addr, get_lowcore()->kernel_asce.val);
	} else if (MACHINE_HAS_IDTE) {
		cspg(old, *old, new);
	} else {
		csp((unsigned int *)old + 1, *old, new);
	}
}
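
/*
 * Walk the page table entries covering addr..end and translate the
 * SET_MEMORY_* flags into the corresponding hardware bits of each pte.
 */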
static int walk_pte_level(pmd_t *pmdp, unsigned long addr, unsigned long end,
			  unsigned long flags)
{
	pte_t *ptep, new;

	if (flags == SET_MEMORY_4K)
		return 0;
	ptep = pte_offset_kernel(pmdp, addr);
	do {
		new = *ptep;
		if (pte_none(new))
			return -EINVAL;
		if (flags & SET_MEMORY_RO)
			new = pte_wrprotect(new);
		else if (flags & SET_MEMORY_RW)
			new = pte_mkwrite_novma(pte_mkdirty(new));
		if (flags & SET_MEMORY_NX)
			new = set_pte_bit(new, __pgprot(_PAGE_NOEXEC));
		else if (flags & SET_MEMORY_X)
			new = clear_pte_bit(new, __pgprot(_PAGE_NOEXEC));
		if (flags & SET_MEMORY_INV) {
			new = set_pte_bit(new, __pgprot(_PAGE_INVALID));
		} else if (flags & SET_MEMORY_DEF) {
			new = __pte(pte_val(new) & PAGE_MASK);
			new = set_pte_bit(new, PAGE_KERNEL);
			if (!MACHINE_HAS_NX)
				new = clear_pte_bit(new, __pgprot(_PAGE_NOEXEC));
		}
		pgt_set((unsigned long *)ptep, pte_val(new), addr, CRDTE_DTT_PAGE);
		ptep++;
		addr += PAGE_SIZE;
		cond_resched();
	} while (addr < end);
	return 0;
}
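
/*
 * Split a large 1MB segment mapping into PTRS_PER_PTE 4KB page mappings,
 * preserving the protection and no-exec state of the original entry.
 */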
static int split_pmd_page(pmd_t *pmdp, unsigned long addr)
{
	unsigned long pte_addr, prot;
	pte_t *pt_dir, *ptep;
	pmd_t new;
	int i, ro, nx;

	pt_dir = vmem_pte_alloc();
	if (!pt_dir)
		return -ENOMEM;
	pte_addr = pmd_pfn(*pmdp) << PAGE_SHIFT;
	ro = !!(pmd_val(*pmdp) & _SEGMENT_ENTRY_PROTECT);
	nx = !!(pmd_val(*pmdp) & _SEGMENT_ENTRY_NOEXEC);
	prot = pgprot_val(ro ? PAGE_KERNEL_RO : PAGE_KERNEL);
	if (!nx)
		prot &= ~_PAGE_NOEXEC;
	ptep = pt_dir;
	for (i = 0; i < PTRS_PER_PTE; i++) {
		set_pte(ptep, __pte(pte_addr | prot));
		pte_addr += PAGE_SIZE;
		ptep++;
	}
	new = __pmd(__pa(pt_dir) | _SEGMENT_ENTRY);
	pgt_set((unsigned long *)pmdp, pmd_val(new), addr, CRDTE_DTT_SEGMENT);
	update_page_count(PG_DIRECT_MAP_4K, PTRS_PER_PTE);
	update_page_count(PG_DIRECT_MAP_1M, -1);
	return 0;
}

static void modify_pmd_page(pmd_t *pmdp, unsigned long addr,
			    unsigned long flags)
{
	pmd_t new = *pmdp;

	if (flags & SET_MEMORY_RO)
		new = pmd_wrprotect(new);
	else if (flags & SET_MEMORY_RW)
		new = pmd_mkwrite_novma(pmd_mkdirty(new));
	if (flags & SET_MEMORY_NX)
		new = set_pmd_bit(new, __pgprot(_SEGMENT_ENTRY_NOEXEC));
	else if (flags & SET_MEMORY_X)
		new = clear_pmd_bit(new, __pgprot(_SEGMENT_ENTRY_NOEXEC));
	if (flags & SET_MEMORY_INV) {
		new = set_pmd_bit(new, __pgprot(_SEGMENT_ENTRY_INVALID));
	} else if (flags & SET_MEMORY_DEF) {
		new = __pmd(pmd_val(new) & PMD_MASK);
		new = set_pmd_bit(new, SEGMENT_KERNEL);
		if (!MACHINE_HAS_NX)
			new = clear_pmd_bit(new, __pgprot(_SEGMENT_ENTRY_NOEXEC));
	}
	pgt_set((unsigned long *)pmdp, pmd_val(new), addr, CRDTE_DTT_SEGMENT);
}
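
/*
 * A large pmd must be split if only part of the 1MB segment is affected
 * or if an explicit 4K split was requested; otherwise the attributes can
 * be changed on the segment table entry itself.
 */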
static int walk_pmd_level(pud_t *pudp, unsigned long addr, unsigned long end,
			  unsigned long flags)
{
	unsigned long next;
	int need_split;
	pmd_t *pmdp;
	int rc = 0;

	pmdp = pmd_offset(pudp, addr);
	do {
		if (pmd_none(*pmdp))
			return -EINVAL;
		next = pmd_addr_end(addr, end);
		if (pmd_leaf(*pmdp)) {
			need_split = !!(flags & SET_MEMORY_4K);
			need_split |= !!(addr & ~PMD_MASK);
			need_split |= !!(addr + PMD_SIZE > next);
			if (need_split) {
				rc = split_pmd_page(pmdp, addr);
				if (rc)
					return rc;
				continue;
			}
			modify_pmd_page(pmdp, addr, flags);
		} else {
			rc = walk_pte_level(pmdp, addr, next, flags);
			if (rc)
				return rc;
		}
		pmdp++;
		addr = next;
		cond_resched();
	} while (addr < end);
	return 0;
}
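
/*
 * Split a large 2GB region-third mapping into PTRS_PER_PMD 1MB segment
 * mappings, preserving the protection and no-exec state of the original
 * entry.
 */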
static int split_pud_page(pud_t *pudp, unsigned long addr)
{
	unsigned long pmd_addr, prot;
	pmd_t *pm_dir, *pmdp;
	pud_t new;
	int i, ro, nx;

	pm_dir = vmem_crst_alloc(_SEGMENT_ENTRY_EMPTY);
	if (!pm_dir)
		return -ENOMEM;
	pmd_addr = pud_pfn(*pudp) << PAGE_SHIFT;
	ro = !!(pud_val(*pudp) & _REGION_ENTRY_PROTECT);
	nx = !!(pud_val(*pudp) & _REGION_ENTRY_NOEXEC);
	prot = pgprot_val(ro ? SEGMENT_KERNEL_RO : SEGMENT_KERNEL);
	if (!nx)
		prot &= ~_SEGMENT_ENTRY_NOEXEC;
	pmdp = pm_dir;
	for (i = 0; i < PTRS_PER_PMD; i++) {
		set_pmd(pmdp, __pmd(pmd_addr | prot));
		pmd_addr += PMD_SIZE;
		pmdp++;
	}
	new = __pud(__pa(pm_dir) | _REGION3_ENTRY);
	pgt_set((unsigned long *)pudp, pud_val(new), addr, CRDTE_DTT_REGION3);
	update_page_count(PG_DIRECT_MAP_1M, PTRS_PER_PMD);
	update_page_count(PG_DIRECT_MAP_2G, -1);
	return 0;
}

static void modify_pud_page(pud_t *pudp, unsigned long addr,
			    unsigned long flags)
{
	pud_t new = *pudp;

	if (flags & SET_MEMORY_RO)
		new = pud_wrprotect(new);
	else if (flags & SET_MEMORY_RW)
		new = pud_mkwrite(pud_mkdirty(new));
	if (flags & SET_MEMORY_NX)
		new = set_pud_bit(new, __pgprot(_REGION_ENTRY_NOEXEC));
	else if (flags & SET_MEMORY_X)
		new = clear_pud_bit(new, __pgprot(_REGION_ENTRY_NOEXEC));
	if (flags & SET_MEMORY_INV) {
		new = set_pud_bit(new, __pgprot(_REGION_ENTRY_INVALID));
	} else if (flags & SET_MEMORY_DEF) {
		new = __pud(pud_val(new) & PUD_MASK);
		new = set_pud_bit(new, REGION3_KERNEL);
		if (!MACHINE_HAS_NX)
			new = clear_pud_bit(new, __pgprot(_REGION_ENTRY_NOEXEC));
	}
	pgt_set((unsigned long *)pudp, pud_val(new), addr, CRDTE_DTT_REGION3);
}

static int walk_pud_level(p4d_t *p4d, unsigned long addr, unsigned long end,
			  unsigned long flags)
{
	unsigned long next;
	int need_split;
	pud_t *pudp;
	int rc = 0;

	pudp = pud_offset(p4d, addr);
	do {
		if (pud_none(*pudp))
			return -EINVAL;
		next = pud_addr_end(addr, end);
		if (pud_leaf(*pudp)) {
			need_split = !!(flags & SET_MEMORY_4K);
			need_split |= !!(addr & ~PUD_MASK);
			need_split |= !!(addr + PUD_SIZE > next);
			if (need_split) {
				rc = split_pud_page(pudp, addr);
				if (rc)
					break;
				continue;
			}
			modify_pud_page(pudp, addr, flags);
		} else {
			rc = walk_pmd_level(pudp, addr, next, flags);
		}
		pudp++;
		addr = next;
		cond_resched();
	} while (addr < end && !rc);
	return rc;
}

static int walk_p4d_level(pgd_t *pgd, unsigned long addr, unsigned long end,
			  unsigned long flags)
{
	unsigned long next;
	p4d_t *p4dp;
	int rc = 0;

	p4dp = p4d_offset(pgd, addr);
	do {
		if (p4d_none(*p4dp))
			return -EINVAL;
		next = p4d_addr_end(addr, end);
		rc = walk_pud_level(p4dp, addr, next, flags);
		p4dp++;
		addr = next;
		cond_resched();
	} while (addr < end && !rc);
	return rc;
}
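
/* serialize concurrent changes to kernel page table attributes */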
DEFINE_MUTEX(cpa_mutex);

static int change_page_attr(unsigned long addr, unsigned long end,
			    unsigned long flags)
{
	unsigned long next;
	int rc = -EINVAL;
	pgd_t *pgdp;

	pgdp = pgd_offset_k(addr);
	do {
		if (pgd_none(*pgdp))
			break;
		next = pgd_addr_end(addr, end);
		rc = walk_p4d_level(pgdp, addr, next, flags);
		cond_resched();
	} while (pgdp++, addr = next, addr < end && !rc);
	return rc;
}

static int change_page_attr_alias(unsigned long addr, unsigned long end,
				  unsigned long flags)
{
	unsigned long alias, offset, va_start, va_end;
	struct vm_struct *area;
	int rc = 0;

	/*
	 * Changes to read-only permissions on kernel VA mappings are also
	 * applied to the kernel direct mapping. Execute permissions are
	 * intentionally not transferred to keep all allocated pages within
	 * the direct mapping non-executable.
	 */
	flags &= SET_MEMORY_RO | SET_MEMORY_RW;
	if (!flags)
		return 0;
	area = NULL;
	while (addr < end) {
		if (!area)
			area = find_vm_area((void *)addr);
		if (!area || !(area->flags & VM_ALLOC))
			return 0;
		va_start = (unsigned long)area->addr;
		va_end = va_start + area->nr_pages * PAGE_SIZE;
		offset = (addr - va_start) >> PAGE_SHIFT;
		alias = (unsigned long)page_address(area->pages[offset]);
		rc = change_page_attr(alias, alias + PAGE_SIZE, flags);
		if (rc)
			break;
		addr += PAGE_SIZE;
		if (addr >= va_end)
			area = NULL;
	}
	return rc;
}

int __set_memory(unsigned long addr, unsigned long numpages, unsigned long flags)
{
	unsigned long end;
	int rc;

	if (!MACHINE_HAS_NX)
		flags &= ~(SET_MEMORY_NX | SET_MEMORY_X);
	if (!flags)
		return 0;
	if (!numpages)
		return 0;
	addr &= PAGE_MASK;
	end = addr + numpages * PAGE_SIZE;
	mutex_lock(&cpa_mutex);
	rc = change_page_attr(addr, end, flags);
	if (rc)
		goto out;
	rc = change_page_attr_alias(addr, end, flags);
out:
	mutex_unlock(&cpa_mutex);
	return rc;
}

int set_direct_map_invalid_noflush(struct page *page)
{
	return __set_memory((unsigned long)page_to_virt(page), 1, SET_MEMORY_INV);
}

int set_direct_map_default_noflush(struct page *page)
{
	return __set_memory((unsigned long)page_to_virt(page), 1, SET_MEMORY_DEF);
}
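
/*
 * Probe the page with the LRA (load real address) instruction: LRA sets
 * condition code 0 only if DAT translation of the address succeeds, so a
 * nonzero condition code means the page is currently not mapped.
 */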
bool kernel_page_present(struct page *page)
{
	unsigned long addr;
	int cc;

	addr = (unsigned long)page_address(page);
	asm volatile(
		"	lra	%[addr],0(%[addr])\n"
		CC_IPM(cc)
		: CC_OUT(cc, cc), [addr] "+a" (addr)
		:
		: CC_CLOBBER);
	return CC_TRANSFORM(cc) == 0;
}

#if defined(CONFIG_DEBUG_PAGEALLOC) || defined(CONFIG_KFENCE)
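
/*
 * Invalidate the given range of page table entries and purge the TLB.
 * With the IPTE-range facility (facility bit 13) a single instruction
 * handles all entries within one page table; without it every entry is
 * invalidated individually.
 */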
static void ipte_range(pte_t *pte, unsigned long address, int nr)
{
	int i;

	if (test_facility(13)) {
		__ptep_ipte_range(address, nr - 1, pte, IPTE_GLOBAL);
		return;
	}
	for (i = 0; i < nr; i++) {
		__ptep_ipte(address, pte, 0, 0, IPTE_GLOBAL);
		address += PAGE_SIZE;
		pte++;
	}
}
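
/*
 * Map or unmap kernel pages for CONFIG_DEBUG_PAGEALLOC and KFENCE. Pages
 * are processed in batches that never cross a page table boundary, so
 * that each batch can be invalidated with a single IPTE-range operation:
 * nr is the number of entries left in the page table containing ptep.
 */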
void __kernel_map_pages(struct page *page, int numpages, int enable)
{
	unsigned long address;
	pte_t *ptep, pte;
	int nr, i, j;

	for (i = 0; i < numpages;) {
		address = (unsigned long)page_to_virt(page + i);
		ptep = virt_to_kpte(address);
		nr = (unsigned long)ptep >> ilog2(sizeof(long));
		nr = PTRS_PER_PTE - (nr & (PTRS_PER_PTE - 1));
		nr = min(numpages - i, nr);
		if (enable) {
			for (j = 0; j < nr; j++) {
				pte = clear_pte_bit(*ptep, __pgprot(_PAGE_INVALID));
				set_pte(ptep, pte);
				address += PAGE_SIZE;
				ptep++;
			}
		} else {
			ipte_range(ptep, address, nr);
		}
		i += nr;
	}
}

#endif /* CONFIG_DEBUG_PAGEALLOC || CONFIG_KFENCE */