// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright IBM Corp. 2007, 2011
 * Author(s): Martin Schwidefsky <[email protected]>
 */

#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/gfp.h>
#include <linux/mm.h>
#include <linux/swap.h>
#include <linux/smp.h>
#include <linux/spinlock.h>
#include <linux/rcupdate.h>
#include <linux/slab.h>
#include <linux/swapops.h>
#include <linux/sysctl.h>
#include <linux/ksm.h>
#include <linux/mman.h>

#include <asm/tlb.h>
#include <asm/tlbflush.h>
#include <asm/mmu_context.h>
#include <asm/page-states.h>

pgprot_t pgprot_writecombine(pgprot_t prot)
{
        /*
         * mio_wb_bit_mask may be set on a different CPU, but it is only set
         * once at init and only read afterwards.
         */
        return __pgprot(pgprot_val(prot) | mio_wb_bit_mask);
}
EXPORT_SYMBOL_GPL(pgprot_writecombine);

pgprot_t pgprot_writethrough(pgprot_t prot)
{
        /*
         * mio_wb_bit_mask may be set on a different CPU, but it is only set
         * once at init and only read afterwards.
         */
        return __pgprot(pgprot_val(prot) & ~mio_wb_bit_mask);
}
EXPORT_SYMBOL_GPL(pgprot_writethrough);
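
/*
 * Invalidate a PTE with the IPTE instruction. The "local" variant only
 * flushes the TLB of the issuing CPU; the "global" variant broadcasts
 * the invalidation to all CPUs. If the machine has the guest-TLB
 * facility, mm->context.gmap_asce selects the IPTE options: the NODAT
 * option is set when no guest ASCE is registered (or on caller request),
 * and a specific guest ASCE is passed along unless gmap_asce is -1UL.
 */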
static inline void ptep_ipte_local(struct mm_struct *mm, unsigned long addr,
                                   pte_t *ptep, int nodat)
{
        unsigned long opt, asce;

        if (MACHINE_HAS_TLB_GUEST) {
                opt = 0;
                asce = READ_ONCE(mm->context.gmap_asce);
                if (asce == 0UL || nodat)
                        opt |= IPTE_NODAT;
                if (asce != -1UL) {
                        asce = asce ? : mm->context.asce;
                        opt |= IPTE_GUEST_ASCE;
                }
                __ptep_ipte(addr, ptep, opt, asce, IPTE_LOCAL);
        } else {
                __ptep_ipte(addr, ptep, 0, 0, IPTE_LOCAL);
        }
}

static inline void ptep_ipte_global(struct mm_struct *mm, unsigned long addr,
                                    pte_t *ptep, int nodat)
{
        unsigned long opt, asce;

        if (MACHINE_HAS_TLB_GUEST) {
                opt = 0;
                asce = READ_ONCE(mm->context.gmap_asce);
                if (asce == 0UL || nodat)
                        opt |= IPTE_NODAT;
                if (asce != -1UL) {
                        asce = asce ? : mm->context.asce;
                        opt |= IPTE_GUEST_ASCE;
                }
                __ptep_ipte(addr, ptep, opt, asce, IPTE_GLOBAL);
        } else {
                __ptep_ipte(addr, ptep, 0, 0, IPTE_GLOBAL);
        }
}
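
/*
 * Flush a PTE from the TLBs. The "direct" variant issues IPTE right away,
 * using the local form only when the mm is attached to just this CPU.
 * The "lazy" variant merely marks the PTE invalid and defers the flush
 * (mm->context.flush_mm) when only the current CPU has the mm attached;
 * otherwise it too must broadcast an IPTE.
 */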
static inline pte_t ptep_flush_direct(struct mm_struct *mm,
                                      unsigned long addr, pte_t *ptep,
                                      int nodat)
{
        pte_t old;

        old = *ptep;
        if (unlikely(pte_val(old) & _PAGE_INVALID))
                return old;
        atomic_inc(&mm->context.flush_count);
        if (MACHINE_HAS_TLB_LC &&
            cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
                ptep_ipte_local(mm, addr, ptep, nodat);
        else
                ptep_ipte_global(mm, addr, ptep, nodat);
        atomic_dec(&mm->context.flush_count);
        return old;
}

static inline pte_t ptep_flush_lazy(struct mm_struct *mm,
                                    unsigned long addr, pte_t *ptep,
                                    int nodat)
{
        pte_t old;

        old = *ptep;
        if (unlikely(pte_val(old) & _PAGE_INVALID))
                return old;
        atomic_inc(&mm->context.flush_count);
        if (cpumask_equal(&mm->context.cpu_attach_mask,
                          cpumask_of(smp_processor_id()))) {
                set_pte(ptep, set_pte_bit(*ptep, __pgprot(_PAGE_INVALID)));
                mm->context.flush_mm = 1;
        } else
                ptep_ipte_global(mm, addr, ptep, nodat);
        atomic_dec(&mm->context.flush_count);
        return old;
}
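
/*
 * The PGSTE (page-table-entry status extension) lives in the word right
 * after its PTE, at ptep[PTRS_PER_PTE]. It is serialized with the PCL
 * bit (0x0080 in the high halfword), taken and released with the
 * compare-and-swap (csg) loop below.
 */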
static inline pgste_t pgste_get_lock(pte_t *ptep)
{
        unsigned long new = 0;
#ifdef CONFIG_PGSTE
        unsigned long old;

        asm(
                " lg %0,%2\n"
                "0: lgr %1,%0\n"
                " nihh %0,0xff7f\n"     /* clear PCL bit in old */
                " oihh %1,0x0080\n"     /* set PCL bit in new */
                " csg %0,%1,%2\n"
                " jl 0b\n"
                : "=&d" (old), "=&d" (new), "=Q" (ptep[PTRS_PER_PTE])
                : "Q" (ptep[PTRS_PER_PTE]) : "cc", "memory");
#endif
        return __pgste(new);
}

static inline void pgste_set_unlock(pte_t *ptep, pgste_t pgste)
{
#ifdef CONFIG_PGSTE
        asm(
                " nihh %1,0xff7f\n"     /* clear PCL bit */
                " stg %1,%0\n"
                : "=Q" (ptep[PTRS_PER_PTE])
                : "d" (pgste_val(pgste)), "Q" (ptep[PTRS_PER_PTE])
                : "cc", "memory");
#endif
}

static inline pgste_t pgste_get(pte_t *ptep)
{
        unsigned long pgste = 0;
#ifdef CONFIG_PGSTE
        pgste = *(unsigned long *)(ptep + PTRS_PER_PTE);
#endif
        return __pgste(pgste);
}

static inline void pgste_set(pte_t *ptep, pgste_t pgste)
{
#ifdef CONFIG_PGSTE
        *(pgste_t *)(ptep + PTRS_PER_PTE) = pgste;
#endif
}
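
/*
 * The hardware storage key and the PGSTE mirror each other: the R and C
 * bits of the key shift left by 48 to the guest GR/GC bits, and the ACC
 * bits plus the fetch-protection bit shift left by 56 to the PGSTE key
 * field. pgste_update_all() harvests key state into the PGSTE;
 * pgste_set_key() writes it back out to the real storage key.
 */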
static inline pgste_t pgste_update_all(pte_t pte, pgste_t pgste,
                                       struct mm_struct *mm)
{
#ifdef CONFIG_PGSTE
        unsigned long address, bits, skey;

        if (!mm_uses_skeys(mm) || pte_val(pte) & _PAGE_INVALID)
                return pgste;
        address = pte_val(pte) & PAGE_MASK;
        skey = (unsigned long) page_get_storage_key(address);
        bits = skey & (_PAGE_CHANGED | _PAGE_REFERENCED);
        /* Transfer page changed & referenced bit to guest bits in pgste */
        pgste_val(pgste) |= bits << 48;         /* GR bit & GC bit */
        /* Copy page access key and fetch protection bit to pgste */
        pgste_val(pgste) &= ~(PGSTE_ACC_BITS | PGSTE_FP_BIT);
        pgste_val(pgste) |= (skey & (_PAGE_ACC_BITS | _PAGE_FP_BIT)) << 56;
#endif
        return pgste;
}

static inline void pgste_set_key(pte_t *ptep, pgste_t pgste, pte_t entry,
                                 struct mm_struct *mm)
{
#ifdef CONFIG_PGSTE
        unsigned long address;
        unsigned long nkey;

        if (!mm_uses_skeys(mm) || pte_val(entry) & _PAGE_INVALID)
                return;
        VM_BUG_ON(!(pte_val(*ptep) & _PAGE_INVALID));
        address = pte_val(entry) & PAGE_MASK;
        /*
         * Set page access key and fetch protection bit from pgste.
         * The guest C/R information is still in the PGSTE; set the real
         * key C/R to 0.
         */
        nkey = (pgste_val(pgste) & (PGSTE_ACC_BITS | PGSTE_FP_BIT)) >> 56;
        nkey |= (pgste_val(pgste) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 48;
        page_set_storage_key(address, nkey, 0);
#endif
}

static inline pgste_t pgste_set_pte(pte_t *ptep, pgste_t pgste, pte_t entry)
{
#ifdef CONFIG_PGSTE
        if ((pte_val(entry) & _PAGE_PRESENT) &&
            (pte_val(entry) & _PAGE_WRITE) &&
            !(pte_val(entry) & _PAGE_INVALID)) {
                if (!MACHINE_HAS_ESOP) {
                        /*
                         * Without enhanced suppression-on-protection force
                         * the dirty bit on for all writable ptes.
                         */
                        entry = set_pte_bit(entry, __pgprot(_PAGE_DIRTY));
                        entry = clear_pte_bit(entry, __pgprot(_PAGE_PROTECT));
                }
                if (!(pte_val(entry) & _PAGE_PROTECT))
                        /* This pte allows write access; set user-dirty */
                        pgste_val(pgste) |= PGSTE_UC_BIT;
        }
#endif
        set_pte(ptep, entry);
        return pgste;
}

static inline pgste_t pgste_pte_notify(struct mm_struct *mm,
                                       unsigned long addr,
                                       pte_t *ptep, pgste_t pgste)
{
#ifdef CONFIG_PGSTE
        unsigned long bits;

        bits = pgste_val(pgste) & (PGSTE_IN_BIT | PGSTE_VSIE_BIT);
        if (bits) {
                pgste_val(pgste) ^= bits;
                ptep_notify(mm, addr, ptep, bits);
        }
#endif
        return pgste;
}
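
/*
 * PTE exchange happens in two halves: ptep_xchg_start() takes the PGSTE
 * lock and delivers any pending invalidation notification, and
 * ptep_xchg_commit() moves storage-key state between PTE and PGSTE,
 * installs the new PTE and drops the lock. Without PGSTEs the commit
 * degenerates to a plain set_pte().
 */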
static inline pgste_t ptep_xchg_start(struct mm_struct *mm,
                                      unsigned long addr, pte_t *ptep)
{
        pgste_t pgste = __pgste(0);

        if (mm_has_pgste(mm)) {
                pgste = pgste_get_lock(ptep);
                pgste = pgste_pte_notify(mm, addr, ptep, pgste);
        }
        return pgste;
}

static inline pte_t ptep_xchg_commit(struct mm_struct *mm,
                                     unsigned long addr, pte_t *ptep,
                                     pgste_t pgste, pte_t old, pte_t new)
{
        if (mm_has_pgste(mm)) {
                if (pte_val(old) & _PAGE_INVALID)
                        pgste_set_key(ptep, pgste, new, mm);
                if (pte_val(new) & _PAGE_INVALID) {
                        pgste = pgste_update_all(old, pgste, mm);
                        if ((pgste_val(pgste) & _PGSTE_GPS_USAGE_MASK) ==
                            _PGSTE_GPS_USAGE_UNUSED)
                                old = set_pte_bit(old, __pgprot(_PAGE_UNUSED));
                }
                pgste = pgste_set_pte(ptep, pgste, new);
                pgste_set_unlock(ptep, pgste);
        } else {
                set_pte(ptep, new);
        }
        return old;
}

pte_t ptep_xchg_direct(struct mm_struct *mm, unsigned long addr,
                       pte_t *ptep, pte_t new)
{
        pgste_t pgste;
        pte_t old;
        int nodat;

        preempt_disable();
        pgste = ptep_xchg_start(mm, addr, ptep);
        nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
        old = ptep_flush_direct(mm, addr, ptep, nodat);
        old = ptep_xchg_commit(mm, addr, ptep, pgste, old, new);
        preempt_enable();
        return old;
}
EXPORT_SYMBOL(ptep_xchg_direct);

pte_t ptep_xchg_lazy(struct mm_struct *mm, unsigned long addr,
                     pte_t *ptep, pte_t new)
{
        pgste_t pgste;
        pte_t old;
        int nodat;

        preempt_disable();
        pgste = ptep_xchg_start(mm, addr, ptep);
        nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
        old = ptep_flush_lazy(mm, addr, ptep, nodat);
        old = ptep_xchg_commit(mm, addr, ptep, pgste, old, new);
        preempt_enable();
        return old;
}
EXPORT_SYMBOL(ptep_xchg_lazy);
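
/*
 * ptep_modify_prot_start() and ptep_modify_prot_commit() form a bracket:
 * start disables preemption and leaves the PGSTE locked (pgste_set()
 * stores it with the PCL bit still set), commit rewrites the PTE,
 * unlocks the PGSTE and re-enables preemption. Nothing that might sleep
 * may run between the two calls.
 */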
pte_t ptep_modify_prot_start(struct vm_area_struct *vma, unsigned long addr,
                             pte_t *ptep)
{
        pgste_t pgste;
        pte_t old;
        int nodat;
        struct mm_struct *mm = vma->vm_mm;

        preempt_disable();
        pgste = ptep_xchg_start(mm, addr, ptep);
        nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
        old = ptep_flush_lazy(mm, addr, ptep, nodat);
        if (mm_has_pgste(mm)) {
                pgste = pgste_update_all(old, pgste, mm);
                pgste_set(ptep, pgste);
        }
        return old;
}

void ptep_modify_prot_commit(struct vm_area_struct *vma, unsigned long addr,
                             pte_t *ptep, pte_t old_pte, pte_t pte)
{
        pgste_t pgste;
        struct mm_struct *mm = vma->vm_mm;

        if (!MACHINE_HAS_NX)
                pte = clear_pte_bit(pte, __pgprot(_PAGE_NOEXEC));
        if (mm_has_pgste(mm)) {
                pgste = pgste_get(ptep);
                pgste_set_key(ptep, pgste, pte, mm);
                pgste = pgste_set_pte(ptep, pgste, pte);
                pgste_set_unlock(ptep, pgste);
        } else {
                set_pte(ptep, pte);
        }
        preempt_enable();
}
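
/*
 * Segment-table (pmd) invalidation mirrors the PTE helpers, but uses the
 * IDTE instruction where available and falls back to CSP on machines
 * without it. When 1M huge pages are exposed to a gmap guest, the
 * matching gmap shadow entries are invalidated as well.
 */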
static inline void pmdp_idte_local(struct mm_struct *mm,
                                   unsigned long addr, pmd_t *pmdp)
{
        if (MACHINE_HAS_TLB_GUEST)
                __pmdp_idte(addr, pmdp, IDTE_NODAT | IDTE_GUEST_ASCE,
                            mm->context.asce, IDTE_LOCAL);
        else
                __pmdp_idte(addr, pmdp, 0, 0, IDTE_LOCAL);
        if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
                gmap_pmdp_idte_local(mm, addr);
}

static inline void pmdp_idte_global(struct mm_struct *mm,
                                    unsigned long addr, pmd_t *pmdp)
{
        if (MACHINE_HAS_TLB_GUEST) {
                __pmdp_idte(addr, pmdp, IDTE_NODAT | IDTE_GUEST_ASCE,
                            mm->context.asce, IDTE_GLOBAL);
                if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
                        gmap_pmdp_idte_global(mm, addr);
        } else if (MACHINE_HAS_IDTE) {
                __pmdp_idte(addr, pmdp, 0, 0, IDTE_GLOBAL);
                if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
                        gmap_pmdp_idte_global(mm, addr);
        } else {
                __pmdp_csp(pmdp);
                if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
                        gmap_pmdp_csp(mm, addr);
        }
}

static inline pmd_t pmdp_flush_direct(struct mm_struct *mm,
                                      unsigned long addr, pmd_t *pmdp)
{
        pmd_t old;

        old = *pmdp;
        if (pmd_val(old) & _SEGMENT_ENTRY_INVALID)
                return old;
        atomic_inc(&mm->context.flush_count);
        if (MACHINE_HAS_TLB_LC &&
            cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
                pmdp_idte_local(mm, addr, pmdp);
        else
                pmdp_idte_global(mm, addr, pmdp);
        atomic_dec(&mm->context.flush_count);
        return old;
}

static inline pmd_t pmdp_flush_lazy(struct mm_struct *mm,
                                    unsigned long addr, pmd_t *pmdp)
{
        pmd_t old;

        old = *pmdp;
        if (pmd_val(old) & _SEGMENT_ENTRY_INVALID)
                return old;
        atomic_inc(&mm->context.flush_count);
        if (cpumask_equal(&mm->context.cpu_attach_mask,
                          cpumask_of(smp_processor_id()))) {
                set_pmd(pmdp, set_pmd_bit(*pmdp, __pgprot(_SEGMENT_ENTRY_INVALID)));
                mm->context.flush_mm = 1;
                if (mm_has_pgste(mm))
                        gmap_pmdp_invalidate(mm, addr);
        } else {
                pmdp_idte_global(mm, addr, pmdp);
        }
        atomic_dec(&mm->context.flush_count);
        return old;
}

#ifdef CONFIG_PGSTE
static int pmd_lookup(struct mm_struct *mm, unsigned long addr, pmd_t **pmdp)
{
        struct vm_area_struct *vma;
        pgd_t *pgd;
        p4d_t *p4d;
        pud_t *pud;

        /* We need a valid VMA, otherwise this is clearly a fault. */
        vma = vma_lookup(mm, addr);
        if (!vma)
                return -EFAULT;

        pgd = pgd_offset(mm, addr);
        if (!pgd_present(*pgd))
                return -ENOENT;

        p4d = p4d_offset(pgd, addr);
        if (!p4d_present(*p4d))
                return -ENOENT;

        pud = pud_offset(p4d, addr);
        if (!pud_present(*pud))
                return -ENOENT;

        /* Large PUDs are not supported yet. */
        if (pud_large(*pud))
                return -EFAULT;

        *pmdp = pmd_offset(pud, addr);
        return 0;
}
#endif

pmd_t pmdp_xchg_direct(struct mm_struct *mm, unsigned long addr,
                       pmd_t *pmdp, pmd_t new)
{
        pmd_t old;

        preempt_disable();
        old = pmdp_flush_direct(mm, addr, pmdp);
        set_pmd(pmdp, new);
        preempt_enable();
        return old;
}
EXPORT_SYMBOL(pmdp_xchg_direct);

pmd_t pmdp_xchg_lazy(struct mm_struct *mm, unsigned long addr,
                     pmd_t *pmdp, pmd_t new)
{
        pmd_t old;

        preempt_disable();
        old = pmdp_flush_lazy(mm, addr, pmdp);
        set_pmd(pmdp, new);
        preempt_enable();
        return old;
}
EXPORT_SYMBOL(pmdp_xchg_lazy);
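
/*
 * Region-third-table (pud) invalidation: the same pattern one level up.
 * There is no gmap shadow state to maintain here, so the helpers reduce
 * to the bare IDTE/CSP choice.
 */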
static inline void pudp_idte_local(struct mm_struct *mm,
                                   unsigned long addr, pud_t *pudp)
{
        if (MACHINE_HAS_TLB_GUEST)
                __pudp_idte(addr, pudp, IDTE_NODAT | IDTE_GUEST_ASCE,
                            mm->context.asce, IDTE_LOCAL);
        else
                __pudp_idte(addr, pudp, 0, 0, IDTE_LOCAL);
}

static inline void pudp_idte_global(struct mm_struct *mm,
                                    unsigned long addr, pud_t *pudp)
{
        if (MACHINE_HAS_TLB_GUEST)
                __pudp_idte(addr, pudp, IDTE_NODAT | IDTE_GUEST_ASCE,
                            mm->context.asce, IDTE_GLOBAL);
        else if (MACHINE_HAS_IDTE)
                __pudp_idte(addr, pudp, 0, 0, IDTE_GLOBAL);
        else
                /*
                 * Invalid bit position is the same for pmd and pud, so we
                 * can re-use __pmdp_csp() here
                 */
                __pmdp_csp((pmd_t *) pudp);
}

static inline pud_t pudp_flush_direct(struct mm_struct *mm,
                                      unsigned long addr, pud_t *pudp)
{
        pud_t old;

        old = *pudp;
        if (pud_val(old) & _REGION_ENTRY_INVALID)
                return old;
        atomic_inc(&mm->context.flush_count);
        if (MACHINE_HAS_TLB_LC &&
            cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
                pudp_idte_local(mm, addr, pudp);
        else
                pudp_idte_global(mm, addr, pudp);
        atomic_dec(&mm->context.flush_count);
        return old;
}

pud_t pudp_xchg_direct(struct mm_struct *mm, unsigned long addr,
                       pud_t *pudp, pud_t new)
{
        pud_t old;

        preempt_disable();
        old = pudp_flush_direct(mm, addr, pudp);
        set_pud(pudp, new);
        preempt_enable();
        return old;
}
EXPORT_SYMBOL(pudp_xchg_direct);
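
/*
 * A page table "deposited" for a transparent huge page is parked on a
 * per-pmd list so it can be reinstated if the huge mapping is split.
 * The list head is stored in the first two PTE slots of the deposited
 * table itself; withdraw re-poisons those two slots before handing the
 * table back, in FIFO order.
 */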
#ifdef CONFIG_TRANSPARENT_HUGEPAGE
void pgtable_trans_huge_deposit(struct mm_struct *mm, pmd_t *pmdp,
                                pgtable_t pgtable)
{
        struct list_head *lh = (struct list_head *) pgtable;

        assert_spin_locked(pmd_lockptr(mm, pmdp));

        /* FIFO */
        if (!pmd_huge_pte(mm, pmdp))
                INIT_LIST_HEAD(lh);
        else
                list_add(lh, (struct list_head *) pmd_huge_pte(mm, pmdp));
        pmd_huge_pte(mm, pmdp) = pgtable;
}

pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp)
{
        struct list_head *lh;
        pgtable_t pgtable;
        pte_t *ptep;

        assert_spin_locked(pmd_lockptr(mm, pmdp));

        /* FIFO */
        pgtable = pmd_huge_pte(mm, pmdp);
        lh = (struct list_head *) pgtable;
        if (list_empty(lh))
                pmd_huge_pte(mm, pmdp) = NULL;
        else {
                pmd_huge_pte(mm, pmdp) = (pgtable_t) lh->next;
                list_del(lh);
        }
        ptep = (pte_t *) pgtable;
        set_pte(ptep, __pte(_PAGE_INVALID));
        ptep++;
        set_pte(ptep, __pte(_PAGE_INVALID));
        return pgtable;
}
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */

#ifdef CONFIG_PGSTE
void ptep_set_pte_at(struct mm_struct *mm, unsigned long addr,
                     pte_t *ptep, pte_t entry)
{
        pgste_t pgste;

        /* the mm_has_pgste() check is done in set_pte_at() */
        preempt_disable();
        pgste = pgste_get_lock(ptep);
        pgste_val(pgste) &= ~_PGSTE_GPS_ZERO;
        pgste_set_key(ptep, pgste, entry, mm);
        pgste = pgste_set_pte(ptep, pgste, entry);
        pgste_set_unlock(ptep, pgste);
        preempt_enable();
}

void ptep_set_notify(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
{
        pgste_t pgste;

        preempt_disable();
        pgste = pgste_get_lock(ptep);
        pgste_val(pgste) |= PGSTE_IN_BIT;
        pgste_set_unlock(ptep, pgste);
        preempt_enable();
}

/**
 * ptep_force_prot - change access rights of a locked pte
 * @mm: pointer to the process mm_struct
 * @addr: virtual address in the guest address space
 * @ptep: pointer to the page table entry
 * @prot: indicates guest access rights: PROT_NONE, PROT_READ or PROT_WRITE
 * @bit: pgste bit to set (e.g. for notification)
 *
 * Returns 0 if the access rights were changed and -EAGAIN if the current
 * and requested access rights are incompatible.
 */
int ptep_force_prot(struct mm_struct *mm, unsigned long addr,
                    pte_t *ptep, int prot, unsigned long bit)
{
        pte_t entry;
        pgste_t pgste;
        int pte_i, pte_p, nodat;

        pgste = pgste_get_lock(ptep);
        entry = *ptep;
        /* Check pte entry after all locks have been acquired */
        pte_i = pte_val(entry) & _PAGE_INVALID;
        pte_p = pte_val(entry) & _PAGE_PROTECT;
        if ((pte_i && (prot != PROT_NONE)) ||
            (pte_p && (prot & PROT_WRITE))) {
                pgste_set_unlock(ptep, pgste);
                return -EAGAIN;
        }
        /* Change access rights and set pgste bit */
        nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
        if (prot == PROT_NONE && !pte_i) {
                ptep_flush_direct(mm, addr, ptep, nodat);
                pgste = pgste_update_all(entry, pgste, mm);
                entry = set_pte_bit(entry, __pgprot(_PAGE_INVALID));
        }
        if (prot == PROT_READ && !pte_p) {
                ptep_flush_direct(mm, addr, ptep, nodat);
                entry = clear_pte_bit(entry, __pgprot(_PAGE_INVALID));
                entry = set_pte_bit(entry, __pgprot(_PAGE_PROTECT));
        }
        pgste_val(pgste) |= bit;
        pgste = pgste_set_pte(ptep, pgste, entry);
        pgste_set_unlock(ptep, pgste);
        return 0;
}
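
/**
 * ptep_shadow_pte - create a shadow copy of a pte for a guest (vSIE)
 * @mm: pointer to the parent mm_struct
 * @saddr: virtual address in the parent address space
 * @sptep: pointer to the source (parent) page table entry
 * @tptep: pointer to the target (shadow) page table entry
 * @pte: only the _PAGE_PROTECT bit is merged into the shadow entry
 *
 * Returns 1 if the entry was shadowed, 0 if it was already shadowed,
 * and -EAGAIN if the source pte is invalid or write access is requested
 * for a write-protected source.
 */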
int ptep_shadow_pte(struct mm_struct *mm, unsigned long saddr,
                    pte_t *sptep, pte_t *tptep, pte_t pte)
{
        pgste_t spgste, tpgste;
        pte_t spte, tpte;
        int rc = -EAGAIN;

        if (!(pte_val(*tptep) & _PAGE_INVALID))
                return 0;       /* already shadowed */
        spgste = pgste_get_lock(sptep);
        spte = *sptep;
        if (!(pte_val(spte) & _PAGE_INVALID) &&
            !((pte_val(spte) & _PAGE_PROTECT) &&
              !(pte_val(pte) & _PAGE_PROTECT))) {
                pgste_val(spgste) |= PGSTE_VSIE_BIT;
                tpgste = pgste_get_lock(tptep);
                tpte = __pte((pte_val(spte) & PAGE_MASK) |
                             (pte_val(pte) & _PAGE_PROTECT));
                /* don't touch the storage key - it belongs to parent pgste */
                tpgste = pgste_set_pte(tptep, tpgste, tpte);
                pgste_set_unlock(tptep, tpgste);
                rc = 1;
        }
        pgste_set_unlock(sptep, spgste);
        return rc;
}

void ptep_unshadow_pte(struct mm_struct *mm, unsigned long saddr, pte_t *ptep)
{
        pgste_t pgste;
        int nodat;

        pgste = pgste_get_lock(ptep);
        /* notifier is called by the caller */
        nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
        ptep_flush_direct(mm, saddr, ptep, nodat);
        /* don't touch the storage key - it belongs to parent pgste */
        pgste = pgste_set_pte(ptep, pgste, __pte(_PAGE_INVALID));
        pgste_set_unlock(ptep, pgste);
}
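
/*
 * Release what a zapped swap pte still holds: the MM_SWAPENTS counter
 * for a real swap entry, the page counter for a migration entry, and
 * finally the swap/cache slot itself.
 */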
static void ptep_zap_swap_entry(struct mm_struct *mm, swp_entry_t entry)
{
        if (!non_swap_entry(entry))
                dec_mm_counter(mm, MM_SWAPENTS);
        else if (is_migration_entry(entry)) {
                struct page *page = pfn_swap_entry_to_page(entry);

                dec_mm_counter(mm, mm_counter(page));
        }
        free_swap_and_cache(entry);
}

void ptep_zap_unused(struct mm_struct *mm, unsigned long addr,
                     pte_t *ptep, int reset)
{
        unsigned long pgstev;
        pgste_t pgste;
        pte_t pte;

        /* Zap unused and logically-zero pages */
        preempt_disable();
        pgste = pgste_get_lock(ptep);
        pgstev = pgste_val(pgste);
        pte = *ptep;
        if (!reset && pte_swap(pte) &&
            ((pgstev & _PGSTE_GPS_USAGE_MASK) == _PGSTE_GPS_USAGE_UNUSED ||
             (pgstev & _PGSTE_GPS_ZERO))) {
                ptep_zap_swap_entry(mm, pte_to_swp_entry(pte));
                pte_clear(mm, addr, ptep);
        }
        if (reset)
                pgste_val(pgste) &= ~(_PGSTE_GPS_USAGE_MASK | _PGSTE_GPS_NODAT);
        pgste_set_unlock(ptep, pgste);
        preempt_enable();
}

void ptep_zap_key(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
{
        unsigned long ptev;
        pgste_t pgste;

        /* Clear storage key ACC and F, but set R/C */
        preempt_disable();
        pgste = pgste_get_lock(ptep);
        pgste_val(pgste) &= ~(PGSTE_ACC_BITS | PGSTE_FP_BIT);
        pgste_val(pgste) |= PGSTE_GR_BIT | PGSTE_GC_BIT;
        ptev = pte_val(*ptep);
        if (!(ptev & _PAGE_INVALID) && (ptev & _PAGE_WRITE))
                page_set_storage_key(ptev & PAGE_MASK, PAGE_DEFAULT_KEY, 0);
        pgste_set_unlock(ptep, pgste);
        preempt_enable();
}

/*
 * Test and reset if a guest page is dirty
 */
bool ptep_test_and_clear_uc(struct mm_struct *mm, unsigned long addr,
                            pte_t *ptep)
{
        pgste_t pgste;
        pte_t pte;
        bool dirty;
        int nodat;

        pgste = pgste_get_lock(ptep);
        dirty = !!(pgste_val(pgste) & PGSTE_UC_BIT);
        pgste_val(pgste) &= ~PGSTE_UC_BIT;
        pte = *ptep;
        if (dirty && (pte_val(pte) & _PAGE_PRESENT)) {
                pgste = pgste_pte_notify(mm, addr, ptep, pgste);
                nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
                ptep_ipte_global(mm, addr, ptep, nodat);
                if (MACHINE_HAS_ESOP || !(pte_val(pte) & _PAGE_WRITE))
                        pte = set_pte_bit(pte, __pgprot(_PAGE_PROTECT));
                else
                        pte = set_pte_bit(pte, __pgprot(_PAGE_INVALID));
                set_pte(ptep, pte);
        }
        pgste_set_unlock(ptep, pgste);
        return dirty;
}
EXPORT_SYMBOL_GPL(ptep_test_and_clear_uc);
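
/*
 * Write a guest storage key. For a mapped huge page the key is set on
 * the real page directly; otherwise the key byte is mirrored into the
 * PGSTE: the R/C bits shift by 48 into the guest GR/GC bits, ACC and F
 * shift by 56 into the PGSTE key field, and the host's prior R/C state
 * shifts by 52 into the host HR/HC bits.
 */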
int set_guest_storage_key(struct mm_struct *mm, unsigned long addr,
                          unsigned char key, bool nq)
{
        unsigned long keyul, paddr;
        spinlock_t *ptl;
        pgste_t old, new;
        pmd_t *pmdp;
        pte_t *ptep;

        /*
         * If we don't have a PTE table and if there is no huge page mapped,
         * we can ignore attempts to set the key to 0, because it already is 0.
         */
        switch (pmd_lookup(mm, addr, &pmdp)) {
        case -ENOENT:
                return key ? -EFAULT : 0;
        case 0:
                break;
        default:
                return -EFAULT;
        }

        ptl = pmd_lock(mm, pmdp);
        if (!pmd_present(*pmdp)) {
                spin_unlock(ptl);
                return key ? -EFAULT : 0;
        }

        if (pmd_large(*pmdp)) {
                paddr = pmd_val(*pmdp) & HPAGE_MASK;
                paddr |= addr & ~HPAGE_MASK;
                /*
                 * Huge pmds need quiescing operations; they are
                 * always mapped.
                 */
                page_set_storage_key(paddr, key, 1);
                spin_unlock(ptl);
                return 0;
        }
        spin_unlock(ptl);

        ptep = pte_offset_map_lock(mm, pmdp, addr, &ptl);
        new = old = pgste_get_lock(ptep);
        pgste_val(new) &= ~(PGSTE_GR_BIT | PGSTE_GC_BIT |
                            PGSTE_ACC_BITS | PGSTE_FP_BIT);
        keyul = (unsigned long) key;
        pgste_val(new) |= (keyul & (_PAGE_CHANGED | _PAGE_REFERENCED)) << 48;
        pgste_val(new) |= (keyul & (_PAGE_ACC_BITS | _PAGE_FP_BIT)) << 56;
        if (!(pte_val(*ptep) & _PAGE_INVALID)) {
                unsigned long bits, skey;

                paddr = pte_val(*ptep) & PAGE_MASK;
                skey = (unsigned long) page_get_storage_key(paddr);
                bits = skey & (_PAGE_CHANGED | _PAGE_REFERENCED);
                skey = key & (_PAGE_ACC_BITS | _PAGE_FP_BIT);
                /* Set storage key ACC and FP */
                page_set_storage_key(paddr, skey, !nq);
                /* Merge host changed & referenced into pgste */
                pgste_val(new) |= bits << 52;
        }
        /* changing the guest storage key is considered a change of the page */
        if ((pgste_val(new) ^ pgste_val(old)) &
            (PGSTE_ACC_BITS | PGSTE_FP_BIT | PGSTE_GR_BIT | PGSTE_GC_BIT))
                pgste_val(new) |= PGSTE_UC_BIT;

        pgste_set_unlock(ptep, new);
        pte_unmap_unlock(ptep, ptl);
        return 0;
}
EXPORT_SYMBOL(set_guest_storage_key);

/*
 * Conditionally set a guest storage key (handling csske).
 * oldkey will be updated when either mr or mc is set and a pointer is given.
 *
 * Returns 0 if a guest's storage key update wasn't necessary, 1 if the guest
 * storage key was updated and -EFAULT on access errors.
 */
int cond_set_guest_storage_key(struct mm_struct *mm, unsigned long addr,
                               unsigned char key, unsigned char *oldkey,
                               bool nq, bool mr, bool mc)
{
        unsigned char tmp, mask = _PAGE_ACC_BITS | _PAGE_FP_BIT;
        int rc;

        /* we can drop the pgste lock between getting and setting the key */
        if (mr | mc) {
                rc = get_guest_storage_key(current->mm, addr, &tmp);
                if (rc)
                        return rc;
                if (oldkey)
                        *oldkey = tmp;
                if (!mr)
                        mask |= _PAGE_REFERENCED;
                if (!mc)
                        mask |= _PAGE_CHANGED;
                if (!((tmp ^ key) & mask))
                        return 0;
        }
        rc = set_guest_storage_key(current->mm, addr, key, nq);
        return rc < 0 ? rc : 1;
}
EXPORT_SYMBOL(cond_set_guest_storage_key);

/*
 * Reset a guest reference bit (rrbe), returning the reference and changed bit.
 *
 * Returns < 0 in case of error, otherwise the cc to be reported to the guest.
 */
int reset_guest_reference_bit(struct mm_struct *mm, unsigned long addr)
{
        spinlock_t *ptl;
        unsigned long paddr;
        pgste_t old, new;
        pmd_t *pmdp;
        pte_t *ptep;
        int cc = 0;

        /*
         * If we don't have a PTE table and if there is no huge page mapped,
         * the storage key is 0 and there is nothing for us to do.
         */
        switch (pmd_lookup(mm, addr, &pmdp)) {
        case -ENOENT:
                return 0;
        case 0:
                break;
        default:
                return -EFAULT;
        }

        ptl = pmd_lock(mm, pmdp);
        if (!pmd_present(*pmdp)) {
                spin_unlock(ptl);
                return 0;
        }

        if (pmd_large(*pmdp)) {
                paddr = pmd_val(*pmdp) & HPAGE_MASK;
                paddr |= addr & ~HPAGE_MASK;
                cc = page_reset_referenced(paddr);
                spin_unlock(ptl);
                return cc;
        }
        spin_unlock(ptl);

        ptep = pte_offset_map_lock(mm, pmdp, addr, &ptl);
        new = old = pgste_get_lock(ptep);
        /* Reset guest reference bit only */
        pgste_val(new) &= ~PGSTE_GR_BIT;
        if (!(pte_val(*ptep) & _PAGE_INVALID)) {
                paddr = pte_val(*ptep) & PAGE_MASK;
                cc = page_reset_referenced(paddr);
                /* Merge real referenced bit into host-set */
                pgste_val(new) |= ((unsigned long) cc << 53) & PGSTE_HR_BIT;
        }
        /* Reflect guest's logical view, not physical */
        cc |= (pgste_val(old) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 49;
        /* Changing the guest storage key is considered a change of the page */
        if ((pgste_val(new) ^ pgste_val(old)) & PGSTE_GR_BIT)
                pgste_val(new) |= PGSTE_UC_BIT;

        pgste_set_unlock(ptep, new);
        pte_unmap_unlock(ptep, ptl);
        return cc;
}
EXPORT_SYMBOL(reset_guest_reference_bit);

int get_guest_storage_key(struct mm_struct *mm, unsigned long addr,
                          unsigned char *key)
{
        unsigned long paddr;
        spinlock_t *ptl;
        pgste_t pgste;
        pmd_t *pmdp;
        pte_t *ptep;

        /*
         * If we don't have a PTE table and if there is no huge page mapped,
         * the storage key is 0.
         */
        *key = 0;

        switch (pmd_lookup(mm, addr, &pmdp)) {
        case -ENOENT:
                return 0;
        case 0:
                break;
        default:
                return -EFAULT;
        }

        ptl = pmd_lock(mm, pmdp);
        if (!pmd_present(*pmdp)) {
                spin_unlock(ptl);
                return 0;
        }

        if (pmd_large(*pmdp)) {
                paddr = pmd_val(*pmdp) & HPAGE_MASK;
                paddr |= addr & ~HPAGE_MASK;
                *key = page_get_storage_key(paddr);
                spin_unlock(ptl);
                return 0;
        }
        spin_unlock(ptl);

        ptep = pte_offset_map_lock(mm, pmdp, addr, &ptl);
        pgste = pgste_get_lock(ptep);
        *key = (pgste_val(pgste) & (PGSTE_ACC_BITS | PGSTE_FP_BIT)) >> 56;
        paddr = pte_val(*ptep) & PAGE_MASK;
        if (!(pte_val(*ptep) & _PAGE_INVALID))
                *key = page_get_storage_key(paddr);
        /* Reflect guest's logical view, not physical */
        *key |= (pgste_val(pgste) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 48;
        pgste_set_unlock(ptep, pgste);
        pte_unmap_unlock(ptep, ptl);
        return 0;
}
EXPORT_SYMBOL(get_guest_storage_key);

/**
 * pgste_perform_essa - perform ESSA actions on the PGSTE.
 * @mm: the memory context. It must have PGSTEs, no check is performed here!
 * @hva: the host virtual address of the page whose PGSTE is to be processed
 * @orc: the specific action to perform, see the ESSA_SET_* macros.
 * @oldpte: the PTE will be saved there if the pointer is not NULL.
 * @oldpgste: the old PGSTE will be saved there if the pointer is not NULL.
 *
 * Return: 1 if the page is to be added to the CBRL, otherwise 0,
 *         or < 0 in case of error. -EINVAL is returned for invalid values
 *         of orc, -EFAULT for invalid addresses.
 */
int pgste_perform_essa(struct mm_struct *mm, unsigned long hva, int orc,
                       unsigned long *oldpte, unsigned long *oldpgste)
{
        struct vm_area_struct *vma;
        unsigned long pgstev;
        spinlock_t *ptl;
        pgste_t pgste;
        pte_t *ptep;
        int res = 0;

        WARN_ON_ONCE(orc > ESSA_MAX);
        if (unlikely(orc > ESSA_MAX))
                return -EINVAL;

        vma = vma_lookup(mm, hva);
        if (!vma || is_vm_hugetlb_page(vma))
                return -EFAULT;
        ptep = get_locked_pte(mm, hva, &ptl);
        if (unlikely(!ptep))
                return -EFAULT;
        pgste = pgste_get_lock(ptep);
        pgstev = pgste_val(pgste);
        if (oldpte)
                *oldpte = pte_val(*ptep);
        if (oldpgste)
                *oldpgste = pgstev;

        switch (orc) {
        case ESSA_GET_STATE:
                break;
        case ESSA_SET_STABLE:
                pgstev &= ~(_PGSTE_GPS_USAGE_MASK | _PGSTE_GPS_NODAT);
                pgstev |= _PGSTE_GPS_USAGE_STABLE;
                break;
        case ESSA_SET_UNUSED:
                pgstev &= ~_PGSTE_GPS_USAGE_MASK;
                pgstev |= _PGSTE_GPS_USAGE_UNUSED;
                if (pte_val(*ptep) & _PAGE_INVALID)
                        res = 1;
                break;
        case ESSA_SET_VOLATILE:
                pgstev &= ~_PGSTE_GPS_USAGE_MASK;
                pgstev |= _PGSTE_GPS_USAGE_VOLATILE;
                if (pte_val(*ptep) & _PAGE_INVALID)
                        res = 1;
                break;
        case ESSA_SET_POT_VOLATILE:
                pgstev &= ~_PGSTE_GPS_USAGE_MASK;
                if (!(pte_val(*ptep) & _PAGE_INVALID)) {
                        pgstev |= _PGSTE_GPS_USAGE_POT_VOLATILE;
                        break;
                }
                if (pgstev & _PGSTE_GPS_ZERO) {
                        pgstev |= _PGSTE_GPS_USAGE_VOLATILE;
                        break;
                }
                if (!(pgstev & PGSTE_GC_BIT)) {
                        pgstev |= _PGSTE_GPS_USAGE_VOLATILE;
                        res = 1;
                        break;
                }
                break;
        case ESSA_SET_STABLE_RESIDENT:
                pgstev &= ~_PGSTE_GPS_USAGE_MASK;
                pgstev |= _PGSTE_GPS_USAGE_STABLE;
                /*
                 * Since the resident state can go away any time after this
                 * call, we will not make this page resident. We can revisit
                 * this decision if a guest will ever start using this.
                 */
                break;
        case ESSA_SET_STABLE_IF_RESIDENT:
                if (!(pte_val(*ptep) & _PAGE_INVALID)) {
                        pgstev &= ~_PGSTE_GPS_USAGE_MASK;
                        pgstev |= _PGSTE_GPS_USAGE_STABLE;
                }
                break;
        case ESSA_SET_STABLE_NODAT:
                pgstev &= ~_PGSTE_GPS_USAGE_MASK;
                pgstev |= _PGSTE_GPS_USAGE_STABLE | _PGSTE_GPS_NODAT;
                break;
        default:
                /* we should never get here! */
                break;
        }
        /* If we are discarding a page, set it to logical zero */
        if (res)
                pgstev |= _PGSTE_GPS_ZERO;

        pgste_val(pgste) = pgstev;
        pgste_set_unlock(ptep, pgste);
        pte_unmap_unlock(ptep, ptl);
        return res;
}
EXPORT_SYMBOL(pgste_perform_essa);

/**
 * set_pgste_bits - set specific PGSTE bits.
 * @mm: the memory context. It must have PGSTEs, no check is performed here!
 * @hva: the host virtual address of the page whose PGSTE is to be processed
 * @bits: a bitmask representing the bits that will be touched
 * @value: the values of the bits to be written. Only the bits in the mask
 *         will be written.
 *
 * Return: 0 on success, < 0 in case of error.
 */
int set_pgste_bits(struct mm_struct *mm, unsigned long hva,
                   unsigned long bits, unsigned long value)
{
        struct vm_area_struct *vma;
        spinlock_t *ptl;
        pgste_t new;
        pte_t *ptep;

        vma = vma_lookup(mm, hva);
        if (!vma || is_vm_hugetlb_page(vma))
                return -EFAULT;
        ptep = get_locked_pte(mm, hva, &ptl);
        if (unlikely(!ptep))
                return -EFAULT;
        new = pgste_get_lock(ptep);

        pgste_val(new) &= ~bits;
        pgste_val(new) |= value & bits;

        pgste_set_unlock(ptep, new);
        pte_unmap_unlock(ptep, ptl);
        return 0;
}
EXPORT_SYMBOL(set_pgste_bits);

/**
 * get_pgste - get the current PGSTE for the given address.
 * @mm: the memory context. It must have PGSTEs, no check is performed here!
 * @hva: the host virtual address of the page whose PGSTE is to be processed
 * @pgstep: will be written with the current PGSTE for the given address.
 *
 * Return: 0 on success, < 0 in case of error.
 */
int get_pgste(struct mm_struct *mm, unsigned long hva, unsigned long *pgstep)
{
        struct vm_area_struct *vma;
        spinlock_t *ptl;
        pte_t *ptep;

        vma = vma_lookup(mm, hva);
        if (!vma || is_vm_hugetlb_page(vma))
                return -EFAULT;
        ptep = get_locked_pte(mm, hva, &ptl);
        if (unlikely(!ptep))
                return -EFAULT;
        *pgstep = pgste_val(pgste_get(ptep));
        pte_unmap_unlock(ptep, ptl);
        return 0;
}
EXPORT_SYMBOL(get_pgste);
#endif