linux/include/linux/swapops.h
<<
>>
Prefs
   1/* SPDX-License-Identifier: GPL-2.0 */
   2#ifndef _LINUX_SWAPOPS_H
   3#define _LINUX_SWAPOPS_H
   4
   5#include <linux/radix-tree.h>
   6#include <linux/bug.h>
   7#include <linux/mm_types.h>
   8
   9#ifdef CONFIG_MMU
  10
  11/*
  12 * swapcache pages are stored in the swapper_space radix tree.  We want to
  13 * get good packing density in that tree, so the index should be dense in
  14 * the low-order bits.
  15 *
  16 * We arrange the `type' and `offset' fields so that `type' is at the seven
  17 * high-order bits of the swp_entry_t and `offset' is right-aligned in the
  18 * remaining bits.  Although `type' itself needs only five bits, we allow for
  19 * shmem/tmpfs to shift it all up a further two bits: see swp_to_radix_entry().
  20 *
  21 * swp_entry_t's are *never* stored anywhere in their arch-dependent format.
  22 */
  23#define SWP_TYPE_SHIFT  (BITS_PER_XA_VALUE - MAX_SWAPFILES_SHIFT)
  24#define SWP_OFFSET_MASK ((1UL << SWP_TYPE_SHIFT) - 1)
  25
  26/* Clear all flags but only keep swp_entry_t related information */
  27static inline pte_t pte_swp_clear_flags(pte_t pte)
  28{
  29        if (pte_swp_soft_dirty(pte))
  30                pte = pte_swp_clear_soft_dirty(pte);
  31        if (pte_swp_uffd_wp(pte))
  32                pte = pte_swp_clear_uffd_wp(pte);
  33        return pte;
  34}
  35
  36/*
  37 * Store a type+offset into a swp_entry_t in an arch-independent format
  38 */
  39static inline swp_entry_t swp_entry(unsigned long type, pgoff_t offset)
  40{
  41        swp_entry_t ret;
  42
  43        ret.val = (type << SWP_TYPE_SHIFT) | (offset & SWP_OFFSET_MASK);
  44        return ret;
  45}
  46
  47/*
  48 * Extract the `type' field from a swp_entry_t.  The swp_entry_t is in
  49 * arch-independent format
  50 */
  51static inline unsigned swp_type(swp_entry_t entry)
  52{
  53        return (entry.val >> SWP_TYPE_SHIFT);
  54}
  55
  56/*
  57 * Extract the `offset' field from a swp_entry_t.  The swp_entry_t is in
  58 * arch-independent format
  59 */
  60static inline pgoff_t swp_offset(swp_entry_t entry)
  61{
  62        return entry.val & SWP_OFFSET_MASK;
  63}
  64
  65/* check whether a pte points to a swap entry */
  66static inline int is_swap_pte(pte_t pte)
  67{
  68        return !pte_none(pte) && !pte_present(pte);
  69}
  70
  71/*
  72 * Convert the arch-dependent pte representation of a swp_entry_t into an
  73 * arch-independent swp_entry_t.
  74 */
  75static inline swp_entry_t pte_to_swp_entry(pte_t pte)
  76{
  77        swp_entry_t arch_entry;
  78
  79        pte = pte_swp_clear_flags(pte);
  80        arch_entry = __pte_to_swp_entry(pte);
  81        return swp_entry(__swp_type(arch_entry), __swp_offset(arch_entry));
  82}
  83
  84/*
  85 * Convert the arch-independent representation of a swp_entry_t into the
  86 * arch-dependent pte representation.
  87 */
  88static inline pte_t swp_entry_to_pte(swp_entry_t entry)
  89{
  90        swp_entry_t arch_entry;
  91
  92        arch_entry = __swp_entry(swp_type(entry), swp_offset(entry));
  93        return __swp_entry_to_pte(arch_entry);
  94}
  95
  96static inline swp_entry_t radix_to_swp_entry(void *arg)
  97{
  98        swp_entry_t entry;
  99
 100        entry.val = xa_to_value(arg);
 101        return entry;
 102}
 103
 104static inline void *swp_to_radix_entry(swp_entry_t entry)
 105{
 106        return xa_mk_value(entry.val);
 107}
 108
 109#if IS_ENABLED(CONFIG_DEVICE_PRIVATE)
 110static inline swp_entry_t make_readable_device_private_entry(pgoff_t offset)
 111{
 112        return swp_entry(SWP_DEVICE_READ, offset);
 113}
 114
 115static inline swp_entry_t make_writable_device_private_entry(pgoff_t offset)
 116{
 117        return swp_entry(SWP_DEVICE_WRITE, offset);
 118}
 119
 120static inline bool is_device_private_entry(swp_entry_t entry)
 121{
 122        int type = swp_type(entry);
 123        return type == SWP_DEVICE_READ || type == SWP_DEVICE_WRITE;
 124}
 125
 126static inline bool is_writable_device_private_entry(swp_entry_t entry)
 127{
 128        return unlikely(swp_type(entry) == SWP_DEVICE_WRITE);
 129}
 130
 131static inline swp_entry_t make_readable_device_exclusive_entry(pgoff_t offset)
 132{
 133        return swp_entry(SWP_DEVICE_EXCLUSIVE_READ, offset);
 134}
 135
 136static inline swp_entry_t make_writable_device_exclusive_entry(pgoff_t offset)
 137{
 138        return swp_entry(SWP_DEVICE_EXCLUSIVE_WRITE, offset);
 139}
 140
 141static inline bool is_device_exclusive_entry(swp_entry_t entry)
 142{
 143        return swp_type(entry) == SWP_DEVICE_EXCLUSIVE_READ ||
 144                swp_type(entry) == SWP_DEVICE_EXCLUSIVE_WRITE;
 145}
 146
 147static inline bool is_writable_device_exclusive_entry(swp_entry_t entry)
 148{
 149        return unlikely(swp_type(entry) == SWP_DEVICE_EXCLUSIVE_WRITE);
 150}
 151#else /* CONFIG_DEVICE_PRIVATE */
 152static inline swp_entry_t make_readable_device_private_entry(pgoff_t offset)
 153{
 154        return swp_entry(0, 0);
 155}
 156
 157static inline swp_entry_t make_writable_device_private_entry(pgoff_t offset)
 158{
 159        return swp_entry(0, 0);
 160}
 161
 162static inline bool is_device_private_entry(swp_entry_t entry)
 163{
 164        return false;
 165}
 166
 167static inline bool is_writable_device_private_entry(swp_entry_t entry)
 168{
 169        return false;
 170}
 171
 172static inline swp_entry_t make_readable_device_exclusive_entry(pgoff_t offset)
 173{
 174        return swp_entry(0, 0);
 175}
 176
 177static inline swp_entry_t make_writable_device_exclusive_entry(pgoff_t offset)
 178{
 179        return swp_entry(0, 0);
 180}
 181
 182static inline bool is_device_exclusive_entry(swp_entry_t entry)
 183{
 184        return false;
 185}
 186
 187static inline bool is_writable_device_exclusive_entry(swp_entry_t entry)
 188{
 189        return false;
 190}
 191#endif /* CONFIG_DEVICE_PRIVATE */
 192
 193#ifdef CONFIG_MIGRATION
 194static inline int is_migration_entry(swp_entry_t entry)
 195{
 196        return unlikely(swp_type(entry) == SWP_MIGRATION_READ ||
 197                        swp_type(entry) == SWP_MIGRATION_WRITE);
 198}
 199
 200static inline int is_writable_migration_entry(swp_entry_t entry)
 201{
 202        return unlikely(swp_type(entry) == SWP_MIGRATION_WRITE);
 203}
 204
 205static inline swp_entry_t make_readable_migration_entry(pgoff_t offset)
 206{
 207        return swp_entry(SWP_MIGRATION_READ, offset);
 208}
 209
 210static inline swp_entry_t make_writable_migration_entry(pgoff_t offset)
 211{
 212        return swp_entry(SWP_MIGRATION_WRITE, offset);
 213}
 214
 215extern void __migration_entry_wait(struct mm_struct *mm, pte_t *ptep,
 216                                        spinlock_t *ptl);
 217extern void migration_entry_wait(struct mm_struct *mm, pmd_t *pmd,
 218                                        unsigned long address);
 219extern void migration_entry_wait_huge(struct vm_area_struct *vma,
 220                struct mm_struct *mm, pte_t *pte);
 221#else
 222static inline swp_entry_t make_readable_migration_entry(pgoff_t offset)
 223{
 224        return swp_entry(0, 0);
 225}
 226
 227static inline swp_entry_t make_writable_migration_entry(pgoff_t offset)
 228{
 229        return swp_entry(0, 0);
 230}
 231
 232static inline int is_migration_entry(swp_entry_t swp)
 233{
 234        return 0;
 235}
 236
 237static inline void __migration_entry_wait(struct mm_struct *mm, pte_t *ptep,
 238                                        spinlock_t *ptl) { }
 239static inline void migration_entry_wait(struct mm_struct *mm, pmd_t *pmd,
 240                                         unsigned long address) { }
 241static inline void migration_entry_wait_huge(struct vm_area_struct *vma,
 242                struct mm_struct *mm, pte_t *pte) { }
 243static inline int is_writable_migration_entry(swp_entry_t entry)
 244{
 245        return 0;
 246}
 247
 248#endif
 249
 250static inline struct page *pfn_swap_entry_to_page(swp_entry_t entry)
 251{
 252        struct page *p = pfn_to_page(swp_offset(entry));
 253
 254        /*
 255         * Any use of migration entries may only occur while the
 256         * corresponding page is locked
 257         */
 258        BUG_ON(is_migration_entry(entry) && !PageLocked(p));
 259
 260        return p;
 261}
 262
 263/*
 264 * A pfn swap entry is a special type of swap entry that always has a pfn stored
 265 * in the swap offset. They are used to represent unaddressable device memory
 266 * and to restrict access to a page undergoing migration.
 267 */
 268static inline bool is_pfn_swap_entry(swp_entry_t entry)
 269{
 270        return is_migration_entry(entry) || is_device_private_entry(entry) ||
 271               is_device_exclusive_entry(entry);
 272}
 273
 274struct page_vma_mapped_walk;
 275
 276#ifdef CONFIG_ARCH_ENABLE_THP_MIGRATION
 277extern void set_pmd_migration_entry(struct page_vma_mapped_walk *pvmw,
 278                struct page *page);
 279
 280extern void remove_migration_pmd(struct page_vma_mapped_walk *pvmw,
 281                struct page *new);
 282
 283extern void pmd_migration_entry_wait(struct mm_struct *mm, pmd_t *pmd);
 284
 285static inline swp_entry_t pmd_to_swp_entry(pmd_t pmd)
 286{
 287        swp_entry_t arch_entry;
 288
 289        if (pmd_swp_soft_dirty(pmd))
 290                pmd = pmd_swp_clear_soft_dirty(pmd);
 291        if (pmd_swp_uffd_wp(pmd))
 292                pmd = pmd_swp_clear_uffd_wp(pmd);
 293        arch_entry = __pmd_to_swp_entry(pmd);
 294        return swp_entry(__swp_type(arch_entry), __swp_offset(arch_entry));
 295}
 296
 297static inline pmd_t swp_entry_to_pmd(swp_entry_t entry)
 298{
 299        swp_entry_t arch_entry;
 300
 301        arch_entry = __swp_entry(swp_type(entry), swp_offset(entry));
 302        return __swp_entry_to_pmd(arch_entry);
 303}
 304
 305static inline int is_pmd_migration_entry(pmd_t pmd)
 306{
 307        return !pmd_present(pmd) && is_migration_entry(pmd_to_swp_entry(pmd));
 308}
 309#else
 310static inline void set_pmd_migration_entry(struct page_vma_mapped_walk *pvmw,
 311                struct page *page)
 312{
 313        BUILD_BUG();
 314}
 315
 316static inline void remove_migration_pmd(struct page_vma_mapped_walk *pvmw,
 317                struct page *new)
 318{
 319        BUILD_BUG();
 320}
 321
 322static inline void pmd_migration_entry_wait(struct mm_struct *m, pmd_t *p) { }
 323
 324static inline swp_entry_t pmd_to_swp_entry(pmd_t pmd)
 325{
 326        return swp_entry(0, 0);
 327}
 328
 329static inline pmd_t swp_entry_to_pmd(swp_entry_t entry)
 330{
 331        return __pmd(0);
 332}
 333
 334static inline int is_pmd_migration_entry(pmd_t pmd)
 335{
 336        return 0;
 337}
 338#endif
 339
 340#ifdef CONFIG_MEMORY_FAILURE
 341
 342extern atomic_long_t num_poisoned_pages __read_mostly;
 343
 344/*
 345 * Support for hardware poisoned pages
 346 */
 347static inline swp_entry_t make_hwpoison_entry(struct page *page)
 348{
 349        BUG_ON(!PageLocked(page));
 350        return swp_entry(SWP_HWPOISON, page_to_pfn(page));
 351}
 352
 353static inline int is_hwpoison_entry(swp_entry_t entry)
 354{
 355        return swp_type(entry) == SWP_HWPOISON;
 356}
 357
 358static inline unsigned long hwpoison_entry_to_pfn(swp_entry_t entry)
 359{
 360        return swp_offset(entry);
 361}
 362
 363static inline void num_poisoned_pages_inc(void)
 364{
 365        atomic_long_inc(&num_poisoned_pages);
 366}
 367
 368static inline void num_poisoned_pages_dec(void)
 369{
 370        atomic_long_dec(&num_poisoned_pages);
 371}
 372
 373#else
 374
 375static inline swp_entry_t make_hwpoison_entry(struct page *page)
 376{
 377        return swp_entry(0, 0);
 378}
 379
 380static inline int is_hwpoison_entry(swp_entry_t swp)
 381{
 382        return 0;
 383}
 384
 385static inline void num_poisoned_pages_inc(void)
 386{
 387}
 388#endif
 389
 390#if defined(CONFIG_MEMORY_FAILURE) || defined(CONFIG_MIGRATION) || \
 391    defined(CONFIG_DEVICE_PRIVATE)
 392static inline int non_swap_entry(swp_entry_t entry)
 393{
 394        return swp_type(entry) >= MAX_SWAPFILES;
 395}
 396#else
 397static inline int non_swap_entry(swp_entry_t entry)
 398{
 399        return 0;
 400}
 401#endif
 402
 403#endif /* CONFIG_MMU */
 404#endif /* _LINUX_SWAPOPS_H */
 405