linux/fs/ext4/ext4.h
<<
>>
Prefs
   1/*
   2 *  ext4.h
   3 *
   4 * Copyright (C) 1992, 1993, 1994, 1995
   5 * Remy Card (card@masi.ibp.fr)
   6 * Laboratoire MASI - Institut Blaise Pascal
   7 * Universite Pierre et Marie Curie (Paris VI)
   8 *
   9 *  from
  10 *
  11 *  linux/include/linux/minix_fs.h
  12 *
  13 *  Copyright (C) 1991, 1992  Linus Torvalds
  14 */
  15
  16#ifndef _EXT4_H
  17#define _EXT4_H
  18
  19#include <linux/types.h>
  20#include <linux/blkdev.h>
  21#include <linux/magic.h>
  22#include <linux/jbd2.h>
  23#include <linux/quota.h>
  24#include <linux/rwsem.h>
  25#include <linux/rbtree.h>
  26#include <linux/seqlock.h>
  27#include <linux/mutex.h>
  28#include <linux/timer.h>
  29#include <linux/version.h>
  30#include <linux/wait.h>
  31#include <linux/blockgroup_lock.h>
  32#include <linux/percpu_counter.h>
  33#include <linux/ratelimit.h>
  34#include <crypto/hash.h>
  35#include <linux/fscrypto.h>
  36#include <linux/falloc.h>
  37#include <linux/percpu-rwsem.h>
  38#ifdef __KERNEL__
  39#include <linux/compat.h>
  40#endif
  41
  42/*
  43 * The fourth extended filesystem constants/structures
  44 */
  45
/*
 * with AGGRESSIVE_CHECK allocator runs consistency checks over
 * structures. these checks slow things down a lot
 *
 * Only AGGRESSIVE_CHECK__ (with trailing underscores) is defined below,
 * so this header leaves AGGRESSIVE_CHECK itself undefined.
 */
#define AGGRESSIVE_CHECK__

/*
 * with DOUBLE_CHECK defined mballoc creates persistent in-core
 * bitmaps, maintains and uses them to check for double allocations
 *
 * As above, only DOUBLE_CHECK__ is defined here.
 */
#define DOUBLE_CHECK__

/*
 * Define EXT4FS_DEBUG to produce debug messages
 * (it is explicitly undefined here, which selects the no_printk()
 * variant of ext4_debug() further down).
 */
#undef EXT4FS_DEBUG
  62
  63/*
  64 * Debug code
  65 */
  66#ifdef EXT4FS_DEBUG
  67#define ext4_debug(f, a...)                                             \
  68        do {                                                            \
  69                printk(KERN_DEBUG "EXT4-fs DEBUG (%s, %d): %s:",        \
  70                        __FILE__, __LINE__, __func__);                  \
  71                printk(KERN_DEBUG f, ## a);                             \
  72        } while (0)
  73#else
  74#define ext4_debug(fmt, ...)    no_printk(fmt, ##__VA_ARGS__)
  75#endif
  76
  77/*
  78 * Turn on EXT_DEBUG to get lots of info about extents operations.
  79 */
  80#define EXT_DEBUG__
  81#ifdef EXT_DEBUG
  82#define ext_debug(fmt, ...)     printk(fmt, ##__VA_ARGS__)
  83#else
  84#define ext_debug(fmt, ...)     no_printk(fmt, ##__VA_ARGS__)
  85#endif
  86
/* data type for a block offset within a block group */
typedef int ext4_grpblk_t;

/* data type for filesystem-wide block numbers */
typedef unsigned long long ext4_fsblk_t;

/* data type for file logical block numbers */
typedef __u32 ext4_lblk_t;

/* data type for block group numbers */
typedef unsigned int ext4_group_t;

/* Direction selector: SHIFT_LEFT is 0, SHIFT_RIGHT is 1. */
enum SHIFT_DIRECTION {
        SHIFT_LEFT = 0,
        SHIFT_RIGHT,
};
 103
/*
 * Flags used in mballoc's allocation_context flags field.
 *
 * Also used to show what's going on for debugging purposes when the
 * flag field is exported via the traceport interface
 *
 * Every flag occupies its own bit, so flags can be OR-ed together.
 */

/* prefer goal again. length -- NOTE(review): wording unclear, confirm intent */
#define EXT4_MB_HINT_MERGE              0x0001
/* blocks already reserved */
#define EXT4_MB_HINT_RESERVED           0x0002
/* metadata is being allocated */
#define EXT4_MB_HINT_METADATA           0x0004
/* first blocks in the file */
#define EXT4_MB_HINT_FIRST              0x0008
/* search for the best chunk */
#define EXT4_MB_HINT_BEST               0x0010
/* data is being allocated */
#define EXT4_MB_HINT_DATA               0x0020
/* don't preallocate (for tails) */
#define EXT4_MB_HINT_NOPREALLOC         0x0040
/* allocate for locality group */
#define EXT4_MB_HINT_GROUP_ALLOC        0x0080
/* allocate goal blocks or none */
#define EXT4_MB_HINT_GOAL_ONLY          0x0100
/* goal is meaningful */
#define EXT4_MB_HINT_TRY_GOAL           0x0200
/* blocks already pre-reserved by delayed allocation */
#define EXT4_MB_DELALLOC_RESERVED       0x0400
/* We are doing stream allocation */
#define EXT4_MB_STREAM_ALLOC            0x0800
/* Use reserved root blocks if needed */
#define EXT4_MB_USE_ROOT_BLOCKS         0x1000
/* Use blocks from reserved pool */
#define EXT4_MB_USE_RESERVED            0x2000
 139
/*
 * Describes one block allocation request: the target inode, how many
 * blocks are wanted, where they sit logically in the file, the nearest
 * already-allocated neighbours on either side (logical and physical),
 * a physical goal hint and the EXT4_MB_* flags.
 */
struct ext4_allocation_request {
        /* target inode for block we're allocating */
        struct inode *inode;
        /* how many blocks we want to allocate */
        unsigned int len;
        /* logical block in target inode */
        ext4_lblk_t logical;
        /* the closest logical allocated block to the left */
        ext4_lblk_t lleft;
        /* the closest logical allocated block to the right */
        ext4_lblk_t lright;
        /* phys. target (a hint) */
        ext4_fsblk_t goal;
        /* phys. block for the closest logical allocated block to the left */
        ext4_fsblk_t pleft;
        /* phys. block for the closest logical allocated block to the right */
        ext4_fsblk_t pright;
        /* flags. see above EXT4_MB_HINT_* */
        unsigned int flags;
};
 160
/*
 * Logical to physical block mapping, used by ext4_map_blocks()
 *
 * This structure is used to pass requests into ext4_map_blocks() as
 * well as to store the information returned by ext4_map_blocks().  It
 * takes less room on the stack than a struct buffer_head.
 *
 * The EXT4_MAP_* bits are built from the corresponding BH_* bit
 * numbers; EXT4_MAP_FLAGS is the union of all four.
 */
#define EXT4_MAP_NEW            (1 << BH_New)
#define EXT4_MAP_MAPPED         (1 << BH_Mapped)
#define EXT4_MAP_UNWRITTEN      (1 << BH_Unwritten)
#define EXT4_MAP_BOUNDARY       (1 << BH_Boundary)
#define EXT4_MAP_FLAGS          (EXT4_MAP_NEW | EXT4_MAP_MAPPED |\
                                 EXT4_MAP_UNWRITTEN | EXT4_MAP_BOUNDARY)

struct ext4_map_blocks {
        ext4_fsblk_t m_pblk;    /* filesystem-wide (physical) block number */
        ext4_lblk_t m_lblk;     /* file logical block number */
        unsigned int m_len;     /* NOTE(review): presumably length in blocks -- confirm */
        unsigned int m_flags;   /* NOTE(review): presumably EXT4_MAP_* bits -- confirm */
};
 181
/*
 * Flags for ext4_io_end->flag
 */
#define EXT4_IO_END_UNWRITTEN   0x0001

/*
 * For converting unwritten extents on a work queue. 'handle' is used for
 * buffered writeback.
 */
typedef struct ext4_io_end {
        struct list_head        list;           /* per-file finished IO list */
        handle_t                *handle;        /* handle reserved for extent
                                                 * conversion */
        struct inode            *inode;         /* file being written to */
        struct bio              *bio;           /* Linked list of completed
                                                 * bios covering the extent */
        unsigned int            flag;           /* unwritten or not
                                                 * (EXT4_IO_END_* bits) */
        atomic_t                count;          /* reference counter */
        loff_t                  offset;         /* offset in the file */
        ssize_t                 size;           /* size of the extent */
} ext4_io_end_t;

/*
 * State carried while submitting I/O: the writeback control, the bio
 * and io_end in use, and a block number.
 * NOTE(review): io_next_block is presumably the next block expected to
 * be appended to io_bio -- confirm against the users of this struct.
 */
struct ext4_io_submit {
        struct writeback_control *io_wbc;
        struct bio              *io_bio;
        ext4_io_end_t           *io_end;
        sector_t                io_next_block;
};
 210
/*
 * Special inodes numbers
 *
 * Inodes 1 through 8 have the fixed roles listed below.
 */
#define EXT4_BAD_INO             1      /* Bad blocks inode */
#define EXT4_ROOT_INO            2      /* Root inode */
#define EXT4_USR_QUOTA_INO       3      /* User quota inode */
#define EXT4_GRP_QUOTA_INO       4      /* Group quota inode */
#define EXT4_BOOT_LOADER_INO     5      /* Boot loader inode */
#define EXT4_UNDEL_DIR_INO       6      /* Undelete directory inode */
#define EXT4_RESIZE_INO          7      /* Reserved group descriptors inode */
#define EXT4_JOURNAL_INO         8      /* Journal inode */

/* First non-reserved inode for old ext4 filesystems */
#define EXT4_GOOD_OLD_FIRST_INO 11

/*
 * Maximal count of links to a file
 */
#define EXT4_LINK_MAX           65000
 230
 231/*
 232 * Macro-instructions used to manage several block sizes
 233 */
 234#define EXT4_MIN_BLOCK_SIZE             1024
 235#define EXT4_MAX_BLOCK_SIZE             65536
 236#define EXT4_MIN_BLOCK_LOG_SIZE         10
 237#define EXT4_MAX_BLOCK_LOG_SIZE         16
 238#define EXT4_MAX_CLUSTER_LOG_SIZE       30
 239#ifdef __KERNEL__
 240# define EXT4_BLOCK_SIZE(s)             ((s)->s_blocksize)
 241#else
 242# define EXT4_BLOCK_SIZE(s)             (EXT4_MIN_BLOCK_SIZE << (s)->s_log_block_size)
 243#endif
 244#define EXT4_ADDR_PER_BLOCK(s)          (EXT4_BLOCK_SIZE(s) / sizeof(__u32))
 245#define EXT4_CLUSTER_SIZE(s)            (EXT4_BLOCK_SIZE(s) << \
 246                                         EXT4_SB(s)->s_cluster_bits)
 247#ifdef __KERNEL__
 248# define EXT4_BLOCK_SIZE_BITS(s)        ((s)->s_blocksize_bits)
 249# define EXT4_CLUSTER_BITS(s)           (EXT4_SB(s)->s_cluster_bits)
 250#else
 251# define EXT4_BLOCK_SIZE_BITS(s)        ((s)->s_log_block_size + 10)
 252#endif
 253#ifdef __KERNEL__
 254#define EXT4_ADDR_PER_BLOCK_BITS(s)     (EXT4_SB(s)->s_addr_per_block_bits)
 255#define EXT4_INODE_SIZE(s)              (EXT4_SB(s)->s_inode_size)
 256#define EXT4_FIRST_INO(s)               (EXT4_SB(s)->s_first_ino)
 257#else
 258#define EXT4_INODE_SIZE(s)      (((s)->s_rev_level == EXT4_GOOD_OLD_REV) ? \
 259                                 EXT4_GOOD_OLD_INODE_SIZE : \
 260                                 (s)->s_inode_size)
 261#define EXT4_FIRST_INO(s)       (((s)->s_rev_level == EXT4_GOOD_OLD_REV) ? \
 262                                 EXT4_GOOD_OLD_FIRST_INO : \
 263                                 (s)->s_first_ino)
 264#endif
 265#define EXT4_BLOCK_ALIGN(size, blkbits)         ALIGN((size), (1 << (blkbits)))
 266#define EXT4_MAX_BLOCKS(size, offset, blkbits) \
 267        ((EXT4_BLOCK_ALIGN(size + offset, blkbits) >> blkbits) - (offset >> \
 268                                                                  blkbits))
 269
 270/* Translate a block number to a cluster number */
 271#define EXT4_B2C(sbi, blk)      ((blk) >> (sbi)->s_cluster_bits)
 272/* Translate a cluster number to a block number */
 273#define EXT4_C2B(sbi, cluster)  ((cluster) << (sbi)->s_cluster_bits)
 274/* Translate # of blks to # of clusters */
 275#define EXT4_NUM_B2C(sbi, blks) (((blks) + (sbi)->s_cluster_ratio - 1) >> \
 276                                 (sbi)->s_cluster_bits)
 277/* Mask out the low bits to get the starting block of the cluster */
 278#define EXT4_PBLK_CMASK(s, pblk) ((pblk) &                              \
 279                                  ~((ext4_fsblk_t) (s)->s_cluster_ratio - 1))
 280#define EXT4_LBLK_CMASK(s, lblk) ((lblk) &                              \
 281                                  ~((ext4_lblk_t) (s)->s_cluster_ratio - 1))
 282/* Get the cluster offset */
 283#define EXT4_PBLK_COFF(s, pblk) ((pblk) &                               \
 284                                 ((ext4_fsblk_t) (s)->s_cluster_ratio - 1))
 285#define EXT4_LBLK_COFF(s, lblk) ((lblk) &                               \
 286                                 ((ext4_lblk_t) (s)->s_cluster_ratio - 1))
 287
/*
 * Structure of a blocks group descriptor
 *
 * Most values are split into a *_lo field and a matching *_hi field
 * that carries the most significant bits.
 */
struct ext4_group_desc
{
        __le32  bg_block_bitmap_lo;     /* Blocks bitmap block */
        __le32  bg_inode_bitmap_lo;     /* Inodes bitmap block */
        __le32  bg_inode_table_lo;      /* Inodes table block */
        __le16  bg_free_blocks_count_lo;/* Free blocks count */
        __le16  bg_free_inodes_count_lo;/* Free inodes count */
        __le16  bg_used_dirs_count_lo;  /* Directories count */
        __le16  bg_flags;               /* EXT4_BG_flags (INODE_UNINIT, etc) */
        __le32  bg_exclude_bitmap_lo;   /* Exclude bitmap for snapshots */
        __le16  bg_block_bitmap_csum_lo;/* crc32c(s_uuid+grp_num+bbitmap), low 16 bits */
        __le16  bg_inode_bitmap_csum_lo;/* crc32c(s_uuid+grp_num+ibitmap), low 16 bits */
        __le16  bg_itable_unused_lo;    /* Unused inodes count */
        __le16  bg_checksum;            /* crc16(sb_uuid+group+desc) */
        __le32  bg_block_bitmap_hi;     /* Blocks bitmap block MSB */
        __le32  bg_inode_bitmap_hi;     /* Inodes bitmap block MSB */
        __le32  bg_inode_table_hi;      /* Inodes table block MSB */
        __le16  bg_free_blocks_count_hi;/* Free blocks count MSB */
        __le16  bg_free_inodes_count_hi;/* Free inodes count MSB */
        __le16  bg_used_dirs_count_hi;  /* Directories count MSB */
        __le16  bg_itable_unused_hi;    /* Unused inodes count MSB */
        __le32  bg_exclude_bitmap_hi;   /* Exclude bitmap block MSB */
        __le16  bg_block_bitmap_csum_hi;/* crc32c(s_uuid+grp_num+bbitmap), high 16 bits */
        __le16  bg_inode_bitmap_csum_hi;/* crc32c(s_uuid+grp_num+ibitmap), high 16 bits */
        __u32   bg_reserved;
};

/* Offset of the first byte after bg_inode_bitmap_csum_hi. */
#define EXT4_BG_INODE_BITMAP_CSUM_HI_END        \
        (offsetof(struct ext4_group_desc, bg_inode_bitmap_csum_hi) + \
         sizeof(__le16))
/* Offset of the first byte after bg_block_bitmap_csum_hi. */
#define EXT4_BG_BLOCK_BITMAP_CSUM_HI_END        \
        (offsetof(struct ext4_group_desc, bg_block_bitmap_csum_hi) + \
         sizeof(__le16))
 324
/*
 * Structure of a flex block group info
 *
 * Three atomic counters: free clusters (64-bit), free inodes and
 * used directories.
 */

struct flex_groups {
        atomic64_t      free_clusters;
        atomic_t        free_inodes;
        atomic_t        used_dirs;
};

/* Bits for ext4_group_desc.bg_flags */
#define EXT4_BG_INODE_UNINIT    0x0001 /* Inode table/bitmap not in use */
#define EXT4_BG_BLOCK_UNINIT    0x0002 /* Block bitmap not in use */
#define EXT4_BG_INODE_ZEROED    0x0004 /* On-disk itable initialized to zero */
 338
/*
 * Macro-instructions used to manage group descriptors
 *
 * With __KERNEL__ defined the per-group values come from EXT4_SB(s);
 * otherwise they are read from @s directly or computed from the block
 * and descriptor sizes.
 */
#define EXT4_MIN_DESC_SIZE              32
#define EXT4_MIN_DESC_SIZE_64BIT        64
#define EXT4_MAX_DESC_SIZE              EXT4_MIN_BLOCK_SIZE
#define EXT4_DESC_SIZE(s)               (EXT4_SB(s)->s_desc_size)
#ifdef __KERNEL__
# define EXT4_BLOCKS_PER_GROUP(s)       (EXT4_SB(s)->s_blocks_per_group)
# define EXT4_CLUSTERS_PER_GROUP(s)     (EXT4_SB(s)->s_clusters_per_group)
# define EXT4_DESC_PER_BLOCK(s)         (EXT4_SB(s)->s_desc_per_block)
# define EXT4_INODES_PER_GROUP(s)       (EXT4_SB(s)->s_inodes_per_group)
# define EXT4_DESC_PER_BLOCK_BITS(s)    (EXT4_SB(s)->s_desc_per_block_bits)
#else
# define EXT4_BLOCKS_PER_GROUP(s)       ((s)->s_blocks_per_group)
# define EXT4_DESC_PER_BLOCK(s)         (EXT4_BLOCK_SIZE(s) / EXT4_DESC_SIZE(s))
# define EXT4_INODES_PER_GROUP(s)       ((s)->s_inodes_per_group)
#endif
 357
/*
 * Constants relative to the data blocks
 *
 * Each index is defined as the previous one plus one, so the values
 * expand to 12, 12, 13, 14 and 15 respectively.
 */
#define EXT4_NDIR_BLOCKS                12
#define EXT4_IND_BLOCK                  EXT4_NDIR_BLOCKS
#define EXT4_DIND_BLOCK                 (EXT4_IND_BLOCK + 1)
#define EXT4_TIND_BLOCK                 (EXT4_DIND_BLOCK + 1)
#define EXT4_N_BLOCKS                   (EXT4_TIND_BLOCK + 1)
 366
/*
 * Inode flags
 *
 * Each EXT4_*_FL mask is a single bit; the matching bit numbers are
 * the EXT4_INODE_* enumerators defined further down in this header.
 */
#define EXT4_SECRM_FL                   0x00000001 /* Secure deletion */
#define EXT4_UNRM_FL                    0x00000002 /* Undelete */
#define EXT4_COMPR_FL                   0x00000004 /* Compress file */
#define EXT4_SYNC_FL                    0x00000008 /* Synchronous updates */
#define EXT4_IMMUTABLE_FL               0x00000010 /* Immutable file */
#define EXT4_APPEND_FL                  0x00000020 /* writes to file may only append */
#define EXT4_NODUMP_FL                  0x00000040 /* do not dump file */
#define EXT4_NOATIME_FL                 0x00000080 /* do not update atime */
/* Reserved for compression usage... */
#define EXT4_DIRTY_FL                   0x00000100
#define EXT4_COMPRBLK_FL                0x00000200 /* One or more compressed clusters */
#define EXT4_NOCOMPR_FL                 0x00000400 /* Don't compress */
        /* nb: was previously EXT2_ECOMPR_FL */
#define EXT4_ENCRYPT_FL                 0x00000800 /* encrypted file */
/* End compression flags --- maybe not all used */
#define EXT4_INDEX_FL                   0x00001000 /* hash-indexed directory */
#define EXT4_IMAGIC_FL                  0x00002000 /* AFS directory */
#define EXT4_JOURNAL_DATA_FL            0x00004000 /* file data should be journaled */
#define EXT4_NOTAIL_FL                  0x00008000 /* file tail should not be merged */
#define EXT4_DIRSYNC_FL                 0x00010000 /* dirsync behaviour (directories only) */
#define EXT4_TOPDIR_FL                  0x00020000 /* Top of directory hierarchies */
#define EXT4_HUGE_FILE_FL               0x00040000 /* Set to each huge file */
#define EXT4_EXTENTS_FL                 0x00080000 /* Inode uses extents */
#define EXT4_EA_INODE_FL                0x00200000 /* Inode used for large EA */
#define EXT4_EOFBLOCKS_FL               0x00400000 /* Blocks allocated beyond EOF */
#define EXT4_INLINE_DATA_FL             0x10000000 /* Inode has inline data. */
#define EXT4_PROJINHERIT_FL             0x20000000 /* Create with parents projid */
#define EXT4_RESERVED_FL                0x80000000 /* reserved for ext4 lib */

#define EXT4_FL_USER_VISIBLE            0x304BDFFF /* User visible flags */
#define EXT4_FL_USER_MODIFIABLE         0x204380FF /* User modifiable flags */

/*
 * Subset of the inode flags grouped under the XFLAG name.
 * NOTE(review): presumably the flags reported through the fsxattr
 * (FS_IOC_FSGETXATTR) interface -- confirm against the ioctl code.
 */
#define EXT4_FL_XFLAG_VISIBLE           (EXT4_SYNC_FL | \
                                         EXT4_IMMUTABLE_FL | \
                                         EXT4_APPEND_FL | \
                                         EXT4_NODUMP_FL | \
                                         EXT4_NOATIME_FL | \
                                         EXT4_PROJINHERIT_FL)

/* Flags that should be inherited by new inodes from their parent. */
#define EXT4_FL_INHERITED (EXT4_SECRM_FL | EXT4_UNRM_FL | EXT4_COMPR_FL |\
                           EXT4_SYNC_FL | EXT4_NODUMP_FL | EXT4_NOATIME_FL |\
                           EXT4_NOCOMPR_FL | EXT4_JOURNAL_DATA_FL |\
                           EXT4_NOTAIL_FL | EXT4_DIRSYNC_FL |\
                           EXT4_PROJINHERIT_FL)

/* Flags that are appropriate for regular files (all but dir-specific ones). */
#define EXT4_REG_FLMASK (~(EXT4_DIRSYNC_FL | EXT4_TOPDIR_FL))

/* Flags that are appropriate for non-directories/regular files. */
#define EXT4_OTHER_FLMASK (EXT4_NODUMP_FL | EXT4_NOATIME_FL)
 421
 422/* Mask out flags that are inappropriate for the given type of inode. */
 423static inline __u32 ext4_mask_flags(umode_t mode, __u32 flags)
 424{
 425        if (S_ISDIR(mode))
 426                return flags;
 427        else if (S_ISREG(mode))
 428                return flags & EXT4_REG_FLMASK;
 429        else
 430                return flags & EXT4_OTHER_FLMASK;
 431}
 432
/*
 * Inode flags used for atomic set/get
 *
 * These are bit numbers, not masks: each EXT4_INODE_X is the position
 * of the bit whose mask is EXT4_X_FL.  Bits 20, 23-27 and 30 have no
 * enumerator here.
 */
enum {
        EXT4_INODE_SECRM        = 0,    /* Secure deletion */
        EXT4_INODE_UNRM         = 1,    /* Undelete */
        EXT4_INODE_COMPR        = 2,    /* Compress file */
        EXT4_INODE_SYNC         = 3,    /* Synchronous updates */
        EXT4_INODE_IMMUTABLE    = 4,    /* Immutable file */
        EXT4_INODE_APPEND       = 5,    /* writes to file may only append */
        EXT4_INODE_NODUMP       = 6,    /* do not dump file */
        EXT4_INODE_NOATIME      = 7,    /* do not update atime */
/* Reserved for compression usage... */
        EXT4_INODE_DIRTY        = 8,
        EXT4_INODE_COMPRBLK     = 9,    /* One or more compressed clusters */
        EXT4_INODE_NOCOMPR      = 10,   /* Don't compress */
        EXT4_INODE_ENCRYPT      = 11,   /* Encrypted file */
/* End compression flags --- maybe not all used */
        EXT4_INODE_INDEX        = 12,   /* hash-indexed directory */
        EXT4_INODE_IMAGIC       = 13,   /* AFS directory */
        EXT4_INODE_JOURNAL_DATA = 14,   /* file data should be journaled */
        EXT4_INODE_NOTAIL       = 15,   /* file tail should not be merged */
        EXT4_INODE_DIRSYNC      = 16,   /* dirsync behaviour (directories only) */
        EXT4_INODE_TOPDIR       = 17,   /* Top of directory hierarchies */
        EXT4_INODE_HUGE_FILE    = 18,   /* Set to each huge file */
        EXT4_INODE_EXTENTS      = 19,   /* Inode uses extents */
        EXT4_INODE_EA_INODE     = 21,   /* Inode used for large EA */
        EXT4_INODE_EOFBLOCKS    = 22,   /* Blocks allocated beyond EOF */
        EXT4_INODE_INLINE_DATA  = 28,   /* Data in inode. */
        EXT4_INODE_PROJINHERIT  = 29,   /* Create with parents projid */
        EXT4_INODE_RESERVED     = 31,   /* reserved for ext4 lib */
};
 465
 466/*
 467 * Since it's pretty easy to mix up bit numbers and hex values, we use a
 468 * build-time check to make sure that EXT4_XXX_FL is consistent with respect to
 469 * EXT4_INODE_XXX. If all is well, the macros will be dropped, so, it won't cost
 470 * any extra space in the compiled kernel image, otherwise, the build will fail.
 471 * It's important that these values are the same, since we are using
 472 * EXT4_INODE_XXX to test for flag values, but EXT4_XXX_FL must be consistent
 473 * with the values of FS_XXX_FL defined in include/linux/fs.h and the on-disk
 474 * values found in ext2, ext3 and ext4 filesystems, and of course the values
 475 * defined in e2fsprogs.
 476 *
 477 * It's not paranoia if the Murphy's Law really *is* out to get you.  :-)
 478 */
 479#define TEST_FLAG_VALUE(FLAG) (EXT4_##FLAG##_FL == (1 << EXT4_INODE_##FLAG))
 480#define CHECK_FLAG_VALUE(FLAG) BUILD_BUG_ON(!TEST_FLAG_VALUE(FLAG))
 481
/*
 * Build-time consistency check: one CHECK_FLAG_VALUE() per inode flag,
 * each failing the build if EXT4_<name>_FL does not match the bit
 * number EXT4_INODE_<name>.  The function takes no arguments and
 * returns nothing.
 */
static inline void ext4_check_flag_values(void)
{
        CHECK_FLAG_VALUE(SECRM);
        CHECK_FLAG_VALUE(UNRM);
        CHECK_FLAG_VALUE(COMPR);
        CHECK_FLAG_VALUE(SYNC);
        CHECK_FLAG_VALUE(IMMUTABLE);
        CHECK_FLAG_VALUE(APPEND);
        CHECK_FLAG_VALUE(NODUMP);
        CHECK_FLAG_VALUE(NOATIME);
        CHECK_FLAG_VALUE(DIRTY);
        CHECK_FLAG_VALUE(COMPRBLK);
        CHECK_FLAG_VALUE(NOCOMPR);
        CHECK_FLAG_VALUE(ENCRYPT);
        CHECK_FLAG_VALUE(INDEX);
        CHECK_FLAG_VALUE(IMAGIC);
        CHECK_FLAG_VALUE(JOURNAL_DATA);
        CHECK_FLAG_VALUE(NOTAIL);
        CHECK_FLAG_VALUE(DIRSYNC);
        CHECK_FLAG_VALUE(TOPDIR);
        CHECK_FLAG_VALUE(HUGE_FILE);
        CHECK_FLAG_VALUE(EXTENTS);
        CHECK_FLAG_VALUE(EA_INODE);
        CHECK_FLAG_VALUE(EOFBLOCKS);
        CHECK_FLAG_VALUE(INLINE_DATA);
        CHECK_FLAG_VALUE(PROJINHERIT);
        CHECK_FLAG_VALUE(RESERVED);
}
 510
/* Used to pass group descriptor data when online resize is done */
struct ext4_new_group_input {
        __u32 group;            /* Group number for this data */
        __u64 block_bitmap;     /* Absolute block number of block bitmap */
        __u64 inode_bitmap;     /* Absolute block number of inode bitmap */
        __u64 inode_table;      /* Absolute block number of inode table start */
        __u32 blocks_count;     /* Total number of blocks in this group */
        __u16 reserved_blocks;  /* Number of reserved blocks in this group */
        __u16 unused;
};

#if defined(__KERNEL__) && defined(CONFIG_COMPAT)
/*
 * Same fields as struct ext4_new_group_input, declared with compat_u64
 * for the 64-bit members; used by EXT4_IOC32_GROUP_ADD.
 */
struct compat_ext4_new_group_input {
        u32 group;
        compat_u64 block_bitmap;
        compat_u64 inode_bitmap;
        compat_u64 inode_table;
        u32 blocks_count;
        u16 reserved_blocks;
        u16 unused;
};
#endif

/* The struct ext4_new_group_input in kernel space, with free_blocks_count */
struct ext4_new_group_data {
        __u32 group;
        __u64 block_bitmap;
        __u64 inode_bitmap;
        __u64 inode_table;
        __u32 blocks_count;
        __u16 reserved_blocks;
        __u16 unused;
        __u32 free_blocks_count;
};

/*
 * Indexes used to index group tables in ext4_new_group_data.
 * GROUP_TABLE_COUNT comes last, so it equals the number of tables (3).
 */
enum {
        BLOCK_BITMAP = 0,       /* block bitmap */
        INODE_BITMAP,           /* inode bitmap */
        INODE_TABLE,            /* inode tables */
        GROUP_TABLE_COUNT,
};
 553
/*
 * Flags used by ext4_map_blocks()
 */
        /* Allocate any needed blocks and/or convert an unwritten
           extent to be an initialized extent */
#define EXT4_GET_BLOCKS_CREATE                  0x0001
        /* Request the creation of an unwritten extent */
#define EXT4_GET_BLOCKS_UNWRIT_EXT              0x0002
#define EXT4_GET_BLOCKS_CREATE_UNWRIT_EXT       (EXT4_GET_BLOCKS_UNWRIT_EXT|\
                                                 EXT4_GET_BLOCKS_CREATE)
        /* Caller is from the delayed allocation writeout path
         * finally doing the actual allocation of delayed blocks */
#define EXT4_GET_BLOCKS_DELALLOC_RESERVE        0x0004
        /* Caller is from the direct IO path: request creation of an
         * unwritten extent if not allocated, or split the unwritten
         * extent if blocks have already been preallocated */
#define EXT4_GET_BLOCKS_PRE_IO                  0x0008
#define EXT4_GET_BLOCKS_CONVERT                 0x0010
#define EXT4_GET_BLOCKS_IO_CREATE_EXT           (EXT4_GET_BLOCKS_PRE_IO|\
                                         EXT4_GET_BLOCKS_CREATE_UNWRIT_EXT)
        /* Convert extent to initialized after IO complete */
#define EXT4_GET_BLOCKS_IO_CONVERT_EXT          (EXT4_GET_BLOCKS_CONVERT|\
                                         EXT4_GET_BLOCKS_CREATE_UNWRIT_EXT)
        /* Eventual metadata allocation (due to growing extent tree)
         * should not fail, so try to use reserved blocks for that. */
#define EXT4_GET_BLOCKS_METADATA_NOFAIL         0x0020
        /* Don't normalize allocation size (used for fallocate) */
#define EXT4_GET_BLOCKS_NO_NORMALIZE            0x0040
        /* Request will not result in inode size update (used for fallocate) */
#define EXT4_GET_BLOCKS_KEEP_SIZE               0x0080
        /* Convert written extents to unwritten */
#define EXT4_GET_BLOCKS_CONVERT_UNWRITTEN       0x0100
        /* Write zeros to newly created written extents */
#define EXT4_GET_BLOCKS_ZERO                    0x0200
#define EXT4_GET_BLOCKS_CREATE_ZERO             (EXT4_GET_BLOCKS_CREATE |\
                                        EXT4_GET_BLOCKS_ZERO)
        /* Caller will submit data before dropping transaction handle. This
         * allows jbd2 to avoid submitting data before commit. */
#define EXT4_GET_BLOCKS_IO_SUBMIT               0x0400
 593
/*
 * The bit position of these flags must not overlap with any of the
 * EXT4_GET_BLOCKS_*.  They are used by ext4_find_extent(),
 * read_extent_tree_block(), ext4_split_extent_at(),
 * ext4_ext_insert_extent(), and ext4_ext_create_new_leaf().
 * EXT4_EX_NOCACHE is used to indicate that we shouldn't be
 * caching the extents when reading from the extent tree while a
 * truncate or punch hole operation is in progress.
 */
#define EXT4_EX_NOCACHE                         0x40000000
#define EXT4_EX_FORCE_CACHE                     0x20000000
 605
/*
 * Flags used by ext4_free_blocks
 *
 * Each flag is a distinct bit, so they can be OR-ed together.
 */
#define EXT4_FREE_BLOCKS_METADATA       0x0001
#define EXT4_FREE_BLOCKS_FORGET         0x0002
#define EXT4_FREE_BLOCKS_VALIDATED      0x0004
#define EXT4_FREE_BLOCKS_NO_QUOT_UPDATE 0x0008
#define EXT4_FREE_BLOCKS_NOFREE_FIRST_CLUSTER   0x0010
#define EXT4_FREE_BLOCKS_NOFREE_LAST_CLUSTER    0x0020
 615
/*
 * ioctl commands
 *
 * ext4-specific commands use the 'f' ioctl type; the remaining names
 * are aliases for the generic FS_IOC_* commands.
 */
#define EXT4_IOC_GETFLAGS               FS_IOC_GETFLAGS
#define EXT4_IOC_SETFLAGS               FS_IOC_SETFLAGS
#define EXT4_IOC_GETVERSION             _IOR('f', 3, long)
#define EXT4_IOC_SETVERSION             _IOW('f', 4, long)
#define EXT4_IOC_GETVERSION_OLD         FS_IOC_GETVERSION
#define EXT4_IOC_SETVERSION_OLD         FS_IOC_SETVERSION
#define EXT4_IOC_GETRSVSZ               _IOR('f', 5, long)
#define EXT4_IOC_SETRSVSZ               _IOW('f', 6, long)
#define EXT4_IOC_GROUP_EXTEND           _IOW('f', 7, unsigned long)
#define EXT4_IOC_GROUP_ADD              _IOW('f', 8, struct ext4_new_group_input)
#define EXT4_IOC_MIGRATE                _IO('f', 9)
 /* note ioctl 10 reserved for an early version of the FIEMAP ioctl */
 /* note ioctl 11 reserved for filesystem-independent FIEMAP ioctl */
#define EXT4_IOC_ALLOC_DA_BLKS          _IO('f', 12)
 /* note: numbers 13 and 14 are not assigned in this list */
#define EXT4_IOC_MOVE_EXT               _IOWR('f', 15, struct move_extent)
#define EXT4_IOC_RESIZE_FS              _IOW('f', 16, __u64)
#define EXT4_IOC_SWAP_BOOT              _IO('f', 17)
#define EXT4_IOC_PRECACHE_EXTENTS       _IO('f', 18)
#define EXT4_IOC_SET_ENCRYPTION_POLICY  FS_IOC_SET_ENCRYPTION_POLICY
#define EXT4_IOC_GET_ENCRYPTION_PWSALT  FS_IOC_GET_ENCRYPTION_PWSALT
#define EXT4_IOC_GET_ENCRYPTION_POLICY  FS_IOC_GET_ENCRYPTION_POLICY
 640
#ifndef FS_IOC_FSGETXATTR
/* Until the uapi changes get merged for project quota... */
/*
 * Fallback definitions, compiled only when FS_IOC_FSGETXATTR has not
 * already been defined by an earlier header.
 */

#define FS_IOC_FSGETXATTR               _IOR('X', 31, struct fsxattr)
#define FS_IOC_FSSETXATTR               _IOW('X', 32, struct fsxattr)

/*
 * Structure for FS_IOC_FSGETXATTR and FS_IOC_FSSETXATTR.
 */
struct fsxattr {
        __u32           fsx_xflags;     /* xflags field value (get/set) */
        __u32           fsx_extsize;    /* extsize field value (get/set)*/
        __u32           fsx_nextents;   /* nextents field value (get)   */
        __u32           fsx_projid;     /* project identifier (get/set) */
        unsigned char   fsx_pad[12];
};

/*
 * Flags for the fsx_xflags field
 */
#define FS_XFLAG_REALTIME       0x00000001      /* data in realtime volume */
#define FS_XFLAG_PREALLOC       0x00000002      /* preallocated file extents */
#define FS_XFLAG_IMMUTABLE      0x00000008      /* file cannot be modified */
#define FS_XFLAG_APPEND         0x00000010      /* all writes append */
#define FS_XFLAG_SYNC           0x00000020      /* all writes synchronous */
#define FS_XFLAG_NOATIME        0x00000040      /* do not update access time */
#define FS_XFLAG_NODUMP         0x00000080      /* do not include in backups */
#define FS_XFLAG_RTINHERIT      0x00000100      /* create with rt bit set */
#define FS_XFLAG_PROJINHERIT    0x00000200      /* create with parents projid */
#define FS_XFLAG_NOSYMLINKS     0x00000400      /* disallow symlink creation */
#define FS_XFLAG_EXTSIZE        0x00000800      /* extent size allocator hint */
#define FS_XFLAG_EXTSZINHERIT   0x00001000      /* inherit inode extent size */
#define FS_XFLAG_NODEFRAG       0x00002000      /* do not defragment */
#define FS_XFLAG_FILESTREAM     0x00004000      /* use filestream allocator */
#define FS_XFLAG_HASATTR        0x80000000      /* no DIFLAG for this */
#endif /* !defined(FS_IOC_FSGETXATTR) */

/* ext4 names for the generic fsxattr ioctls */
#define EXT4_IOC_FSGETXATTR             FS_IOC_FSGETXATTR
#define EXT4_IOC_FSSETXATTR             FS_IOC_FSSETXATTR
 680
 681#if defined(__KERNEL__) && defined(CONFIG_COMPAT)
 682/*
 683 * ioctl commands in 32 bit emulation (only built in-kernel with CONFIG_COMPAT)
 684 */
 685#define EXT4_IOC32_GETFLAGS             FS_IOC32_GETFLAGS
 686#define EXT4_IOC32_SETFLAGS             FS_IOC32_SETFLAGS
 687#define EXT4_IOC32_GETVERSION           _IOR('f', 3, int)
 688#define EXT4_IOC32_SETVERSION           _IOW('f', 4, int)
 689#define EXT4_IOC32_GETRSVSZ             _IOR('f', 5, int)
 690#define EXT4_IOC32_SETRSVSZ             _IOW('f', 6, int)
 691#define EXT4_IOC32_GROUP_EXTEND         _IOW('f', 7, unsigned int)
 692#define EXT4_IOC32_GROUP_ADD            _IOW('f', 8, struct compat_ext4_new_group_input)
 693#define EXT4_IOC32_GETVERSION_OLD       FS_IOC32_GETVERSION
 694#define EXT4_IOC32_SETVERSION_OLD       FS_IOC32_SETVERSION
 695#endif /* __KERNEL__ && CONFIG_COMPAT */
 696
 697/* Highest physical block number we can address without extents (32-bit limit) */
 698#define EXT4_MAX_BLOCK_FILE_PHYS        0xFFFFFFFF
 699
 700/*
 701 * Structure of an inode on the disk (multi-byte fields are little-endian)
 702 */
 703struct ext4_inode {
 704        __le16  i_mode;         /* File mode */
 705        __le16  i_uid;          /* Low 16 bits of Owner Uid */
 706        __le32  i_size_lo;      /* Size in bytes (low 32 bits) */
 707        __le32  i_atime;        /* Access time */
 708        __le32  i_ctime;        /* Inode Change time */
 709        __le32  i_mtime;        /* Modification time */
 710        __le32  i_dtime;        /* Deletion Time */
 711        __le16  i_gid;          /* Low 16 bits of Group Id */
 712        __le16  i_links_count;  /* Links count */
 713        __le32  i_blocks_lo;    /* Blocks count (low 32 bits) */
 714        __le32  i_flags;        /* File flags */
 715        union {
 716                struct {
 717                        __le32  l_i_version;    /* aliased as i_disk_version */
 718                } linux1;
 719                struct {
 720                        __u32  h_i_translator;
 721                } hurd1;
 722                struct {
 723                        __u32  m_i_reserved1;
 724                } masix1;
 725        } osd1;                         /* OS dependent 1 */
 726        __le32  i_block[EXT4_N_BLOCKS];/* Pointers to blocks */
 727        __le32  i_generation;   /* File version (for NFS) */
 728        __le32  i_file_acl_lo;  /* File ACL (low 32 bits) */
 729        __le32  i_size_high;    /* Size in bytes (high 32 bits) */
 730        __le32  i_obso_faddr;   /* Obsoleted fragment address */
 731        union {
 732                struct {
 733                        __le16  l_i_blocks_high; /* were l_i_reserved1 */
 734                        __le16  l_i_file_acl_high;
 735                        __le16  l_i_uid_high;   /* these 2 fields */
 736                        __le16  l_i_gid_high;   /* were reserved2[0] */
 737                        __le16  l_i_checksum_lo;/* crc32c(uuid+inum+inode) LE */
 738                        __le16  l_i_reserved;
 739                } linux2;
 740                struct {
 741                        __le16  h_i_reserved1;  /* Obsoleted fragment number/size which are removed in ext4 */
 742                        __u16   h_i_mode_high;
 743                        __u16   h_i_uid_high;
 744                        __u16   h_i_gid_high;
 745                        __u32   h_i_author;
 746                } hurd2;
 747                struct {
 748                        __le16  h_i_reserved1;  /* Obsoleted fragment number/size which are removed in ext4 */
 749                        __le16  m_i_file_acl_high;
 750                        __u32   m_i_reserved2[2];
 751                } masix2;
 752        } osd2;                         /* OS dependent 2 */
 753        __le16  i_extra_isize;  /* Bytes in use beyond EXT4_GOOD_OLD_INODE_SIZE */
 754        __le16  i_checksum_hi;  /* crc32c(uuid+inum+inode) BE */
 755        __le32  i_ctime_extra;  /* extra Change time      (nsec << 2 | epoch) */
 756        __le32  i_mtime_extra;  /* extra Modification time(nsec << 2 | epoch) */
 757        __le32  i_atime_extra;  /* extra Access time      (nsec << 2 | epoch) */
 758        __le32  i_crtime;       /* File Creation time */
 759        __le32  i_crtime_extra; /* extra FileCreationtime (nsec << 2 | epoch) */
 760        __le32  i_version_hi;   /* high 32 bits for 64-bit version */
 761        __le32  i_projid;       /* Project ID */
 762};
 763/* Parameters for moving a range of blocks involving an orig file and a donor fd */
 764struct move_extent {
 765        __u32 reserved;         /* should be zero */
 766        __u32 donor_fd;         /* donor file descriptor */
 767        __u64 orig_start;       /* logical start offset in block for orig */
 768        __u64 donor_start;      /* logical start offset in block for donor */
 769        __u64 len;              /* block length to be moved */
 770        __u64 moved_len;        /* moved block length */
 771};
 772/* xtime ## _extra layout: low EXT4_EPOCH_BITS bits = epoch, remaining bits = nsec */
 773#define EXT4_EPOCH_BITS 2
 774#define EXT4_EPOCH_MASK ((1 << EXT4_EPOCH_BITS) - 1)
 775#define EXT4_NSEC_MASK  (~0UL << EXT4_EPOCH_BITS)
 776
 777/*
 778 * Extended fields will fit into an inode if the filesystem was formatted
 779 * with large inodes (-I 256 or larger) and there are not currently any EAs
 780 * consuming all of the available space. For new inodes we always reserve
 781 * enough space for the kernel's known extended fields, but for inodes
 782 * created with an old kernel this might not have been the case. None of
 783 * the extended inode fields is critical for correct filesystem operation.
 784 * This macro is true when 'field' of the raw inode 'ext4_inode' ends within
 785 * EXT4_GOOD_OLD_INODE_SIZE + (einode)->i_extra_isize bytes (the inode size).
 786 */
 787#define EXT4_FITS_IN_INODE(ext4_inode, einode, field)   \
 788        ((offsetof(typeof(*(ext4_inode)), field) +      \
 789          sizeof((ext4_inode)->field))                  \
 790        <= (EXT4_GOOD_OLD_INODE_SIZE +                  \
 791            (einode)->i_extra_isize))
 792
 793/*
 794 * We use an encoding that preserves the times for extra epoch "00":
 795 *
 796 * extra  msb of                         adjust for signed
 797 * epoch  32-bit                         32-bit tv_sec to
 798 * bits   time    decoded 64-bit tv_sec  64-bit tv_sec      valid time range
 799 * 0 0    1    -0x80000000..-0x00000001  0x000000000 1901-12-13..1969-12-31
 800 * 0 0    0    0x000000000..0x07fffffff  0x000000000 1970-01-01..2038-01-19
 801 * 0 1    1    0x080000000..0x0ffffffff  0x100000000 2038-01-19..2106-02-07
 802 * 0 1    0    0x100000000..0x17fffffff  0x100000000 2106-02-07..2174-02-25
 803 * 1 0    1    0x180000000..0x1ffffffff  0x200000000 2174-02-25..2242-03-16
 804 * 1 0    0    0x200000000..0x27fffffff  0x200000000 2242-03-16..2310-04-04
 805 * 1 1    1    0x280000000..0x2ffffffff  0x300000000 2310-04-04..2378-04-22
 806 * 1 1    0    0x300000000..0x37fffffff  0x300000000 2378-04-22..2446-05-10
 807 *
 808 * Note that previous versions of the kernel on 64-bit systems would
 809 * incorrectly use extra epoch bits 1,1 for dates between 1901 and
 810 * 1970.  e2fsck will correct this, assuming that it is run on the
 811 * affected filesystem before 2242.
 812 */
 813/* Build the on-disk xtime ## _extra word: (nsec << EXT4_EPOCH_BITS) | epoch bits */
 814static inline __le32 ext4_encode_extra_time(struct timespec *time)
 815{
 816        u32 epoch = sizeof(time->tv_sec) <= 4 ? 0 :
 817                ((time->tv_sec - (s32)time->tv_sec) >> 32) & EXT4_EPOCH_MASK;
 818        return cpu_to_le32((time->tv_nsec << EXT4_EPOCH_BITS) | epoch);
 819}
 820/* Apply an on-disk xtime ## _extra word to *time; tv_sec must already hold the 32-bit seconds */
 821static inline void ext4_decode_extra_time(struct timespec *time, __le32 extra)
 822{
 823        if (unlikely(sizeof(time->tv_sec) > 4 &&
 824                        (extra & cpu_to_le32(EXT4_EPOCH_MASK)))) {
 825#if LINUX_VERSION_CODE < KERNEL_VERSION(4,20,0)
 826                /* Handle legacy encoding of pre-1970 dates with epoch
 827                 * bits 1,1.  We assume that by kernel version 4.20,
 828                 * everyone will have run fsck over the affected
 829                 * filesystems to correct the problem.  (This
 830                 * backwards compatibility may be removed before this
 831                 * time, at the discretion of the ext4 developers.)
 832                 */
 833                u64 extra_bits = le32_to_cpu(extra) & EXT4_EPOCH_MASK;
 834                if (extra_bits == 3 && ((time->tv_sec) & 0x80000000) != 0)
 835                        extra_bits = 0; /* legacy pre-1970 value: add no epoch */
 836                time->tv_sec += extra_bits << 32;
 837#else
 838                time->tv_sec += (u64)(le32_to_cpu(extra) & EXT4_EPOCH_MASK) << 32;
 839#endif /* LINUX_VERSION_CODE < KERNEL_VERSION(4,20,0) */
 840        }
 841        time->tv_nsec = (le32_to_cpu(extra) & EXT4_NSEC_MASK) >> EXT4_EPOCH_BITS;
 842}
 843/* Store (inode)->xtime in the raw inode; the _extra word is written only if it fits */
 844#define EXT4_INODE_SET_XTIME(xtime, inode, raw_inode)                          \
 845do {                                                                           \
 846        (raw_inode)->xtime = cpu_to_le32((inode)->xtime.tv_sec);               \
 847        if (EXT4_FITS_IN_INODE(raw_inode, EXT4_I(inode), xtime ## _extra))     \
 848                (raw_inode)->xtime ## _extra =                                 \
 849                                ext4_encode_extra_time(&(inode)->xtime);       \
 850} while (0)
 851/* Same for a time kept in einode itself; here the seconds field is also size-checked */
 852#define EXT4_EINODE_SET_XTIME(xtime, einode, raw_inode)                        \
 853do {                                                                           \
 854        if (EXT4_FITS_IN_INODE(raw_inode, einode, xtime))                      \
 855                (raw_inode)->xtime = cpu_to_le32((einode)->xtime.tv_sec);      \
 856        if (EXT4_FITS_IN_INODE(raw_inode, einode, xtime ## _extra))            \
 857                (raw_inode)->xtime ## _extra =                                 \
 858                                ext4_encode_extra_time(&(einode)->xtime);      \
 859} while (0)
 860/* Load (inode)->xtime from the raw inode; tv_nsec is 0 when xtime ## _extra does not fit */
 861#define EXT4_INODE_GET_XTIME(xtime, inode, raw_inode)                          \
 862do {                                                                           \
 863        (inode)->xtime.tv_sec = (signed)le32_to_cpu((raw_inode)->xtime);       \
 864        if (EXT4_FITS_IN_INODE(raw_inode, EXT4_I(inode), xtime ## _extra))     \
 865                ext4_decode_extra_time(&(inode)->xtime,                        \
 866                                       (raw_inode)->xtime ## _extra);          \
 867        else                                                                   \
 868                (inode)->xtime.tv_nsec = 0;                                    \
 869} while (0)
 870/* Same for a time kept in einode itself; tv_sec is 0 when the seconds field does not fit */
 871#define EXT4_EINODE_GET_XTIME(xtime, einode, raw_inode)                        \
 872do {                                                                           \
 873        if (EXT4_FITS_IN_INODE(raw_inode, einode, xtime))                      \
 874                (einode)->xtime.tv_sec =                                       \
 875                        (signed)le32_to_cpu((raw_inode)->xtime);               \
 876        else                                                                   \
 877                (einode)->xtime.tv_sec = 0;                                    \
 878        if (EXT4_FITS_IN_INODE(raw_inode, einode, xtime ## _extra))            \
 879                ext4_decode_extra_time(&(einode)->xtime,                       \
 880                                       (raw_inode)->xtime ## _extra);          \
 881        else                                                                   \
 882                (einode)->xtime.tv_nsec = 0;                                   \
 883} while (0)
 884/* Shorthand names for the OS-dependent union members of struct ext4_inode */
 885#define i_disk_version osd1.linux1.l_i_version
 886
 887#if defined(__KERNEL__) || defined(__linux__)
 888#define i_reserved1     osd1.linux1.l_i_reserved1 /* NOTE(review): linux1 declares only l_i_version; alias looks stale */
 889#define i_file_acl_high osd2.linux2.l_i_file_acl_high
 890#define i_blocks_high   osd2.linux2.l_i_blocks_high
 891#define i_uid_low       i_uid
 892#define i_gid_low       i_gid
 893#define i_uid_high      osd2.linux2.l_i_uid_high
 894#define i_gid_high      osd2.linux2.l_i_gid_high
 895#define i_checksum_lo   osd2.linux2.l_i_checksum_lo
 896
 897#elif defined(__GNU__)
 898
 899#define i_translator    osd1.hurd1.h_i_translator
 900#define i_uid_high      osd2.hurd2.h_i_uid_high
 901#define i_gid_high      osd2.hurd2.h_i_gid_high
 902#define i_author        osd2.hurd2.h_i_author
 903
 904#elif defined(__masix__)
 905
 906#define i_reserved1     osd1.masix1.m_i_reserved1
 907#define i_file_acl_high osd2.masix2.m_i_file_acl_high
 908#define i_reserved2     osd2.masix2.m_i_reserved2
 909
 910#endif /* defined(__KERNEL__) || defined(__linux__) */
 911
 912#include "extents_status.h"
 913
 914/*
 915 * Lock subclasses for i_data_sem in the ext4_inode_info structure.
 916 *
 917 * These are needed to avoid lockdep false positives when we need to
 918 * allocate blocks to the quota inode during ext4_map_blocks(), while
 919 * holding i_data_sem for a normal (non-quota) inode.  Since we don't
 920 * do quota tracking for the quota inode, this avoids deadlock (as
 921 * well as infinite recursion, since it isn't turtles all the way
 922 * down...)
 923 *
 924 *  I_DATA_SEM_NORMAL - Used for most inodes
 925 *  I_DATA_SEM_OTHER  - Used by move_inode.c for the second normal inode
 926 *                        where the second inode has a larger inode number
 927 *                        than the first
 928 *  I_DATA_SEM_QUOTA  - Used for quota inodes only
 929 */
 930enum {
 931        I_DATA_SEM_NORMAL = 0,  /* most inodes */
 932        I_DATA_SEM_OTHER,       /* second normal inode of a pair */
 933        I_DATA_SEM_QUOTA,       /* quota inodes only */
 934};
 935
 936
 937/*
 938 * fourth extended file system inode data in memory
 939 */
 940struct ext4_inode_info {
 941        __le32  i_data[15];     /* unconverted (still little-endian) */
 942        __u32   i_dtime;
 943        ext4_fsblk_t    i_file_acl;
 944
 945        /*
 946         * i_block_group is the number of the block group which contains
 947         * this file's inode.  Constant across the lifetime of the inode,
 948         * it is used for making block allocation decisions - we try to
 949         * place a file's data blocks near its inode block, and new inodes
 950         * near to their parent directory's inode.
 951         */
 952        ext4_group_t    i_block_group;
 953        ext4_lblk_t     i_dir_start_lookup;
 954#if (BITS_PER_LONG < 64)
 955        unsigned long   i_state_flags;          /* Dynamic state flags */
 956#endif
 957        unsigned long   i_flags;
 958
 959        /*
 960         * Extended attributes can be read independently of the main file
 961         * data. Taking i_mutex even when reading would cause contention
 962         * between readers of EAs and writers of regular file data, so
 963         * instead we synchronize on xattr_sem when reading or changing
 964         * EAs.
 965         */
 966        struct rw_semaphore xattr_sem;
 967
 968        struct list_head i_orphan;      /* unlinked but open inodes */
 969
 970        /*
 971         * i_disksize keeps track of what the inode size is ON DISK, not
 972         * in memory.  During truncate, i_size is set to the new size by
 973         * the VFS prior to calling ext4_truncate(), but the filesystem won't
 974         * set i_disksize to 0 until the truncate is actually under way.
 975         *
 976         * The intent is that i_disksize always represents the blocks which
 977         * are used by this file.  This allows recovery to restart truncate
 978         * on orphans if we crash during truncate.  We actually write i_disksize
 979         * into the on-disk inode when writing inodes out, instead of i_size.
 980         *
 981         * The only time when i_disksize and i_size may be different is when
 982         * a truncate is in progress.  The only things which change i_disksize
 983         * are ext4_get_block (growth) and ext4_truncate (shrinkth).
 984         */
 985        loff_t  i_disksize;
 986
 987        /*
 988         * i_data_sem is for serialising ext4_truncate() against
 989         * ext4_getblock().  In the 2.4 ext2 design, great chunks of inode's
 990         * data tree are chopped off during truncate. We can't do that in
 991         * ext4 because whenever we perform intermediate commits during
 992         * truncate, the inode and all the metadata blocks *must* be in a
 993         * consistent state which allows truncation of the orphans to restart
 994         * during recovery.  Hence we must fix the get_block-vs-truncate race
 995         * by other means, so we have i_data_sem.
 996         */
 997        struct rw_semaphore i_data_sem;
 998        /*
 999         * i_mmap_sem is for serializing page faults with truncate / punch hole
1000         * operations. We have to make sure that new page cannot be faulted in
1001         * a section of the inode that is being punched. We cannot easily use
1002         * i_data_sem for this since we need protection for the whole punch
1003         * operation and i_data_sem ranks below transaction start so we have
1004         * to occasionally drop it.
1005         */
1006        struct rw_semaphore i_mmap_sem;
1007        struct inode vfs_inode; /* embedded VFS inode */
1008        struct jbd2_inode *jinode;
1009
1010        spinlock_t i_raw_lock;  /* protects updates to the raw inode */
1011
1012        /*
1013         * File creation time. Its function is same as that of
1014         * struct timespec i_{a,c,m}time in the generic inode.
1015         */
1016        struct timespec i_crtime;
1017
1018        /* mballoc */
1019        struct list_head i_prealloc_list;
1020        spinlock_t i_prealloc_lock;
1021
1022        /* extents status tree */
1023        struct ext4_es_tree i_es_tree;
1024        rwlock_t i_es_lock;
1025        struct list_head i_es_list;
1026        unsigned int i_es_all_nr;       /* protected by i_es_lock */
1027        unsigned int i_es_shk_nr;       /* protected by i_es_lock */
1028        ext4_lblk_t i_es_shrink_lblk;   /* Offset where we start searching for
1029                                           extents to shrink. Protected by
1030                                           i_es_lock  */
1031
1032        /* ialloc */
1033        ext4_group_t    i_last_alloc_group;
1034
1035        /* allocation reservation info for delalloc */
1036        /* In case of bigalloc, these refer to clusters rather than blocks */
1037        unsigned int i_reserved_data_blocks;
1038        unsigned int i_reserved_meta_blocks;
1039        unsigned int i_allocated_meta_blocks;
1040        ext4_lblk_t i_da_metadata_calc_last_lblock;
1041        int i_da_metadata_calc_len;
1042
1043        /* on-disk additional length */
1044        __u16 i_extra_isize;
1045
1046        /* Indicate the inline data space. */
1047        u16 i_inline_off;
1048        u16 i_inline_size;
1049
1050#ifdef CONFIG_QUOTA
1051        /* quota space reservation, managed internally by quota code */
1052        qsize_t i_reserved_quota;
1053#endif
1054
1055        /* Lock protecting lists below */
1056        spinlock_t i_completed_io_lock;
1057        /*
1058         * Completed IOs that need unwritten extents handling and have
1059         * transaction reserved
1060         */
1061        struct list_head i_rsv_conversion_list;
1062        struct work_struct i_rsv_conversion_work;
1063        atomic_t i_unwritten; /* Nr. of inflight conversions pending */
1064
1065        spinlock_t i_block_reservation_lock;
1066
1067        /*
1068         * Transactions that contain inode's metadata needed to complete
1069         * fsync and fdatasync, respectively.
1070         */
1071        tid_t i_sync_tid;
1072        tid_t i_datasync_tid;
1073
1074#ifdef CONFIG_QUOTA
1075        struct dquot *i_dquot[MAXQUOTAS];
1076#endif
1077
1078        /* Precomputed uuid+inum+igen checksum for seeding inode checksums */
1079        __u32 i_csum_seed;
1080
1081        kprojid_t i_projid;
1082};
1083
1084/*
1085 * File system states (NOTE(review): presumably bits of the superblock s_state field - confirm)
1086 */
1087#define EXT4_VALID_FS                   0x0001  /* Unmounted cleanly */
1088#define EXT4_ERROR_FS                   0x0002  /* Errors detected */
1089#define EXT4_ORPHAN_FS                  0x0004  /* Orphans being recovered */
1090
1091/*
1092 * Misc. filesystem flags (NOTE(review): presumably bits of the superblock s_flags field - confirm)
1093 */
1094#define EXT2_FLAGS_SIGNED_HASH          0x0001  /* Signed dirhash in use */
1095#define EXT2_FLAGS_UNSIGNED_HASH        0x0002  /* Unsigned dirhash in use */
1096#define EXT2_FLAGS_TEST_FILESYS         0x0004  /* to test development code */
1097
1098/*
1099 * Mount flags set via mount options or defaults (used with the *_opt() macros)
1100 */
1101#define EXT4_MOUNT_GRPID                0x00004 /* Create files with directory's group */
1102#define EXT4_MOUNT_DEBUG                0x00008 /* Some debugging messages */
1103#define EXT4_MOUNT_ERRORS_CONT          0x00010 /* Continue on errors */
1104#define EXT4_MOUNT_ERRORS_RO            0x00020 /* Remount fs ro on errors */
1105#define EXT4_MOUNT_ERRORS_PANIC         0x00040 /* Panic on errors */
1106#define EXT4_MOUNT_ERRORS_MASK          0x00070
1107#define EXT4_MOUNT_MINIX_DF             0x00080 /* Mimics the Minix statfs */
1108#define EXT4_MOUNT_NOLOAD               0x00100 /* Don't use existing journal*/
1109#ifdef CONFIG_FS_DAX
1110#define EXT4_MOUNT_DAX                  0x00200 /* Direct Access */
1111#else
1112#define EXT4_MOUNT_DAX                  0 /* test_opt(sb, DAX) is then always 0 */
1113#endif /* CONFIG_FS_DAX */
1114#define EXT4_MOUNT_DATA_FLAGS           0x00C00 /* Mask covering the data write modes: */
1115#define EXT4_MOUNT_JOURNAL_DATA         0x00400 /* Write data to journal */
1116#define EXT4_MOUNT_ORDERED_DATA         0x00800 /* Flush data before commit */
1117#define EXT4_MOUNT_WRITEBACK_DATA       0x00C00 /* No data ordering */
1118#define EXT4_MOUNT_UPDATE_JOURNAL       0x01000 /* Update the journal format */
1119#define EXT4_MOUNT_NO_UID32             0x02000  /* Disable 32-bit UIDs */
1120#define EXT4_MOUNT_XATTR_USER           0x04000 /* Extended user attributes */
1121#define EXT4_MOUNT_POSIX_ACL            0x08000 /* POSIX Access Control Lists */
1122#define EXT4_MOUNT_NO_AUTO_DA_ALLOC     0x10000 /* No auto delalloc mapping */
1123#define EXT4_MOUNT_BARRIER              0x20000 /* Use block barriers */
1124#define EXT4_MOUNT_QUOTA                0x40000 /* Some quota option set */
1125#define EXT4_MOUNT_USRQUOTA             0x80000 /* "old" user quota,
1126                                                 * enable enforcement for hidden
1127                                                 * quota files */
1128#define EXT4_MOUNT_GRPQUOTA             0x100000 /* "old" group quota, enable
1129                                                  * enforcement for hidden quota
1130                                                  * files */
1131#define EXT4_MOUNT_PRJQUOTA             0x200000 /* Enable project quota
1132                                                  * enforcement */
1133#define EXT4_MOUNT_DIOREAD_NOLOCK       0x400000 /* Enable support for dio read nolocking */
1134#define EXT4_MOUNT_JOURNAL_CHECKSUM     0x800000 /* Journal checksums */
1135#define EXT4_MOUNT_JOURNAL_ASYNC_COMMIT 0x1000000 /* Journal Async Commit */
1136#define EXT4_MOUNT_DELALLOC             0x8000000 /* Delalloc support */
1137#define EXT4_MOUNT_DATA_ERR_ABORT       0x10000000 /* Abort on file data write */
1138#define EXT4_MOUNT_BLOCK_VALIDITY       0x20000000 /* Block validity checking */
1139#define EXT4_MOUNT_DISCARD              0x40000000 /* Issue DISCARD requests */
1140#define EXT4_MOUNT_INIT_INODE_TABLE     0x80000000 /* Initialize uninitialized itables */
1141
1142/*
1143 * Mount flags set either automatically (could not be set by mount option)
1144 * based on per file system feature or property or in special cases such as
1145 * distinguishing between explicit mount option definition and default.
1146 * These are the EXT4_MOUNT2_* bits used with the *_opt2() macros.
1147 */
1147#define EXT4_MOUNT2_EXPLICIT_DELALLOC   0x00000001 /* User explicitly
1148                                                      specified delalloc */
1149#define EXT4_MOUNT2_STD_GROUP_SIZE      0x00000002 /* We have standard group
1150                                                      size of blocksize * 8
1151                                                      blocks */
1152#define EXT4_MOUNT2_HURD_COMPAT         0x00000004 /* Support HURD-castrated
1153                                                      file systems */
1154
1155#define EXT4_MOUNT2_EXPLICIT_JOURNAL_CHECKSUM   0x00000008 /* User explicitly
1156                                                specified journal checksum */
1157/* Mount-option helpers on s_mount_opt; each expansion is one parenthesized expression */
1158#define clear_opt(sb, opt)              (EXT4_SB(sb)->s_mount_opt &= \
1159                                                ~EXT4_MOUNT_##opt)
1160#define set_opt(sb, opt)                (EXT4_SB(sb)->s_mount_opt |= \
1161                                                EXT4_MOUNT_##opt)
1162#define test_opt(sb, opt)               (EXT4_SB(sb)->s_mount_opt & \
1163                                         EXT4_MOUNT_##opt)
1164/* Same helpers for the EXT4_MOUNT2_* bits kept in s_mount_opt2 */
1165#define clear_opt2(sb, opt)             (EXT4_SB(sb)->s_mount_opt2 &= \
1166                                                ~EXT4_MOUNT2_##opt)
1167#define set_opt2(sb, opt)               (EXT4_SB(sb)->s_mount_opt2 |= \
1168                                                EXT4_MOUNT2_##opt)
1169#define test_opt2(sb, opt)              (EXT4_SB(sb)->s_mount_opt2 & \
1170                                         EXT4_MOUNT2_##opt)
1171/* ext4 bitmap helpers: aliases for the *_le bitops; the atomic ones reuse the ext2 names */
1172#define ext4_test_and_set_bit           __test_and_set_bit_le
1173#define ext4_set_bit                    __set_bit_le
1174#define ext4_set_bit_atomic             ext2_set_bit_atomic
1175#define ext4_test_and_clear_bit         __test_and_clear_bit_le
1176#define ext4_clear_bit                  __clear_bit_le
1177#define ext4_clear_bit_atomic           ext2_clear_bit_atomic
1178#define ext4_test_bit                   test_bit_le
1179#define ext4_find_next_zero_bit         find_next_zero_bit_le
1180#define ext4_find_next_bit              find_next_bit_le
1181
1182extern void ext4_set_bits(void *bm, int cur, int len);
1183
1184/*
1185 * Default maximum mount count and check interval between two filesystem checks
1186 */
1187#define EXT4_DFL_MAX_MNT_COUNT          20      /* Allow 20 mounts */
1188#define EXT4_DFL_CHECKINTERVAL          0       /* Don't use interval check */
1189
1190/*
1191 * Behaviour when detecting errors (cf. the superblock s_errors field)
1192 */
1193#define EXT4_ERRORS_CONTINUE            1       /* Continue execution */
1194#define EXT4_ERRORS_RO                  2       /* Remount fs read-only */
1195#define EXT4_ERRORS_PANIC               3       /* Panic */
1196#define EXT4_ERRORS_DEFAULT             EXT4_ERRORS_CONTINUE
1197
1198/* Metadata checksum algorithm codes (cf. the superblock s_checksum_type field) */
1199#define EXT4_CRC32C_CHKSUM              1
1200
1201/*
1202 * Structure of the super block
1203 */
1204struct ext4_super_block {
1205/*00*/  __le32  s_inodes_count;         /* Inodes count */
1206        __le32  s_blocks_count_lo;      /* Blocks count */
1207        __le32  s_r_blocks_count_lo;    /* Reserved blocks count */
1208        __le32  s_free_blocks_count_lo; /* Free blocks count */
1209/*10*/  __le32  s_free_inodes_count;    /* Free inodes count */
1210        __le32  s_first_data_block;     /* First Data Block */
1211        __le32  s_log_block_size;       /* Block size */
1212        __le32  s_log_cluster_size;     /* Allocation cluster size */
1213/*20*/  __le32  s_blocks_per_group;     /* # Blocks per group */
1214        __le32  s_clusters_per_group;   /* # Clusters per group */
1215        __le32  s_inodes_per_group;     /* # Inodes per group */
1216        __le32  s_mtime;                /* Mount time */
1217/*30*/  __le32  s_wtime;                /* Write time */
1218        __le16  s_mnt_count;            /* Mount count */
1219        __le16  s_max_mnt_count;        /* Maximal mount count */
1220        __le16  s_magic;                /* Magic signature */
1221        __le16  s_state;                /* File system state */
1222        __le16  s_errors;               /* Behaviour when detecting errors */
1223        __le16  s_minor_rev_level;      /* minor revision level */
1224/*40*/  __le32  s_lastcheck;            /* time of last check */
1225        __le32  s_checkinterval;        /* max. time between checks */
1226        __le32  s_creator_os;           /* OS */
1227        __le32  s_rev_level;            /* Revision level */
1228/*50*/  __le16  s_def_resuid;           /* Default uid for reserved blocks */
1229        __le16  s_def_resgid;           /* Default gid for reserved blocks */
1230        /*
1231         * These fields are for EXT4_DYNAMIC_REV superblocks only.
1232         *
1233         * Note: the difference between the compatible feature set and
1234         * the incompatible feature set is that if there is a bit set
1235         * in the incompatible feature set that the kernel doesn't
1236         * know about, it should refuse to mount the filesystem.
1237         *
1238         * e2fsck's requirements are more strict; if it doesn't know
1239         * about a feature in either the compatible or incompatible
1240         * feature set, it must abort and not try to meddle with
1241         * things it doesn't understand...
1242         */
1243        __le32  s_first_ino;            /* First non-reserved inode */
1244        __le16  s_inode_size;           /* size of inode structure */
1245        __le16  s_block_group_nr;       /* block group # of this superblock */
1246        __le32  s_feature_compat;       /* compatible feature set */
1247/*60*/  __le32  s_feature_incompat;     /* incompatible feature set */
1248        __le32  s_feature_ro_compat;    /* readonly-compatible feature set */
1249/*68*/  __u8    s_uuid[16];             /* 128-bit uuid for volume */
1250/*78*/  char    s_volume_name[16];      /* volume name */
1251/*88*/  char    s_last_mounted[64];     /* directory where last mounted */
1252/*C8*/  __le32  s_algorithm_usage_bitmap; /* For compression */
1253        /*
1254         * Performance hints.  Directory preallocation should only
1255         * happen if the EXT4_FEATURE_COMPAT_DIR_PREALLOC flag is on.
1256         */
1257        __u8    s_prealloc_blocks;      /* Nr of blocks to try to preallocate*/
1258        __u8    s_prealloc_dir_blocks;  /* Nr to preallocate for dirs */
1259        __le16  s_reserved_gdt_blocks;  /* Per group desc for online growth */
1260        /*
1261         * Journaling support valid if EXT4_FEATURE_COMPAT_HAS_JOURNAL set.
1262         */
1263/*D0*/  __u8    s_journal_uuid[16];     /* uuid of journal superblock */
1264/*E0*/  __le32  s_journal_inum;         /* inode number of journal file */
1265        __le32  s_journal_dev;          /* device number of journal file */
1266        __le32  s_last_orphan;          /* start of list of inodes to delete */
1267        __le32  s_hash_seed[4];         /* HTREE hash seed */
1268        __u8    s_def_hash_version;     /* Default hash version to use */
1269        __u8    s_jnl_backup_type;
1270        __le16  s_desc_size;            /* size of group descriptor */
1271/*100*/ __le32  s_default_mount_opts;
1272        __le32  s_first_meta_bg;        /* First metablock block group */
1273        __le32  s_mkfs_time;            /* When the filesystem was created */
1274        __le32  s_jnl_blocks[17];       /* Backup of the journal inode */
1275        /* 64bit support valid if EXT4_FEATURE_COMPAT_64BIT */
1276/*150*/ __le32  s_blocks_count_hi;      /* Blocks count */
1277        __le32  s_r_blocks_count_hi;    /* Reserved blocks count */
1278        __le32  s_free_blocks_count_hi; /* Free blocks count */
1279        __le16  s_min_extra_isize;      /* All inodes have at least # bytes */
1280        __le16  s_want_extra_isize;     /* New inodes should reserve # bytes */
1281        __le32  s_flags;                /* Miscellaneous flags */
1282        __le16  s_raid_stride;          /* RAID stride */
1283        __le16  s_mmp_update_interval;  /* # seconds to wait in MMP checking */
1284        __le64  s_mmp_block;            /* Block for multi-mount protection */
1285        __le32  s_raid_stripe_width;    /* blocks on all data disks (N*stride)*/
1286        __u8    s_log_groups_per_flex;  /* FLEX_BG group size */
1287        __u8    s_checksum_type;        /* metadata checksum algorithm used */
1288        __u8    s_encryption_level;     /* versioning level for encryption */
1289        __u8    s_reserved_pad;         /* Padding to next 32bits */
1290        __le64  s_kbytes_written;       /* nr of lifetime kilobytes written */
1291        __le32  s_snapshot_inum;        /* Inode number of active snapshot */
1292        __le32  s_snapshot_id;          /* sequential ID of active snapshot */
1293        __le64  s_snapshot_r_blocks_count; /* reserved blocks for active
1294                                              snapshot's future use */
1295        __le32  s_snapshot_list;        /* inode number of the head of the
1296                                           on-disk snapshot list */
1297#define EXT4_S_ERR_START offsetof(struct ext4_super_block, s_error_count)
1298        __le32  s_error_count;          /* number of fs errors */
1299        __le32  s_first_error_time;     /* first time an error happened */
1300        __le32  s_first_error_ino;      /* inode involved in first error */
1301        __le64  s_first_error_block;    /* block involved of first error */
1302        __u8    s_first_error_func[32]; /* function where the error happened */
1303        __le32  s_first_error_line;     /* line number where error happened */
1304        __le32  s_last_error_time;      /* most recent time of an error */
1305        __le32  s_last_error_ino;       /* inode involved in last error */
1306        __le32  s_last_error_line;      /* line number where error happened */
1307        __le64  s_last_error_block;     /* block involved of last error */
1308        __u8    s_last_error_func[32];  /* function where the error happened */
1309#define EXT4_S_ERR_END offsetof(struct ext4_super_block, s_mount_opts)
1310        __u8    s_mount_opts[64];
1311        __le32  s_usr_quota_inum;       /* inode for tracking user quota */
1312        __le32  s_grp_quota_inum;       /* inode for tracking group quota */
1313        __le32  s_overhead_clusters;    /* overhead blocks/clusters in fs */
1314        __le32  s_backup_bgs[2];        /* groups with sparse_super2 SBs */
1315        __u8    s_encrypt_algos[4];     /* Encryption algorithms in use  */
1316        __u8    s_encrypt_pw_salt[16];  /* Salt used for string2key algorithm */
1317        __le32  s_lpf_ino;              /* Location of the lost+found inode */
1318        __le32  s_prj_quota_inum;       /* inode for tracking project quota */
1319        __le32  s_checksum_seed;        /* crc32c(uuid) if csum_seed set */
1320        __le32  s_reserved[98];         /* Padding to the end of the block */
1321        __le32  s_checksum;             /* crc32c(superblock) */
1322};
1323
/*
 * Size in bytes of the superblock's error-tracking area: everything from
 * s_error_count up to, but not including, s_mount_opts.
 */
1324#define EXT4_S_ERR_LEN (EXT4_S_ERR_END - EXT4_S_ERR_START)
1325
1326#ifdef __KERNEL__
1327
1328/*
1329 * run-time mount flags
1330 */
1331#define EXT4_MF_MNTDIR_SAMPLED          0x0001
1332#define EXT4_MF_FS_ABORTED              0x0002  /* Fatal error detected */
1333#define EXT4_MF_TEST_DUMMY_ENCRYPTION   0x0004
1334
/*
 * True when EXT4_MF_TEST_DUMMY_ENCRYPTION is set in sbi->s_mount_flags.
 * Without CONFIG_EXT4_FS_ENCRYPTION it is the constant 0 and @sbi is not
 * evaluated.
 */
1335#ifdef CONFIG_EXT4_FS_ENCRYPTION
1336#define DUMMY_ENCRYPTION_ENABLED(sbi) (unlikely((sbi)->s_mount_flags & \
1337                                                EXT4_MF_TEST_DUMMY_ENCRYPTION))
1338#else
1339#define DUMMY_ENCRYPTION_ENABLED(sbi) (0)
1340#endif
1341
1342/* Number of quota types we support */
1343#define EXT4_MAXQUOTAS 3
1344
1345#ifdef CONFIG_EXT4_FS_ENCRYPTION
1346#define EXT4_KEY_DESC_PREFIX "ext4:"
1347#define EXT4_KEY_DESC_PREFIX_SIZE 5
1348#endif
1349
1350/*
1351 * fourth extended-fs super-block data in memory
1352 */
1353struct ext4_sb_info {
1354        unsigned long s_desc_size;      /* Size of a group descriptor in bytes */
1355        unsigned long s_inodes_per_block;/* Number of inodes per block */
1356        unsigned long s_blocks_per_group;/* Number of blocks in a group */
1357        unsigned long s_clusters_per_group; /* Number of clusters in a group */
1358        unsigned long s_inodes_per_group;/* Number of inodes in a group */
1359        unsigned long s_itb_per_group;  /* Number of inode table blocks per group */
1360        unsigned long s_gdb_count;      /* Number of group descriptor blocks */
1361        unsigned long s_desc_per_block; /* Number of group descriptors per block */
1362        ext4_group_t s_groups_count;    /* Number of groups in the fs */
1363        ext4_group_t s_blockfile_groups;/* Groups acceptable for non-extent files */
1364        unsigned long s_overhead;  /* # of fs overhead clusters */
1365        unsigned int s_cluster_ratio;   /* Number of blocks per cluster */
1366        unsigned int s_cluster_bits;    /* log2 of s_cluster_ratio */
1367        loff_t s_bitmap_maxbytes;       /* max bytes for bitmap files */
1368        struct buffer_head * s_sbh;     /* Buffer containing the super block */
1369        struct ext4_super_block *s_es;  /* Pointer to the super block in the buffer */
1370        struct buffer_head **s_group_desc;
1371        unsigned int s_mount_opt;
1372        unsigned int s_mount_opt2;
1373        unsigned int s_mount_flags;
1374        unsigned int s_def_mount_opt;
1375        ext4_fsblk_t s_sb_block;
1376        atomic64_t s_resv_clusters;
1377        kuid_t s_resuid;
1378        kgid_t s_resgid;
1379        unsigned short s_mount_state;
1380        unsigned short s_pad;
1381        int s_addr_per_block_bits;
1382        int s_desc_per_block_bits;
1383        int s_inode_size;
1384        int s_first_ino;
1385        unsigned int s_inode_readahead_blks;
1386        unsigned int s_inode_goal;
1387        spinlock_t s_next_gen_lock;
1388        u32 s_next_generation;
1389        u32 s_hash_seed[4];
1390        int s_def_hash_version;
1391        int s_hash_unsigned;    /* 3 if hash should be unsigned, 0 if not */
1392        struct percpu_counter s_freeclusters_counter;
1393        struct percpu_counter s_freeinodes_counter;
1394        struct percpu_counter s_dirs_counter;
1395        struct percpu_counter s_dirtyclusters_counter;
1396        struct blockgroup_lock *s_blockgroup_lock;
1397        struct proc_dir_entry *s_proc;
1398        struct kobject s_kobj;
1399        struct completion s_kobj_unregister;
1400        struct super_block *s_sb;
1401
1402        /* Journaling */
1403        struct journal_s *s_journal;
1404        struct list_head s_orphan;
1405        struct mutex s_orphan_lock;
1406        unsigned long s_resize_flags;           /* Flags indicating if there
1407                                                   is a resizer */
1408        unsigned long s_commit_interval;
1409        u32 s_max_batch_time;
1410        u32 s_min_batch_time;
1411        struct block_device *journal_bdev;
1412#ifdef CONFIG_QUOTA
1413        char *s_qf_names[EXT4_MAXQUOTAS];       /* Names of quota files with journalled quota */
1414        int s_jquota_fmt;                       /* Format of quota to use */
1415#endif
1416        unsigned int s_want_extra_isize; /* New inodes should reserve # bytes */
1417        struct rb_root system_blks;
1418
1419#ifdef EXTENTS_STATS
1420        /* ext4 extents stats */
1421        unsigned long s_ext_min;
1422        unsigned long s_ext_max;
1423        unsigned long s_depth_max;
1424        spinlock_t s_ext_stats_lock;
1425        unsigned long s_ext_blocks;
1426        unsigned long s_ext_extents;
1427#endif
1428
1429        /* for buddy allocator */
1430        struct ext4_group_info ***s_group_info;
1431        struct inode *s_buddy_cache;
1432        spinlock_t s_md_lock;
1433        unsigned short *s_mb_offsets;
1434        unsigned int *s_mb_maxs;
1435        unsigned int s_group_info_size;
1436        unsigned int s_mb_free_pending;
1437
1438        /* tunables */
1439        unsigned long s_stripe;
1440        unsigned int s_mb_stream_request;
1441        unsigned int s_mb_max_to_scan;
1442        unsigned int s_mb_min_to_scan;
1443        unsigned int s_mb_stats;
1444        unsigned int s_mb_order2_reqs;
1445        unsigned int s_mb_group_prealloc;
1446        unsigned int s_max_dir_size_kb;
1447        /* where last allocation was done - for stream allocation */
1448        unsigned long s_mb_last_group;
1449        unsigned long s_mb_last_start;
1450
1451        /* stats for buddy allocator */
1452        atomic_t s_bal_reqs;    /* number of reqs with len > 1 */
1453        atomic_t s_bal_success; /* we found long enough chunks */
1454        atomic_t s_bal_allocated;       /* in blocks */
1455        atomic_t s_bal_ex_scanned;      /* total extents scanned */
1456        atomic_t s_bal_goals;   /* goal hits */
1457        atomic_t s_bal_breaks;  /* too long searches */
1458        atomic_t s_bal_2orders; /* 2^order hits */
1459        spinlock_t s_bal_lock;
1460        unsigned long s_mb_buddies_generated;
1461        unsigned long long s_mb_generation_time;
1462        atomic_t s_mb_lost_chunks;
1463        atomic_t s_mb_preallocated;
1464        atomic_t s_mb_discarded;
1465        atomic_t s_lock_busy;
1466
1467        /* locality groups */
1468        struct ext4_locality_group __percpu *s_locality_groups;
1469
1470        /* for write statistics */
1471        unsigned long s_sectors_written_start;
1472        u64 s_kbytes_written;
1473
1474        /* the size of zero-out chunk */
1475        unsigned int s_extent_max_zeroout_kb;
1476
1477        unsigned int s_log_groups_per_flex;
1478        struct flex_groups *s_flex_groups;
1479        ext4_group_t s_flex_groups_allocated;
1480
1481        /* workqueue for reserved extent conversions (buffered io) */
1482        struct workqueue_struct *rsv_conversion_wq;
1483
1484        /* timer for periodic error stats printing */
1485        struct timer_list s_err_report;
1486
1487        /* Lazy inode table initialization info */
1488        struct ext4_li_request *s_li_request;
1489        /* Wait multiplier for lazy initialization thread */
1490        unsigned int s_li_wait_mult;
1491
1492        /* Kernel thread for multiple mount protection */
1493        struct task_struct *s_mmp_tsk;
1494
1495        /* record the last minlen when FITRIM is called. */
1496        atomic_t s_last_trim_minblks;
1497
1498        /* Reference to checksum algorithm driver via cryptoapi */
1499        struct crypto_shash *s_chksum_driver;
1500
1501        /* Precomputed FS UUID checksum for seeding other checksums */
1502        __u32 s_csum_seed;
1503
1504        /* Reclaim extents from extent status tree */
1505        struct shrinker s_es_shrinker;
1506        struct list_head s_es_list;     /* List of inodes with reclaimable extents */
1507        long s_es_nr_inode;
1508        struct ext4_es_stats s_es_stats;
1509        struct mb_cache *s_mb_cache;
1510        spinlock_t s_es_lock ____cacheline_aligned_in_smp;
1511
1512        /* Ratelimit ext4 messages. */
1513        struct ratelimit_state s_err_ratelimit_state;
1514        struct ratelimit_state s_warning_ratelimit_state;
1515        struct ratelimit_state s_msg_ratelimit_state;
1516
1517        /* Barrier between changing inodes' journal flags and writepages ops. */
1518        struct percpu_rw_semaphore s_journal_flag_rwsem;
1519
1520        /* Encryption support */
1521#ifdef CONFIG_EXT4_FS_ENCRYPTION
1522        u8 key_prefix[EXT4_KEY_DESC_PREFIX_SIZE];
1523        u8 key_prefix_size;
1524#endif
1525};
1526
1527static inline struct ext4_sb_info *EXT4_SB(struct super_block *sb)
1528{
1529        return sb->s_fs_info;
1530}
1531static inline struct ext4_inode_info *EXT4_I(struct inode *inode)
1532{
1533        return container_of(inode, struct ext4_inode_info, vfs_inode);
1534}
1535
1536static inline struct timespec ext4_current_time(struct inode *inode)
1537{
1538        return (inode->i_sb->s_time_gran < NSEC_PER_SEC) ?
1539                current_fs_time(inode->i_sb) : CURRENT_TIME_SEC;
1540}
1541
1542static inline int ext4_valid_inum(struct super_block *sb, unsigned long ino)
1543{
1544        return ino == EXT4_ROOT_INO ||
1545                ino == EXT4_USR_QUOTA_INO ||
1546                ino == EXT4_GRP_QUOTA_INO ||
1547                ino == EXT4_BOOT_LOADER_INO ||
1548                ino == EXT4_JOURNAL_INO ||
1549                ino == EXT4_RESIZE_INO ||
1550                (ino >= EXT4_FIRST_INO(sb) &&
1551                 ino <= le32_to_cpu(EXT4_SB(sb)->s_es->s_inodes_count));
1552}
1553
1554/*
1555 * Inode dynamic state flags
1556 */
1557enum {
        /*
         * NOTE(review): the enumerators are consecutive values starting at 0;
         * presumably they are the 'bit' argument handed to
         * ext4_{test,set,clear}_inode_state() -- confirm at the call sites.
         */
1558        EXT4_STATE_JDATA,               /* journaled data exists */
1559        EXT4_STATE_NEW,                 /* inode is newly created */
1560        EXT4_STATE_XATTR,               /* has in-inode xattrs */
1561        EXT4_STATE_NO_EXPAND,           /* No space for expansion */
1562        EXT4_STATE_DA_ALLOC_CLOSE,      /* Alloc DA blks on close */
1563        EXT4_STATE_EXT_MIGRATE,         /* Inode is migrating */
1564        EXT4_STATE_DIO_UNWRITTEN,       /* need convert on dio done*/
1565        EXT4_STATE_NEWENTRY,            /* File just added to dir */
1566        EXT4_STATE_DIOREAD_LOCK,        /* Disable support for dio read
1567                                           nolocking */
1568        EXT4_STATE_MAY_INLINE_DATA,     /* may have in-inode data */
1569        EXT4_STATE_EXT_PRECACHED,       /* extents have been precached */
1570};
1571
/*
 * EXT4_INODE_BIT_FNS(name, field, offset) - emit ext4_test_inode_<name>(),
 * ext4_set_inode_<name>() and ext4_clear_inode_<name>().  Each one applies
 * test_bit()/set_bit()/clear_bit() to bit number (bit + offset) of the
 * i_<field> member of the ext4_inode_info obtained via EXT4_I(inode).
 */
1572#define EXT4_INODE_BIT_FNS(name, field, offset)                         \
1573static inline int ext4_test_inode_##name(struct inode *inode, int bit)  \
1574{                                                                       \
1575        return test_bit(bit + (offset), &EXT4_I(inode)->i_##field);     \
1576}                                                                       \
1577static inline void ext4_set_inode_##name(struct inode *inode, int bit)  \
1578{                                                                       \
1579        set_bit(bit + (offset), &EXT4_I(inode)->i_##field);             \
1580}                                                                       \
1581static inline void ext4_clear_inode_##name(struct inode *inode, int bit) \
1582{                                                                       \
1583        clear_bit(bit + (offset), &EXT4_I(inode)->i_##field);           \
1584}
1585
1586/* Add these declarations here only so that these functions can be
1587 * found by name.  Otherwise, they are very hard to locate. */
1588static inline int ext4_test_inode_flag(struct inode *inode, int bit);
1589static inline void ext4_set_inode_flag(struct inode *inode, int bit);
1590static inline void ext4_clear_inode_flag(struct inode *inode, int bit);
1591EXT4_INODE_BIT_FNS(flag, flags, 0)
1592
1593/* Add these declarations here only so that these functions can be
1594 * found by name.  Otherwise, they are very hard to locate. */
1595static inline int ext4_test_inode_state(struct inode *inode, int bit);
1596static inline void ext4_set_inode_state(struct inode *inode, int bit);
1597static inline void ext4_clear_inode_state(struct inode *inode, int bit);
/*
 * When BITS_PER_LONG < 64 the state bits live in their own i_state_flags
 * word, which ext4_clear_state_flags() zeroes.  Otherwise the state
 * accessors address i_flags at bit offset 32, and ext4_clear_state_flags()
 * deliberately does nothing.
 */
1598#if (BITS_PER_LONG < 64)
1599EXT4_INODE_BIT_FNS(state, state_flags, 0)
1600
1601static inline void ext4_clear_state_flags(struct ext4_inode_info *ei)
1602{
1603        (ei)->i_state_flags = 0;
1604}
1605#else
1606EXT4_INODE_BIT_FNS(state, flags, 32)
1607
1608static inline void ext4_clear_state_flags(struct ext4_inode_info *ei)
1609{
1610        /* We depend on the fact that callers will set i_flags */
1611}
1612#endif
1613#else
1614/* Assume that user mode programs are passing in an ext4fs superblock, not
1615 * a kernel struct super_block.  This will allow us to call the feature-test
1616 * macros from user land. */
1617#define EXT4_SB(sb)     (sb)
1618#endif
1619
1620/*
1621 * The next inode on the orphan list is linked through i_dtime
1622 */
1623#define NEXT_ORPHAN(inode) EXT4_I(inode)->i_dtime
1624
1625/*
1626 * Codes for operating systems
1627 */
1628#define EXT4_OS_LINUX           0
1629#define EXT4_OS_HURD            1
1630#define EXT4_OS_MASIX           2
1631#define EXT4_OS_FREEBSD         3
1632#define EXT4_OS_LITES           4
1633
1634/*
1635 * Revision levels
1636 */
1637#define EXT4_GOOD_OLD_REV       0       /* The good old (original) format */
1638#define EXT4_DYNAMIC_REV        1       /* V2 format w/ dynamic inode sizes */
1639
1640#define EXT4_CURRENT_REV        EXT4_GOOD_OLD_REV
1641#define EXT4_MAX_SUPP_REV       EXT4_DYNAMIC_REV
1642
1643#define EXT4_GOOD_OLD_INODE_SIZE 128
1644
1645/*
1646 * Feature set definitions
1647 */
1648
1649#define EXT4_FEATURE_COMPAT_DIR_PREALLOC        0x0001
1650#define EXT4_FEATURE_COMPAT_IMAGIC_INODES       0x0002
1651#define EXT4_FEATURE_COMPAT_HAS_JOURNAL         0x0004
1652#define EXT4_FEATURE_COMPAT_EXT_ATTR            0x0008
1653#define EXT4_FEATURE_COMPAT_RESIZE_INODE        0x0010
1654#define EXT4_FEATURE_COMPAT_DIR_INDEX           0x0020
1655#define EXT4_FEATURE_COMPAT_SPARSE_SUPER2       0x0200
1656
1657#define EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER     0x0001
1658#define EXT4_FEATURE_RO_COMPAT_LARGE_FILE       0x0002
1659#define EXT4_FEATURE_RO_COMPAT_BTREE_DIR        0x0004
1660#define EXT4_FEATURE_RO_COMPAT_HUGE_FILE        0x0008
1661#define EXT4_FEATURE_RO_COMPAT_GDT_CSUM         0x0010
1662#define EXT4_FEATURE_RO_COMPAT_DIR_NLINK        0x0020
1663#define EXT4_FEATURE_RO_COMPAT_EXTRA_ISIZE      0x0040
1664#define EXT4_FEATURE_RO_COMPAT_QUOTA            0x0100
1665#define EXT4_FEATURE_RO_COMPAT_BIGALLOC         0x0200
1666/*
1667 * METADATA_CSUM also enables group descriptor checksums (GDT_CSUM).  When
1668 * METADATA_CSUM is set, group descriptor checksums use the same algorithm as
1669 * all other data structures' checksums.  However, the METADATA_CSUM and
1670 * GDT_CSUM bits are mutually exclusive.
1671 */
1672#define EXT4_FEATURE_RO_COMPAT_METADATA_CSUM    0x0400
1673#define EXT4_FEATURE_RO_COMPAT_READONLY         0x1000
1674#define EXT4_FEATURE_RO_COMPAT_PROJECT          0x2000
1675
1676#define EXT4_FEATURE_INCOMPAT_COMPRESSION       0x0001
1677#define EXT4_FEATURE_INCOMPAT_FILETYPE          0x0002
1678#define EXT4_FEATURE_INCOMPAT_RECOVER           0x0004 /* Needs recovery */
1679#define EXT4_FEATURE_INCOMPAT_JOURNAL_DEV       0x0008 /* Journal device */
1680#define EXT4_FEATURE_INCOMPAT_META_BG           0x0010
1681#define EXT4_FEATURE_INCOMPAT_EXTENTS           0x0040 /* extents support */
1682#define EXT4_FEATURE_INCOMPAT_64BIT             0x0080
1683#define EXT4_FEATURE_INCOMPAT_MMP               0x0100
1684#define EXT4_FEATURE_INCOMPAT_FLEX_BG           0x0200
1685#define EXT4_FEATURE_INCOMPAT_EA_INODE          0x0400 /* EA in inode */
1686#define EXT4_FEATURE_INCOMPAT_DIRDATA           0x1000 /* data in dirent */
1687#define EXT4_FEATURE_INCOMPAT_CSUM_SEED         0x2000
1688#define EXT4_FEATURE_INCOMPAT_LARGEDIR          0x4000 /* >2GB or 3-lvl htree */
1689#define EXT4_FEATURE_INCOMPAT_INLINE_DATA       0x8000 /* data in inode */
1690#define EXT4_FEATURE_INCOMPAT_ENCRYPT           0x10000
1691
/*
 * EXT4_FEATURE_COMPAT_FUNCS(name, flagname) - emit
 * ext4_has_feature_<name>(), ext4_set_feature_<name>() and
 * ext4_clear_feature_<name>(), which test, set and clear bit
 * EXT4_FEATURE_COMPAT_<flagname> in the superblock's s_feature_compat
 * field.  The mask is passed through cpu_to_le32() before it is applied.
 */
1692#define EXT4_FEATURE_COMPAT_FUNCS(name, flagname) \
1693static inline bool ext4_has_feature_##name(struct super_block *sb) \
1694{ \
1695        return ((EXT4_SB(sb)->s_es->s_feature_compat & \
1696                cpu_to_le32(EXT4_FEATURE_COMPAT_##flagname)) != 0); \
1697} \
1698static inline void ext4_set_feature_##name(struct super_block *sb) \
1699{ \
1700        EXT4_SB(sb)->s_es->s_feature_compat |= \
1701                cpu_to_le32(EXT4_FEATURE_COMPAT_##flagname); \
1702} \
1703static inline void ext4_clear_feature_##name(struct super_block *sb) \
1704{ \
1705        EXT4_SB(sb)->s_es->s_feature_compat &= \
1706                ~cpu_to_le32(EXT4_FEATURE_COMPAT_##flagname); \
1707}
1708
/*
 * EXT4_FEATURE_RO_COMPAT_FUNCS(name, flagname) - emit
 * ext4_has_feature_<name>(), ext4_set_feature_<name>() and
 * ext4_clear_feature_<name>(), which test, set and clear bit
 * EXT4_FEATURE_RO_COMPAT_<flagname> in the superblock's s_feature_ro_compat
 * field.  The mask is passed through cpu_to_le32() before it is applied.
 */
1709#define EXT4_FEATURE_RO_COMPAT_FUNCS(name, flagname) \
1710static inline bool ext4_has_feature_##name(struct super_block *sb) \
1711{ \
1712        return ((EXT4_SB(sb)->s_es->s_feature_ro_compat & \
1713                cpu_to_le32(EXT4_FEATURE_RO_COMPAT_##flagname)) != 0); \
1714} \
1715static inline void ext4_set_feature_##name(struct super_block *sb) \
1716{ \
1717        EXT4_SB(sb)->s_es->s_feature_ro_compat |= \
1718                cpu_to_le32(EXT4_FEATURE_RO_COMPAT_##flagname); \
1719} \
1720static inline void ext4_clear_feature_##name(struct super_block *sb) \
1721{ \
1722        EXT4_SB(sb)->s_es->s_feature_ro_compat &= \
1723                ~cpu_to_le32(EXT4_FEATURE_RO_COMPAT_##flagname); \
1724}
1725
/*
 * EXT4_FEATURE_INCOMPAT_FUNCS(name, flagname) - emit
 * ext4_has_feature_<name>(), ext4_set_feature_<name>() and
 * ext4_clear_feature_<name>(), which test, set and clear bit
 * EXT4_FEATURE_INCOMPAT_<flagname> in the superblock's s_feature_incompat
 * field.  The mask is passed through cpu_to_le32() before it is applied.
 */
1726#define EXT4_FEATURE_INCOMPAT_FUNCS(name, flagname) \
1727static inline bool ext4_has_feature_##name(struct super_block *sb) \
1728{ \
1729        return ((EXT4_SB(sb)->s_es->s_feature_incompat & \
1730                cpu_to_le32(EXT4_FEATURE_INCOMPAT_##flagname)) != 0); \
1731} \
1732static inline void ext4_set_feature_##name(struct super_block *sb) \
1733{ \
1734        EXT4_SB(sb)->s_es->s_feature_incompat |= \
1735                cpu_to_le32(EXT4_FEATURE_INCOMPAT_##flagname); \
1736} \
1737static inline void ext4_clear_feature_##name(struct super_block *sb) \
1738{ \
1739        EXT4_SB(sb)->s_es->s_feature_incompat &= \
1740                ~cpu_to_le32(EXT4_FEATURE_INCOMPAT_##flagname); \
1741}
1742
1743EXT4_FEATURE_COMPAT_FUNCS(dir_prealloc,         DIR_PREALLOC)
1744EXT4_FEATURE_COMPAT_FUNCS(imagic_inodes,        IMAGIC_INODES)
1745EXT4_FEATURE_COMPAT_FUNCS(journal,              HAS_JOURNAL)
1746EXT4_FEATURE_COMPAT_FUNCS(xattr,                EXT_ATTR)
1747EXT4_FEATURE_COMPAT_FUNCS(resize_inode,         RESIZE_INODE)
1748EXT4_FEATURE_COMPAT_FUNCS(dir_index,            DIR_INDEX)
1749EXT4_FEATURE_COMPAT_FUNCS(sparse_super2,        SPARSE_SUPER2)
1750
1751EXT4_FEATURE_RO_COMPAT_FUNCS(sparse_super,      SPARSE_SUPER)
1752EXT4_FEATURE_RO_COMPAT_FUNCS(large_file,        LARGE_FILE)
1753EXT4_FEATURE_RO_COMPAT_FUNCS(btree_dir,         BTREE_DIR)
1754EXT4_FEATURE_RO_COMPAT_FUNCS(huge_file,         HUGE_FILE)
1755EXT4_FEATURE_RO_COMPAT_FUNCS(gdt_csum,          GDT_CSUM)
1756EXT4_FEATURE_RO_COMPAT_FUNCS(dir_nlink,         DIR_NLINK)
1757EXT4_FEATURE_RO_COMPAT_FUNCS(extra_isize,       EXTRA_ISIZE)
1758EXT4_FEATURE_RO_COMPAT_FUNCS(quota,             QUOTA)
1759EXT4_FEATURE_RO_COMPAT_FUNCS(bigalloc,          BIGALLOC)
1760EXT4_FEATURE_RO_COMPAT_FUNCS(metadata_csum,     METADATA_CSUM)
1761EXT4_FEATURE_RO_COMPAT_FUNCS(readonly,          READONLY)
1762EXT4_FEATURE_RO_COMPAT_FUNCS(project,           PROJECT)
1763
1764EXT4_FEATURE_INCOMPAT_FUNCS(compression,        COMPRESSION)
1765EXT4_FEATURE_INCOMPAT_FUNCS(filetype,           FILETYPE)
1766EXT4_FEATURE_INCOMPAT_FUNCS(journal_needs_recovery,     RECOVER)
1767EXT4_FEATURE_INCOMPAT_FUNCS(journal_dev,        JOURNAL_DEV)
1768EXT4_FEATURE_INCOMPAT_FUNCS(meta_bg,            META_BG)
1769EXT4_FEATURE_INCOMPAT_FUNCS(extents,            EXTENTS)
1770EXT4_FEATURE_INCOMPAT_FUNCS(64bit,              64BIT)
1771EXT4_FEATURE_INCOMPAT_FUNCS(mmp,                MMP)
1772EXT4_FEATURE_INCOMPAT_FUNCS(flex_bg,            FLEX_BG)
1773EXT4_FEATURE_INCOMPAT_FUNCS(ea_inode,           EA_INODE)
1774EXT4_FEATURE_INCOMPAT_FUNCS(dirdata,            DIRDATA)
1775EXT4_FEATURE_INCOMPAT_FUNCS(csum_seed,          CSUM_SEED)
1776EXT4_FEATURE_INCOMPAT_FUNCS(largedir,           LARGEDIR)
1777EXT4_FEATURE_INCOMPAT_FUNCS(inline_data,        INLINE_DATA)
1778EXT4_FEATURE_INCOMPAT_FUNCS(encrypt,            ENCRYPT)
1779
1780#define EXT2_FEATURE_COMPAT_SUPP        EXT4_FEATURE_COMPAT_EXT_ATTR
1781#define EXT2_FEATURE_INCOMPAT_SUPP      (EXT4_FEATURE_INCOMPAT_FILETYPE| \
1782                                         EXT4_FEATURE_INCOMPAT_META_BG)
1783#define EXT2_FEATURE_RO_COMPAT_SUPP     (EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER| \
1784                                         EXT4_FEATURE_RO_COMPAT_LARGE_FILE| \
1785                                         EXT4_FEATURE_RO_COMPAT_BTREE_DIR)
1786
1787#define EXT3_FEATURE_COMPAT_SUPP        EXT4_FEATURE_COMPAT_EXT_ATTR
1788#define EXT3_FEATURE_INCOMPAT_SUPP      (EXT4_FEATURE_INCOMPAT_FILETYPE| \
1789                                         EXT4_FEATURE_INCOMPAT_RECOVER| \
1790                                         EXT4_FEATURE_INCOMPAT_META_BG)
1791#define EXT3_FEATURE_RO_COMPAT_SUPP     (EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER| \
1792                                         EXT4_FEATURE_RO_COMPAT_LARGE_FILE| \
1793                                         EXT4_FEATURE_RO_COMPAT_BTREE_DIR)
1794
1795#define EXT4_FEATURE_COMPAT_SUPP        EXT4_FEATURE_COMPAT_EXT_ATTR
1796#define EXT4_FEATURE_INCOMPAT_SUPP      (EXT4_FEATURE_INCOMPAT_FILETYPE| \
1797                                         EXT4_FEATURE_INCOMPAT_RECOVER| \
1798                                         EXT4_FEATURE_INCOMPAT_META_BG| \
1799                                         EXT4_FEATURE_INCOMPAT_EXTENTS| \
1800                                         EXT4_FEATURE_INCOMPAT_64BIT| \
1801                                         EXT4_FEATURE_INCOMPAT_FLEX_BG| \
1802                                         EXT4_FEATURE_INCOMPAT_MMP | \
1803                                         EXT4_FEATURE_INCOMPAT_INLINE_DATA | \
1804                                         EXT4_FEATURE_INCOMPAT_ENCRYPT | \
1805                                         EXT4_FEATURE_INCOMPAT_CSUM_SEED)
1806#define EXT4_FEATURE_RO_COMPAT_SUPP     (EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER| \
1807                                         EXT4_FEATURE_RO_COMPAT_LARGE_FILE| \
1808                                         EXT4_FEATURE_RO_COMPAT_GDT_CSUM| \
1809                                         EXT4_FEATURE_RO_COMPAT_DIR_NLINK | \
1810                                         EXT4_FEATURE_RO_COMPAT_EXTRA_ISIZE | \
1811                                         EXT4_FEATURE_RO_COMPAT_BTREE_DIR |\
1812                                         EXT4_FEATURE_RO_COMPAT_HUGE_FILE |\
1813                                         EXT4_FEATURE_RO_COMPAT_BIGALLOC |\
1814                                         EXT4_FEATURE_RO_COMPAT_METADATA_CSUM|\
1815                                         EXT4_FEATURE_RO_COMPAT_QUOTA |\
1816                                         EXT4_FEATURE_RO_COMPAT_PROJECT)
1817
/*
 * EXTN_FEATURE_FUNCS(ver) - emit the three predicates
 * ext4_has_unknown_ext<ver>_compat_features(),
 * ext4_has_unknown_ext<ver>_ro_compat_features() and
 * ext4_has_unknown_ext<ver>_incompat_features().  Each returns true when
 * the matching superblock feature field has at least one bit set that is
 * not part of the corresponding EXT<ver>_FEATURE_*_SUPP mask.
 */
1818#define EXTN_FEATURE_FUNCS(ver) \
1819static inline bool ext4_has_unknown_ext##ver##_compat_features(struct super_block *sb) \
1820{ \
1821        return ((EXT4_SB(sb)->s_es->s_feature_compat & \
1822                cpu_to_le32(~EXT##ver##_FEATURE_COMPAT_SUPP)) != 0); \
1823} \
1824static inline bool ext4_has_unknown_ext##ver##_ro_compat_features(struct super_block *sb) \
1825{ \
1826        return ((EXT4_SB(sb)->s_es->s_feature_ro_compat & \
1827                cpu_to_le32(~EXT##ver##_FEATURE_RO_COMPAT_SUPP)) != 0); \
1828} \
1829static inline bool ext4_has_unknown_ext##ver##_incompat_features(struct super_block *sb) \
1830{ \
1831        return ((EXT4_SB(sb)->s_es->s_feature_incompat & \
1832                cpu_to_le32(~EXT##ver##_FEATURE_INCOMPAT_SUPP)) != 0); \
1833}
1834
1835EXTN_FEATURE_FUNCS(2)
1836EXTN_FEATURE_FUNCS(3)
1837EXTN_FEATURE_FUNCS(4)
1838
1839static inline bool ext4_has_compat_features(struct super_block *sb)
1840{
1841        return (EXT4_SB(sb)->s_es->s_feature_compat != 0);
1842}
1843static inline bool ext4_has_ro_compat_features(struct super_block *sb)
1844{
1845        return (EXT4_SB(sb)->s_es->s_feature_ro_compat != 0);
1846}
1847static inline bool ext4_has_incompat_features(struct super_block *sb)
1848{
1849        return (EXT4_SB(sb)->s_es->s_feature_incompat != 0);
1850}
1851
1852/*
1853 * Default values for user and/or group using reserved blocks
1854 */
1855#define EXT4_DEF_RESUID         0
1856#define EXT4_DEF_RESGID         0
1857
1858/*
1859 * Default project ID
1860 */
1861#define EXT4_DEF_PROJID         0
1862
1863#define EXT4_DEF_INODE_READAHEAD_BLKS   32
1864
1865/*
1866 * Default mount options
1867 */
1868#define EXT4_DEFM_DEBUG         0x0001
1869#define EXT4_DEFM_BSDGROUPS     0x0002
1870#define EXT4_DEFM_XATTR_USER    0x0004
1871#define EXT4_DEFM_ACL           0x0008
1872#define EXT4_DEFM_UID16         0x0010
1873#define EXT4_DEFM_JMODE         0x0060
1874#define EXT4_DEFM_JMODE_DATA    0x0020
1875#define EXT4_DEFM_JMODE_ORDERED 0x0040
1876#define EXT4_DEFM_JMODE_WBACK   0x0060
1877#define EXT4_DEFM_NOBARRIER     0x0100
1878#define EXT4_DEFM_BLOCK_VALIDITY 0x0200
1879#define EXT4_DEFM_DISCARD       0x0400
1880#define EXT4_DEFM_NODELALLOC    0x0800
1881
1882/*
1883 * Default journal batch times
1884 */
1885#define EXT4_DEF_MIN_BATCH_TIME 0
1886#define EXT4_DEF_MAX_BATCH_TIME 15000 /* 15ms */
1887
1888/*
1889 * Minimum number of groups in a flexgroup before we separate out
1890 * directories into the first block group of a flexgroup
1891 */
1892#define EXT4_FLEX_SIZE_DIR_ALLOC_SCHEME 4
1893
1894/*
1895 * Structure of a directory entry
1896 */
1897#define EXT4_NAME_LEN 255
1898
1899struct ext4_dir_entry {
1900        __le32  inode;                  /* Inode number */
1901        __le16  rec_len;                /* Directory entry length */
1902        __le16  name_len;               /* Name length */
1903        char    name[EXT4_NAME_LEN];    /* File name */
1904};
1905
1906/*
1907 * The new version of the directory entry.  Since EXT4 structures are
1908 * stored in intel byte order, and the name_len field could never be
1909 * bigger than 255 chars, it's safe to reclaim the extra byte for the
1910 * file_type field.
1911 */
1912struct ext4_dir_entry_2 {
1913        __le32  inode;                  /* Inode number */
1914        __le16  rec_len;                /* Directory entry length */
1915        __u8    name_len;               /* Name length */
1916        __u8    file_type;
1917        char    name[EXT4_NAME_LEN];    /* File name */
1918};
1919
1920/*
1921 * This is a bogus directory entry at the end of each leaf block that
1922 * records checksums.
1923 */
1924struct ext4_dir_entry_tail {
1925        __le32  det_reserved_zero1;     /* Pretend to be unused */
1926        __le16  det_rec_len;            /* 12 */
1927        __u8    det_reserved_zero2;     /* Zero name length */
1928        __u8    det_reserved_ft;        /* 0xDE, fake file type */
1929        __le32  det_checksum;           /* crc32c(uuid+inum+dirblock) */
1930};
1931
/*
 * Pointer to the struct ext4_dir_entry_tail that occupies the final
 * sizeof(struct ext4_dir_entry_tail) bytes of a buffer of 'blocksize'
 * bytes starting at 'block'.
 */
1932#define EXT4_DIRENT_TAIL(block, blocksize) \
1933        ((struct ext4_dir_entry_tail *)(((void *)(block)) + \
1934                                        ((blocksize) - \
1935                                         sizeof(struct ext4_dir_entry_tail))))
1936
1937/*
1938 * Ext4 directory file types.  Only the low 3 bits are used.  The
1939 * other bits are reserved for now.
1940 */
1941#define EXT4_FT_UNKNOWN         0
1942#define EXT4_FT_REG_FILE        1
1943#define EXT4_FT_DIR             2
1944#define EXT4_FT_CHRDEV          3
1945#define EXT4_FT_BLKDEV          4
1946#define EXT4_FT_FIFO            5
1947#define EXT4_FT_SOCK            6
1948#define EXT4_FT_SYMLINK         7
1949
1950#define EXT4_FT_MAX             8
1951
1952#define EXT4_FT_DIR_CSUM        0xDE
1953
1954/*
1955 * EXT4_DIR_PAD defines the directory entries boundaries
1956 *
1957 * NOTE: It must be a multiple of 4
1958 */
1959#define EXT4_DIR_PAD                    4
/* Mask of the low bits cleared when rounding up to EXT4_DIR_PAD */
1960#define EXT4_DIR_ROUND                  (EXT4_DIR_PAD - 1)
/*
 * name_len plus 8 bytes, rounded up to a multiple of EXT4_DIR_PAD.  The 8
 * matches the fixed fields ahead of name[] in struct ext4_dir_entry_2
 * (inode 4 + rec_len 2 + name_len 1 + file_type 1).
 */
1961#define EXT4_DIR_REC_LEN(name_len)      (((name_len) + 8 + EXT4_DIR_ROUND) & \
1962                                         ~EXT4_DIR_ROUND)
/* 65535: the largest value that fits in 16 bits */
1963#define EXT4_MAX_REC_LEN                ((1<<16)-1)
1964
1965/*
1966 * If we ever get support for fs block sizes > page_size, we'll need
1967 * to remove the #if statements in the next two functions...
1968 */
1969static inline unsigned int
1970ext4_rec_len_from_disk(__le16 dlen, unsigned blocksize)
1971{
1972        unsigned len = le16_to_cpu(dlen);
1973
1974#if (PAGE_SIZE >= 65536)
1975        if (len == EXT4_MAX_REC_LEN || len == 0)
1976                return blocksize;
1977        return (len & 65532) | ((len & 3) << 16);
1978#else
1979        return len;
1980#endif
1981}
1982
1983static inline __le16 ext4_rec_len_to_disk(unsigned len, unsigned blocksize)
1984{
1985        if ((len > blocksize) || (blocksize > (1 << 18)) || (len & 3))
1986                BUG();
1987#if (PAGE_SIZE >= 65536)
1988        if (len < 65536)
1989                return cpu_to_le16(len);
1990        if (len == blocksize) {
1991                if (blocksize == 65536)
1992                        return cpu_to_le16(EXT4_MAX_REC_LEN);
1993                else
1994                        return cpu_to_le16(0);
1995        }
1996        return cpu_to_le16((len & 65532) | ((len >> 16) & 3));
1997#else
1998        return cpu_to_le16(len);
1999#endif
2000}
2001
/*
 * Hash Tree Directory indexing
 * (c) Daniel Phillips, 2001
 */

/* True when the fs has the dir_index feature and @dir has EXT4_INODE_INDEX set. */
#define is_dx(dir) \
	(ext4_has_feature_dir_index((dir)->i_sb) && \
	 ext4_test_inode_flag((dir), EXT4_INODE_INDEX))

/* True when @dir is not indexed and its link count has reached EXT4_LINK_MAX. */
#define EXT4_DIR_LINK_MAX(dir) \
	(!is_dx(dir) && (dir)->i_nlink >= EXT4_LINK_MAX)

/* True when @dir's link count is 1 or 2.  Note: @dir is evaluated more than once. */
#define EXT4_DIR_LINK_EMPTY(dir) \
	((dir)->i_nlink == 2 || (dir)->i_nlink == 1)
2011
/*
 * Legal values for the dx_root hash_version field.
 * Values 3-5 are the *_UNSIGNED counterparts of values 0-2.
 */
#define DX_HASH_LEGACY			0
#define DX_HASH_HALF_MD4		1
#define DX_HASH_TEA			2
#define DX_HASH_LEGACY_UNSIGNED		3
#define DX_HASH_HALF_MD4_UNSIGNED	4
#define DX_HASH_TEA_UNSIGNED		5
2020
2021static inline u32 ext4_chksum(struct ext4_sb_info *sbi, u32 crc,
2022                              const void *address, unsigned int length)
2023{
2024        struct {
2025                struct shash_desc shash;
2026                char ctx[4];
2027        } desc;
2028        int err;
2029
2030        BUG_ON(crypto_shash_descsize(sbi->s_chksum_driver)!=sizeof(desc.ctx));
2031
2032        desc.shash.tfm = sbi->s_chksum_driver;
2033        desc.shash.flags = 0;
2034        *(u32 *)desc.ctx = crc;
2035
2036        err = crypto_shash_update(&desc.shash, address, length);
2037        BUG_ON(err);
2038
2039        return *(u32 *)desc.ctx;
2040}
2041
2042#ifdef __KERNEL__
2043
2044/* hash info structure used by the directory hash */
2045struct dx_hash_info
2046{
2047        u32             hash;
2048        u32             minor_hash;
2049        int             hash_version;
2050        u32             *seed;
2051};
2052
2053
/*
 * 32 and 64 bit signed EOF for dx directories: the largest positive
 * value of a signed 32-bit and a signed 64-bit integer respectively.
 */
#define EXT4_HTREE_EOF_32BIT	((1UL  << 31) - 1)
#define EXT4_HTREE_EOF_64BIT	((1ULL << 63) - 1)

/*
 * Control parameters used by ext4_htree_next_block
 */
#define HASH_NB_ALWAYS		1
2063
2064struct ext4_filename {
2065        const struct qstr *usr_fname;
2066        struct fscrypt_str disk_name;
2067        struct dx_hash_info hinfo;
2068#ifdef CONFIG_EXT4_FS_ENCRYPTION
2069        struct fscrypt_str crypto_buf;
2070#endif
2071};
2072
2073#define fname_name(p) ((p)->disk_name.name)
2074#define fname_len(p)  ((p)->disk_name.len)
2075
2076/*
2077 * Describe an inode's exact location on disk and in memory
2078 */
2079struct ext4_iloc
2080{
2081        struct buffer_head *bh;
2082        unsigned long offset;
2083        ext4_group_t block_group;
2084};
2085
2086static inline struct ext4_inode *ext4_raw_inode(struct ext4_iloc *iloc)
2087{
2088        return (struct ext4_inode *) (iloc->bh->b_data + iloc->offset);
2089}
2090
2091/*
2092 * This structure is stuffed into the struct file's private_data field
2093 * for directories.  It is where we put information so that we can do
2094 * readdir operations in hash tree order.
2095 */
2096struct dir_private_info {
2097        struct rb_root  root;
2098        struct rb_node  *curr_node;
2099        struct fname    *extra_fname;
2100        loff_t          last_pos;
2101        __u32           curr_hash;
2102        __u32           curr_minor_hash;
2103        __u32           next_hash;
2104};
2105
2106/* calculate the first block number of the group */
2107static inline ext4_fsblk_t
2108ext4_group_first_block_no(struct super_block *sb, ext4_group_t group_no)
2109{
2110        return group_no * (ext4_fsblk_t)EXT4_BLOCKS_PER_GROUP(sb) +
2111                le32_to_cpu(EXT4_SB(sb)->s_es->s_first_data_block);
2112}
2113
/*
 * Special error return code only used by dx_probe() and its callers.
 * It is a negative value one short of -MAX_ERRNO.
 */
#define ERR_BAD_DX_DIR		(-(MAX_ERRNO - 1))
2118
/*
 * Timeout parameters and state flags for the lazy inode table
 * initialization thread.  The EXT4_LAZYINIT_* values are distinct bits.
 */
#define EXT4_DEF_LI_WAIT_MULT		10
#define EXT4_DEF_LI_MAX_START_DELAY	5
#define EXT4_LAZYINIT_QUIT		0x0001
#define EXT4_LAZYINIT_RUNNING		0x0002
2126
2127/*
2128 * Lazy inode table initialization info
2129 */
2130struct ext4_lazy_init {
2131        unsigned long           li_state;
2132        struct list_head        li_request_list;
2133        struct mutex            li_list_mtx;
2134};
2135
2136struct ext4_li_request {
2137        struct super_block      *lr_super;
2138        struct ext4_sb_info     *lr_sbi;
2139        ext4_group_t            lr_next_group;
2140        struct list_head        lr_request;
2141        unsigned long           lr_next_sched;
2142        unsigned long           lr_timeout;
2143};
2144
2145struct ext4_features {
2146        struct kobject f_kobj;
2147        struct completion f_kobj_unregister;
2148};
2149
/*
 * This structure will be used for multiple mount protection. It will be
 * written into the block number saved in the s_mmp_block field in the
 * superblock. Programs that check MMP should assume that if
 * SEQ_FSCK (or any unknown code above SEQ_MAX) is present then it is NOT safe
 * to use the filesystem, regardless of how old the timestamp is.
 *
 * EXT4_MMP_SEQ_MAX is exactly one below EXT4_MMP_SEQ_FSCK.
 */
#define EXT4_MMP_MAGIC		0x004D4D50U	/* ASCII for MMP */
#define EXT4_MMP_SEQ_CLEAN	0xFF4D4D50U	/* mmp_seq value for clean unmount */
#define EXT4_MMP_SEQ_FSCK	0xE24D4D50U	/* mmp_seq value when being fscked */
#define EXT4_MMP_SEQ_MAX	0xE24D4D4FU	/* maximum valid mmp_seq value */
2161
2162struct mmp_struct {
2163        __le32  mmp_magic;              /* Magic number for MMP */
2164        __le32  mmp_seq;                /* Sequence no. updated periodically */
2165
2166        /*
2167         * mmp_time, mmp_nodename & mmp_bdevname are only used for information
2168         * purposes and do not affect the correctness of the algorithm
2169         */
2170        __le64  mmp_time;               /* Time last updated */
2171        char    mmp_nodename[64];       /* Node which last updated MMP block */
2172        char    mmp_bdevname[32];       /* Bdev which last updated MMP block */
2173
2174        /*
2175         * mmp_check_interval is used to verify if the MMP block has been
2176         * updated on the block device. The value is updated based on the
2177         * maximum time to write the MMP block during an update cycle.
2178         */
2179        __le16  mmp_check_interval;
2180
2181        __le16  mmp_pad1;
2182        __le32  mmp_pad2[226];
2183        __le32  mmp_checksum;           /* crc32c(uuid+mmp_block) */
2184};
2185
/* arguments passed to the mmp thread */
struct mmpd_data {
	struct buffer_head	*bh;	/* bh from initial read_mmp_block() */
	struct super_block	*sb;	/* super block of the fs */
};
2191
/*
 * Check interval multiplier
 * The MMP block is written every update interval and initially checked every
 * update interval x the multiplier (the value is then adapted based on the
 * write latency). The reason is that writes can be delayed under load and we
 * don't want readers to incorrectly assume that the filesystem is no longer
 * in use.
 */
#define EXT4_MMP_CHECK_MULT		2UL

/*
 * Minimum interval for MMP checking in seconds.
 */
#define EXT4_MMP_MIN_CHECK_INTERVAL	5UL

/*
 * Maximum interval for MMP checking in seconds.
 */
#define EXT4_MMP_MAX_CHECK_INTERVAL	300UL
2211
2212/*
2213 * Function prototypes
2214 */
2215
/*
 * Ok, these declarations are also in <linux/kernel.h> but none of the
 * ext4 source programs needs to include it so they are duplicated here.
 *
 * NORET_TYPE expands to nothing, ATTRIB_NORET to the noreturn attribute,
 * and NORET_AND to "noreturn," for use inside an attribute list.
 */
#define NORET_TYPE	/**/
#define ATTRIB_NORET	__attribute__((noreturn))
#define NORET_AND	noreturn,
2223
2224/* bitmap.c */
2225extern unsigned int ext4_count_free(char *bitmap, unsigned numchars);
2226void ext4_inode_bitmap_csum_set(struct super_block *sb, ext4_group_t group,
2227                                struct ext4_group_desc *gdp,
2228                                struct buffer_head *bh, int sz);
2229int ext4_inode_bitmap_csum_verify(struct super_block *sb, ext4_group_t group,
2230                                  struct ext4_group_desc *gdp,
2231                                  struct buffer_head *bh, int sz);
2232void ext4_block_bitmap_csum_set(struct super_block *sb, ext4_group_t group,
2233                                struct ext4_group_desc *gdp,
2234                                struct buffer_head *bh);
2235int ext4_block_bitmap_csum_verify(struct super_block *sb, ext4_group_t group,
2236                                  struct ext4_group_desc *gdp,
2237                                  struct buffer_head *bh);
2238
2239/* balloc.c */
2240extern void ext4_get_group_no_and_offset(struct super_block *sb,
2241                                         ext4_fsblk_t blocknr,
2242                                         ext4_group_t *blockgrpp,
2243                                         ext4_grpblk_t *offsetp);
2244extern ext4_group_t ext4_get_group_number(struct super_block *sb,
2245                                          ext4_fsblk_t block);
2246
2247extern unsigned int ext4_block_group(struct super_block *sb,
2248                        ext4_fsblk_t blocknr);
2249extern ext4_grpblk_t ext4_block_group_offset(struct super_block *sb,
2250                        ext4_fsblk_t blocknr);
2251extern int ext4_bg_has_super(struct super_block *sb, ext4_group_t group);
2252extern unsigned long ext4_bg_num_gdb(struct super_block *sb,
2253                        ext4_group_t group);
2254extern ext4_fsblk_t ext4_new_meta_blocks(handle_t *handle, struct inode *inode,
2255                                         ext4_fsblk_t goal,
2256                                         unsigned int flags,
2257                                         unsigned long *count,
2258                                         int *errp);
2259extern int ext4_claim_free_clusters(struct ext4_sb_info *sbi,
2260                                    s64 nclusters, unsigned int flags);
2261extern ext4_fsblk_t ext4_count_free_clusters(struct super_block *);
2262extern void ext4_check_blocks_bitmap(struct super_block *);
2263extern struct ext4_group_desc * ext4_get_group_desc(struct super_block * sb,
2264                                                    ext4_group_t block_group,
2265                                                    struct buffer_head ** bh);
2266extern int ext4_should_retry_alloc(struct super_block *sb, int *retries);
2267
2268extern struct buffer_head *ext4_read_block_bitmap_nowait(struct super_block *sb,
2269                                                ext4_group_t block_group);
2270extern int ext4_wait_block_bitmap(struct super_block *sb,
2271                                  ext4_group_t block_group,
2272                                  struct buffer_head *bh);
2273extern struct buffer_head *ext4_read_block_bitmap(struct super_block *sb,
2274                                                  ext4_group_t block_group);
2275extern unsigned ext4_free_clusters_after_init(struct super_block *sb,
2276                                              ext4_group_t block_group,
2277                                              struct ext4_group_desc *gdp);
2278ext4_fsblk_t ext4_inode_to_goal_block(struct inode *);
2279
/* Report whether @sb has the encrypt feature, as given by ext4_has_feature_encrypt(). */
static inline int ext4_sb_has_crypto(struct super_block *sb)
{
	int has_encrypt = ext4_has_feature_encrypt(sb);

	return has_encrypt;
}
2284
2285static inline bool ext4_encrypted_inode(struct inode *inode)
2286{
2287        return ext4_test_inode_flag(inode, EXT4_INODE_ENCRYPT);
2288}
2289
2290#ifdef CONFIG_EXT4_FS_ENCRYPTION
2291static inline int ext4_fname_setup_filename(struct inode *dir,
2292                        const struct qstr *iname,
2293                        int lookup, struct ext4_filename *fname)
2294{
2295        struct fscrypt_name name;
2296        int err;
2297
2298        memset(fname, 0, sizeof(struct ext4_filename));
2299
2300        err = fscrypt_setup_filename(dir, iname, lookup, &name);
2301
2302        fname->usr_fname = name.usr_fname;
2303        fname->disk_name = name.disk_name;
2304        fname->hinfo.hash = name.hash;
2305        fname->hinfo.minor_hash = name.minor_hash;
2306        fname->crypto_buf = name.crypto_buf;
2307        return err;
2308}
2309
2310static inline void ext4_fname_free_filename(struct ext4_filename *fname)
2311{
2312        struct fscrypt_name name;
2313
2314        name.crypto_buf = fname->crypto_buf;
2315        fscrypt_free_filename(&name);
2316
2317        fname->crypto_buf.name = NULL;
2318        fname->usr_fname = NULL;
2319        fname->disk_name.name = NULL;
2320}
2321#else
2322static inline int ext4_fname_setup_filename(struct inode *dir,
2323                const struct qstr *iname,
2324                int lookup, struct ext4_filename *fname)
2325{
2326        fname->usr_fname = iname;
2327        fname->disk_name.name = (unsigned char *) iname->name;
2328        fname->disk_name.len = iname->len;
2329        return 0;
2330}
/* Nothing to release in a build without encryption support. */
static inline void ext4_fname_free_filename(struct ext4_filename *fname)
{
}
2332
/*
 * Build without encryption support: fscrypt_set_d_op() expands to nothing
 * (its argument is not evaluated) and every other fscrypt_* entry point is
 * redirected to the fscrypt_notsupp_* function of the same name.
 */
#define fscrypt_set_d_op(i)

#define fscrypt_get_ctx			fscrypt_notsupp_get_ctx
#define fscrypt_release_ctx		fscrypt_notsupp_release_ctx
#define fscrypt_encrypt_page		fscrypt_notsupp_encrypt_page
#define fscrypt_decrypt_page		fscrypt_notsupp_decrypt_page
#define fscrypt_decrypt_bio_pages	fscrypt_notsupp_decrypt_bio_pages
#define fscrypt_pullback_bio_page	fscrypt_notsupp_pullback_bio_page
#define fscrypt_restore_control_page	fscrypt_notsupp_restore_control_page
#define fscrypt_zeroout_range		fscrypt_notsupp_zeroout_range
#define fscrypt_process_policy		fscrypt_notsupp_process_policy
#define fscrypt_get_policy		fscrypt_notsupp_get_policy
#define fscrypt_has_permitted_context	fscrypt_notsupp_has_permitted_context
#define fscrypt_inherit_context		fscrypt_notsupp_inherit_context
#define fscrypt_get_encryption_info	fscrypt_notsupp_get_encryption_info
#define fscrypt_put_encryption_info	fscrypt_notsupp_put_encryption_info
#define fscrypt_setup_filename		fscrypt_notsupp_setup_filename
#define fscrypt_free_filename		fscrypt_notsupp_free_filename
#define fscrypt_fname_encrypted_size	fscrypt_notsupp_fname_encrypted_size
#define fscrypt_fname_alloc_buffer	fscrypt_notsupp_fname_alloc_buffer
#define fscrypt_fname_free_buffer	fscrypt_notsupp_fname_free_buffer
#define fscrypt_fname_disk_to_usr	fscrypt_notsupp_fname_disk_to_usr
#define fscrypt_fname_usr_to_disk	fscrypt_notsupp_fname_usr_to_disk
2355#endif
2356
2357/* dir.c */
extern int __ext4_check_dir_entry(const char *function, unsigned int line,
				  struct inode *dir, struct file *filp,
				  struct ext4_dir_entry_2 *de,
				  struct buffer_head *bh, char *buf, int size,
				  unsigned int offset);

/*
 * Call __ext4_check_dir_entry() with the caller's __func__ and __LINE__;
 * the result is wrapped in unlikely().
 */
#define ext4_check_dir_entry(dir, filp, de, bh, buf, size, offset)	\
	unlikely(__ext4_check_dir_entry(__func__, __LINE__,		\
					(dir), (filp), (de), (bh),	\
					(buf), (size), (offset)))
2366extern int ext4_htree_store_dirent(struct file *dir_file, __u32 hash,
2367                                __u32 minor_hash,
2368                                struct ext4_dir_entry_2 *dirent,
2369                                struct fscrypt_str *ent_name);
2370extern void ext4_htree_free_dir_info(struct dir_private_info *p);
2371extern int ext4_find_dest_de(struct inode *dir, struct inode *inode,
2372                             struct buffer_head *bh,
2373                             void *buf, int buf_size,
2374                             struct ext4_filename *fname,
2375                             struct ext4_dir_entry_2 **dest_de);
2376int ext4_insert_dentry(struct inode *dir,
2377                       struct inode *inode,
2378                       struct ext4_dir_entry_2 *de,
2379                       int buf_size,
2380                       struct ext4_filename *fname);
2381static inline void ext4_update_dx_flag(struct inode *inode)
2382{
2383        if (!ext4_has_feature_dir_index(inode->i_sb))
2384                ext4_clear_inode_flag(inode, EXT4_INODE_INDEX);
2385}
2386static unsigned char ext4_filetype_table[] = {
2387        DT_UNKNOWN, DT_REG, DT_DIR, DT_CHR, DT_BLK, DT_FIFO, DT_SOCK, DT_LNK
2388};
2389
2390static inline  unsigned char get_dtype(struct super_block *sb, int filetype)
2391{
2392        if (!ext4_has_feature_filetype(sb) || filetype >= EXT4_FT_MAX)
2393                return DT_UNKNOWN;
2394
2395        return ext4_filetype_table[filetype];
2396}
2397extern int ext4_check_all_de(struct inode *dir, struct buffer_head *bh,
2398                             void *buf, int buf_size);
2399
2400/* fsync.c */
2401extern int ext4_sync_file(struct file *, loff_t, loff_t, int);
2402
2403/* hash.c */
2404extern int ext4fs_dirhash(const char *name, int len, struct
2405                          dx_hash_info *hinfo);
2406
2407/* ialloc.c */
2408extern struct inode *__ext4_new_inode(handle_t *, struct inode *, umode_t,
2409                                      const struct qstr *qstr, __u32 goal,
2410                                      uid_t *owner, int handle_type,
2411                                      unsigned int line_no, int nblocks);
2412
2413#define ext4_new_inode(handle, dir, mode, qstr, goal, owner) \
2414        __ext4_new_inode((handle), (dir), (mode), (qstr), (goal), (owner), \
2415                         0, 0, 0)
2416#define ext4_new_inode_start_handle(dir, mode, qstr, goal, owner, \
2417                                    type, nblocks)                  \
2418        __ext4_new_inode(NULL, (dir), (mode), (qstr), (goal), (owner), \
2419                         (type), __LINE__, (nblocks))
2420
2421
2422extern void ext4_free_inode(handle_t *, struct inode *);
2423extern struct inode * ext4_orphan_get(struct super_block *, unsigned long);
2424extern unsigned long ext4_count_free_inodes(struct super_block *);
2425extern unsigned long ext4_count_dirs(struct super_block *);
2426extern void ext4_check_inodes_bitmap(struct super_block *);
2427extern void ext4_mark_bitmap_end(int start_bit, int end_bit, char *bitmap);
2428extern int ext4_init_inode_table(struct super_block *sb,
2429                                 ext4_group_t group, int barrier);
2430extern void ext4_end_bitmap_read(struct buffer_head *bh, int uptodate);
2431
2432/* mballoc.c */
2433extern const struct file_operations ext4_seq_mb_groups_fops;
2434extern long ext4_mb_stats;
2435extern long ext4_mb_max_to_scan;
2436extern int ext4_mb_init(struct super_block *);
2437extern int ext4_mb_release(struct super_block *);
2438extern ext4_fsblk_t ext4_mb_new_blocks(handle_t *,
2439                                struct ext4_allocation_request *, int *);
2440extern int ext4_mb_reserve_blocks(struct super_block *, int);
2441extern void ext4_discard_preallocations(struct inode *);
2442extern int __init ext4_init_mballoc(void);
2443extern void ext4_exit_mballoc(void);
2444extern void ext4_free_blocks(handle_t *handle, struct inode *inode,
2445                             struct buffer_head *bh, ext4_fsblk_t block,
2446                             unsigned long count, int flags);
2447extern int ext4_mb_alloc_groupinfo(struct super_block *sb,
2448                                   ext4_group_t ngroups);
2449extern int ext4_mb_add_groupinfo(struct super_block *sb,
2450                ext4_group_t i, struct ext4_group_desc *desc);
2451extern int ext4_group_add_blocks(handle_t *handle, struct super_block *sb,
2452                                ext4_fsblk_t block, unsigned long count);
2453extern int ext4_trim_fs(struct super_block *, struct fstrim_range *);
2454
2455/* inode.c */
2456int ext4_inode_is_fast_symlink(struct inode *inode);
2457struct buffer_head *ext4_getblk(handle_t *, struct inode *, ext4_lblk_t, int);
2458struct buffer_head *ext4_bread(handle_t *, struct inode *, ext4_lblk_t, int);
2459int ext4_get_block_unwritten(struct inode *inode, sector_t iblock,
2460                             struct buffer_head *bh_result, int create);
2461int ext4_dax_get_block(struct inode *inode, sector_t iblock,
2462                       struct buffer_head *bh_result, int create);
2463int ext4_get_block(struct inode *inode, sector_t iblock,
2464                   struct buffer_head *bh_result, int create);
2465int ext4_dio_get_block(struct inode *inode, sector_t iblock,
2466                       struct buffer_head *bh_result, int create);
2467int ext4_da_get_block_prep(struct inode *inode, sector_t iblock,
2468                           struct buffer_head *bh, int create);
2469int ext4_walk_page_buffers(handle_t *handle,
2470                           struct buffer_head *head,
2471                           unsigned from,
2472                           unsigned to,
2473                           int *partial,
2474                           int (*fn)(handle_t *handle,
2475                                     struct buffer_head *bh));
2476int do_journal_get_write_access(handle_t *handle,
2477                                struct buffer_head *bh);
/* NOTE(review): meaning is not visible here -- confirm against the users in inode.c. */
#define FALL_BACK_TO_NONDELALLOC	1
#define CONVERT_INLINE_DATA		2
2480
2481extern struct inode *ext4_iget(struct super_block *, unsigned long);
2482extern struct inode *ext4_iget_normal(struct super_block *, unsigned long);
2483extern int  ext4_write_inode(struct inode *, struct writeback_control *);
2484extern int  ext4_setattr(struct dentry *, struct iattr *);
2485extern int  ext4_getattr(struct vfsmount *mnt, struct dentry *dentry,
2486                                struct kstat *stat);
2487extern void ext4_evict_inode(struct inode *);
2488extern void ext4_clear_inode(struct inode *);
2489extern int  ext4_sync_inode(handle_t *, struct inode *);
2490extern void ext4_dirty_inode(struct inode *, int);
2491extern int ext4_change_inode_journal_flag(struct inode *, int);
2492extern int ext4_get_inode_loc(struct inode *, struct ext4_iloc *);
2493extern int ext4_inode_attach_jinode(struct inode *inode);
2494extern int ext4_can_truncate(struct inode *inode);
2495extern void ext4_truncate(struct inode *);
2496extern int ext4_punch_hole(struct inode *inode, loff_t offset, loff_t length);
2497extern int ext4_truncate_restart_trans(handle_t *, struct inode *, int nblocks);
2498extern void ext4_set_inode_flags(struct inode *);
2499extern void ext4_get_inode_flags(struct ext4_inode_info *);
2500extern int ext4_alloc_da_blocks(struct inode *inode);
2501extern void ext4_set_aops(struct inode *inode);
2502extern int ext4_writepage_trans_blocks(struct inode *);
2503extern int ext4_chunk_trans_blocks(struct inode *, int nrblocks);
2504extern int ext4_zero_partial_blocks(handle_t *handle, struct inode *inode,
2505                             loff_t lstart, loff_t lend);
2506extern int ext4_page_mkwrite(struct vm_area_struct *vma, struct vm_fault *vmf);
2507extern int ext4_filemap_fault(struct vm_area_struct *vma, struct vm_fault *vmf);
2508extern qsize_t *ext4_get_reserved_space(struct inode *inode);
2509extern int ext4_get_projid(struct inode *inode, kprojid_t *projid);
2510extern void ext4_da_update_reserve_space(struct inode *inode,
2511                                        int used, int quota_claim);
2512extern int ext4_issue_zeroout(struct inode *inode, ext4_lblk_t lblk,
2513                              ext4_fsblk_t pblk, ext4_lblk_t len);
2514extern int ext4_get_next_extent(struct inode *inode, ext4_lblk_t lblk,
2515                                unsigned int map_len,
2516                                struct extent_status *result);
2517
2518/* indirect.c */
2519extern int ext4_ind_map_blocks(handle_t *handle, struct inode *inode,
2520                                struct ext4_map_blocks *map, int flags);
2521extern int ext4_ind_calc_metadata_amount(struct inode *inode, sector_t lblock);
2522extern int ext4_ind_trans_blocks(struct inode *inode, int nrblocks);
2523extern void ext4_ind_truncate(handle_t *, struct inode *inode);
2524extern int ext4_ind_remove_space(handle_t *handle, struct inode *inode,
2525                                 ext4_lblk_t start, ext4_lblk_t end);
2526
2527/* ioctl.c */
2528extern long ext4_ioctl(struct file *, unsigned int, unsigned long);
2529extern long ext4_compat_ioctl(struct file *, unsigned int, unsigned long);
2530
2531/* migrate.c */
2532extern int ext4_ext_migrate(struct inode *);
2533extern int ext4_ind_migrate(struct inode *inode);
2534
2535/* namei.c */
2536extern int ext4_dirent_csum_verify(struct inode *inode,
2537                                   struct ext4_dir_entry *dirent);
2538extern int ext4_orphan_add(handle_t *, struct inode *);
2539extern int ext4_orphan_del(handle_t *, struct inode *);
2540extern int ext4_htree_fill_tree(struct file *dir_file, __u32 start_hash,
2541                                __u32 start_minor_hash, __u32 *next_hash);
2542extern int ext4_search_dir(struct buffer_head *bh,
2543                           char *search_buf,
2544                           int buf_size,
2545                           struct inode *dir,
2546                           struct ext4_filename *fname,
2547                           const struct qstr *d_name,
2548                           unsigned int offset,
2549                           struct ext4_dir_entry_2 **res_dir);
2550extern int ext4_generic_delete_entry(handle_t *handle,
2551                                     struct inode *dir,
2552                                     struct ext4_dir_entry_2 *de_del,
2553                                     struct buffer_head *bh,
2554                                     void *entry_buf,
2555                                     int buf_size,
2556                                     int csum_size);
2557extern bool ext4_empty_dir(struct inode *inode);
2558
2559/* resize.c */
2560extern int ext4_group_add(struct super_block *sb,
2561                                struct ext4_new_group_data *input);
2562extern int ext4_group_extend(struct super_block *sb,
2563                                struct ext4_super_block *es,
2564                                ext4_fsblk_t n_blocks_count);
2565extern int ext4_resize_fs(struct super_block *sb, ext4_fsblk_t n_blocks_count);
2566
2567/* super.c */
2568extern int ext4_seq_options_show(struct seq_file *seq, void *offset);
2569extern int ext4_calculate_overhead(struct super_block *sb);
2570extern void ext4_superblock_csum_set(struct super_block *sb);
2571extern void *ext4_kvmalloc(size_t size, gfp_t flags);
2572extern void *ext4_kvzalloc(size_t size, gfp_t flags);
2573extern int ext4_alloc_flex_bg_array(struct super_block *sb,
2574                                    ext4_group_t ngroup);
2575extern const char *ext4_decode_error(struct super_block *sb, int errno,
2576                                     char nbuf[16]);
2577
2578extern __printf(4, 5)
2579void __ext4_error(struct super_block *, const char *, unsigned int,
2580                  const char *, ...);
2581extern __printf(5, 6)
2582void __ext4_error_inode(struct inode *, const char *, unsigned int, ext4_fsblk_t,
2583                      const char *, ...);
2584extern __printf(5, 6)
2585void __ext4_error_file(struct file *, const char *, unsigned int, ext4_fsblk_t,
2586                     const char *, ...);
2587extern void __ext4_std_error(struct super_block *, const char *,
2588                             unsigned int, int);
2589extern __printf(4, 5)
2590void __ext4_abort(struct super_block *, const char *, unsigned int,
2591                  const char *, ...);
2592extern __printf(4, 5)
2593void __ext4_warning(struct super_block *, const char *, unsigned int,
2594                    const char *, ...);
2595extern __printf(4, 5)
2596void __ext4_warning_inode(const struct inode *inode, const char *function,
2597                          unsigned int line, const char *fmt, ...);
2598extern __printf(3, 4)
2599void __ext4_msg(struct super_block *, const char *, const char *, ...);
2600extern void __dump_mmp_msg(struct super_block *, struct mmp_struct *mmp,
2601                           const char *, unsigned int, const char *);
2602extern __printf(7, 8)
2603void __ext4_grp_locked_error(const char *, unsigned int,
2604                             struct super_block *, ext4_group_t,
2605                             unsigned long, ext4_fsblk_t,
2606                             const char *, ...);
2607
/*
 * Convenience wrappers that supply the caller's __func__ and __LINE__.
 * EXT4_ERROR_INODE reports block 0; the other two take the block number
 * from the caller.
 */
#define EXT4_ERROR_INODE(inode, fmt, ...)				\
	ext4_error_inode((inode), __func__, __LINE__, 0, (fmt),	\
			 ##__VA_ARGS__)

#define EXT4_ERROR_INODE_BLOCK(inode, block, fmt, ...)			\
	ext4_error_inode((inode), __func__, __LINE__, (block), (fmt),	\
			 ##__VA_ARGS__)

#define EXT4_ERROR_FILE(file, block, fmt, ...)				\
	ext4_error_file((file), __func__, __LINE__, (block), (fmt),	\
			##__VA_ARGS__)
2616
2617#ifdef CONFIG_PRINTK
2618
/*
 * CONFIG_PRINTK variants: forward the format string and its arguments to
 * the __ext4_* reporting functions.  Except for ext4_error_inode() and
 * ext4_error_file(), which take func/line from their caller, and
 * ext4_msg(), which takes neither, each wrapper adds __func__ and
 * __LINE__ itself.
 */
#define ext4_error_inode(inode, func, line, block, fmt, ...)		\
	__ext4_error_inode(inode, func, line, block, fmt, ##__VA_ARGS__)

#define ext4_error_file(file, func, line, block, fmt, ...)		\
	__ext4_error_file(file, func, line, block, fmt, ##__VA_ARGS__)

#define ext4_error(sb, fmt, ...)					\
	__ext4_error(sb, __func__, __LINE__, fmt, ##__VA_ARGS__)

#define ext4_abort(sb, fmt, ...)					\
	__ext4_abort(sb, __func__, __LINE__, fmt, ##__VA_ARGS__)

#define ext4_warning(sb, fmt, ...)					\
	__ext4_warning(sb, __func__, __LINE__, fmt, ##__VA_ARGS__)

#define ext4_warning_inode(inode, fmt, ...)				\
	__ext4_warning_inode(inode, __func__, __LINE__, fmt, ##__VA_ARGS__)

#define ext4_msg(sb, level, fmt, ...)					\
	__ext4_msg(sb, level, fmt, ##__VA_ARGS__)

#define dump_mmp_msg(sb, mmp, msg)					\
	__dump_mmp_msg(sb, mmp, __func__, __LINE__, msg)

#define ext4_grp_locked_error(sb, grp, ino, block, fmt, ...)		\
	__ext4_grp_locked_error(__func__, __LINE__, sb, grp, ino, block, \
				fmt, ##__VA_ARGS__)
2638
2639#else
2640
/*
 * !CONFIG_PRINTK variants: the format and its arguments go to no_printk(),
 * and the __ext4_* function is still called, but with "" for the function
 * name, 0 for the line and " " for the format.  ext4_msg() also replaces
 * its level argument with "", and dump_mmp_msg() passes "" as the message.
 */
#define ext4_error_inode(inode, func, line, block, fmt, ...)		\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_error_inode(inode, "", 0, block, " ");			\
} while (0)

#define ext4_error_file(file, func, line, block, fmt, ...)		\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_error_file(file, "", 0, block, " ");			\
} while (0)

#define ext4_error(sb, fmt, ...)					\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_error(sb, "", 0, " ");					\
} while (0)

#define ext4_abort(sb, fmt, ...)					\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_abort(sb, "", 0, " ");					\
} while (0)

#define ext4_warning(sb, fmt, ...)					\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_warning(sb, "", 0, " ");					\
} while (0)

#define ext4_warning_inode(inode, fmt, ...)				\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_warning_inode(inode, "", 0, " ");			\
} while (0)

#define ext4_msg(sb, level, fmt, ...)					\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_msg(sb, "", " ");					\
} while (0)

#define dump_mmp_msg(sb, mmp, msg)					\
	__dump_mmp_msg(sb, mmp, "", 0, "")

#define ext4_grp_locked_error(sb, grp, ino, block, fmt, ...)		\
do {									\
	no_printk(fmt, ##__VA_ARGS__);					\
	__ext4_grp_locked_error("", 0, sb, grp, ino, block, " ");	\
} while (0)
2683
2684#endif
2685
2686extern void ext4_update_dynamic_rev(struct super_block *sb);
2687extern int ext4_update_compat_feature(handle_t *handle, struct super_block *sb,
2688                                        __u32 compat);
2689extern int ext4_update_rocompat_feature(handle_t *handle,
2690                                        struct super_block *sb, __u32 rocompat);
2691extern int ext4_update_incompat_feature(handle_t *handle,
2692                                        struct super_block *sb, __u32 incompat);
2693extern ext4_fsblk_t ext4_block_bitmap(struct super_block *sb,
2694                                      struct ext4_group_desc *bg);
2695extern ext4_fsblk_t ext4_inode_bitmap(struct super_block *sb,
2696                                      struct ext4_group_desc *bg);
2697extern ext4_fsblk_t ext4_inode_table(struct super_block *sb,
2698                                     struct ext4_group_desc *bg);
2699extern __u32 ext4_free_group_clusters(struct super_block *sb,
2700                                      struct ext4_group_desc *bg);
2701extern __u32 ext4_free_inodes_count(struct super_block *sb,
2702                                 struct ext4_group_desc *bg);
2703extern __u32 ext4_used_dirs_count(struct super_block *sb,
2704                                struct ext4_group_desc *bg);
2705extern __u32 ext4_itable_unused_count(struct super_block *sb,
2706                                   struct ext4_group_desc *bg);
2707extern void ext4_block_bitmap_set(struct super_block *sb,
2708                                  struct ext4_group_desc *bg, ext4_fsblk_t blk);
2709extern void ext4_inode_bitmap_set(struct super_block *sb,
2710                                  struct ext4_group_desc *bg, ext4_fsblk_t blk);
2711extern void ext4_inode_table_set(struct super_block *sb,
2712                                 struct ext4_group_desc *bg, ext4_fsblk_t blk);
2713extern void ext4_free_group_clusters_set(struct super_block *sb,
2714                                         struct ext4_group_desc *bg,
2715                                         __u32 count);
2716extern void ext4_free_inodes_set(struct super_block *sb,
2717                                struct ext4_group_desc *bg, __u32 count);
2718extern void ext4_used_dirs_set(struct super_block *sb,
2719                                struct ext4_group_desc *bg, __u32 count);
2720extern void ext4_itable_unused_set(struct super_block *sb,
2721                                   struct ext4_group_desc *bg, __u32 count);
2722extern int ext4_group_desc_csum_verify(struct super_block *sb, __u32 group,
2723                                       struct ext4_group_desc *gdp);
2724extern void ext4_group_desc_csum_set(struct super_block *sb, __u32 group,
2725                                     struct ext4_group_desc *gdp);
2726extern int ext4_register_li_request(struct super_block *sb,
2727                                    ext4_group_t first_not_zeroed);
2728
2729static inline int ext4_has_group_desc_csum(struct super_block *sb)
2730{
2731        return ext4_has_feature_gdt_csum(sb) ||
2732               EXT4_SB(sb)->s_chksum_driver != NULL;
2733}
2734
2735static inline int ext4_has_metadata_csum(struct super_block *sb)
2736{
2737        WARN_ON_ONCE(ext4_has_feature_metadata_csum(sb) &&
2738                     !EXT4_SB(sb)->s_chksum_driver);
2739
2740        return (EXT4_SB(sb)->s_chksum_driver != NULL);
2741}
2742static inline ext4_fsblk_t ext4_blocks_count(struct ext4_super_block *es)
2743{
2744        return ((ext4_fsblk_t)le32_to_cpu(es->s_blocks_count_hi) << 32) |
2745                le32_to_cpu(es->s_blocks_count_lo);
2746}
2747
2748static inline ext4_fsblk_t ext4_r_blocks_count(struct ext4_super_block *es)
2749{
2750        return ((ext4_fsblk_t)le32_to_cpu(es->s_r_blocks_count_hi) << 32) |
2751                le32_to_cpu(es->s_r_blocks_count_lo);
2752}
2753
2754static inline ext4_fsblk_t ext4_free_blocks_count(struct ext4_super_block *es)
2755{
2756        return ((ext4_fsblk_t)le32_to_cpu(es->s_free_blocks_count_hi) << 32) |
2757                le32_to_cpu(es->s_free_blocks_count_lo);
2758}
2759
2760static inline void ext4_blocks_count_set(struct ext4_super_block *es,
2761                                         ext4_fsblk_t blk)
2762{
2763        es->s_blocks_count_lo = cpu_to_le32((u32)blk);
2764        es->s_blocks_count_hi = cpu_to_le32(blk >> 32);
2765}
2766
2767static inline void ext4_free_blocks_count_set(struct ext4_super_block *es,
2768                                              ext4_fsblk_t blk)
2769{
2770        es->s_free_blocks_count_lo = cpu_to_le32((u32)blk);
2771        es->s_free_blocks_count_hi = cpu_to_le32(blk >> 32);
2772}
2773
2774static inline void ext4_r_blocks_count_set(struct ext4_super_block *es,
2775                                           ext4_fsblk_t blk)
2776{
2777        es->s_r_blocks_count_lo = cpu_to_le32((u32)blk);
2778        es->s_r_blocks_count_hi = cpu_to_le32(blk >> 32);
2779}
2780
2781static inline loff_t ext4_isize(struct ext4_inode *raw_inode)
2782{
2783        if (S_ISREG(le16_to_cpu(raw_inode->i_mode)))
2784                return ((loff_t)le32_to_cpu(raw_inode->i_size_high) << 32) |
2785                        le32_to_cpu(raw_inode->i_size_lo);
2786        else
2787                return (loff_t) le32_to_cpu(raw_inode->i_size_lo);
2788}
2789
2790static inline void ext4_isize_set(struct ext4_inode *raw_inode, loff_t i_size)
2791{
2792        raw_inode->i_size_lo = cpu_to_le32(i_size);
2793        raw_inode->i_size_high = cpu_to_le32(i_size >> 32);
2794}
2795
2796static inline
2797struct ext4_group_info *ext4_get_group_info(struct super_block *sb,
2798                                            ext4_group_t group)
2799{
2800         struct ext4_group_info ***grp_info;
2801         long indexv, indexh;
2802         BUG_ON(group >= EXT4_SB(sb)->s_groups_count);
2803         grp_info = EXT4_SB(sb)->s_group_info;
2804         indexv = group >> (EXT4_DESC_PER_BLOCK_BITS(sb));
2805         indexh = group & ((EXT4_DESC_PER_BLOCK(sb)) - 1);
2806         return grp_info[indexv][indexh];
2807}
2808
2809/*
2810 * Reading s_groups_count requires using smp_rmb() afterwards.  See
2811 * the locking protocol documented in the comments of ext4_group_add()
2812 * in resize.c
2813 */
2814static inline ext4_group_t ext4_get_groups_count(struct super_block *sb)
2815{
2816        ext4_group_t    ngroups = EXT4_SB(sb)->s_groups_count;
2817
2818        smp_rmb();
2819        return ngroups;
2820}
2821
2822static inline ext4_group_t ext4_flex_group(struct ext4_sb_info *sbi,
2823                                             ext4_group_t block_group)
2824{
2825        return block_group >> sbi->s_log_groups_per_flex;
2826}
2827
2828static inline unsigned int ext4_flex_bg_size(struct ext4_sb_info *sbi)
2829{
2830        return 1 << sbi->s_log_groups_per_flex;
2831}
2832
/*
 * Report @errno through __ext4_std_error() when it is nonzero, tagged
 * with the caller's function name and line number.
 *
 * @errno is evaluated exactly once, so an argument with side effects
 * (a function call, an increment) is not repeated.
 */
#define ext4_std_error(sb, errno)					\
do {									\
	__typeof__(errno) __ext4_std_err = (errno);			\
									\
	if (__ext4_std_err)						\
		__ext4_std_error((sb), __func__, __LINE__,		\
				 __ext4_std_err);			\
} while (0)
2838
#ifndef CONFIG_SMP
#define EXT4_FREECLUSTERS_WATERMARK 0
#else
/*
 * Every CPU may hold up to percpu_counter_batch clusters in its local
 * counter, so the free cluster count has to exceed
 * percpu_counter_batch * nr_cpu_ids.  A window of 4 times that is used.
 */
#define EXT4_FREECLUSTERS_WATERMARK (4 * (percpu_counter_batch * nr_cpu_ids))
#endif
2848
2849/* Update i_disksize. Requires i_mutex to avoid races with truncate */
2850static inline void ext4_update_i_disksize(struct inode *inode, loff_t newsize)
2851{
2852        WARN_ON_ONCE(S_ISREG(inode->i_mode) &&
2853                     !inode_is_locked(inode));
2854        down_write(&EXT4_I(inode)->i_data_sem);
2855        if (newsize > EXT4_I(inode)->i_disksize)
2856                EXT4_I(inode)->i_disksize = newsize;
2857        up_write(&EXT4_I(inode)->i_data_sem);
2858}
2859
2860/* Update i_size, i_disksize. Requires i_mutex to avoid races with truncate */
2861static inline int ext4_update_inode_size(struct inode *inode, loff_t newsize)
2862{
2863        int changed = 0;
2864
2865        if (newsize > inode->i_size) {
2866                i_size_write(inode, newsize);
2867                changed = 1;
2868        }
2869        if (newsize > EXT4_I(inode)->i_disksize) {
2870                ext4_update_i_disksize(inode, newsize);
2871                changed |= 2;
2872        }
2873        return changed;
2874}
2875
2876int ext4_update_disksize_before_punch(struct inode *inode, loff_t offset,
2877                                      loff_t len);
2878
2879struct ext4_group_info {
2880        unsigned long   bb_state;
2881        struct rb_root  bb_free_root;
2882        ext4_grpblk_t   bb_first_free;  /* first free block */
2883        ext4_grpblk_t   bb_free;        /* total free blocks */
2884        ext4_grpblk_t   bb_fragments;   /* nr of freespace fragments */
2885        ext4_grpblk_t   bb_largest_free_order;/* order of largest frag in BG */
2886        struct          list_head bb_prealloc_list;
2887#ifdef DOUBLE_CHECK
2888        void            *bb_bitmap;
2889#endif
2890        struct rw_semaphore alloc_sem;
2891        ext4_grpblk_t   bb_counters[];  /* Nr of free power-of-two-block
2892                                         * regions, index is order.
2893                                         * bb_counters[3] = 5 means
2894                                         * 5 free 8-block regions. */
2895};
2896
/* Bit numbers within the bb_state word of a group info structure. */
#define EXT4_GROUP_INFO_NEED_INIT_BIT		0
#define EXT4_GROUP_INFO_WAS_TRIMMED_BIT		1
#define EXT4_GROUP_INFO_BBITMAP_CORRUPT_BIT	2
#define EXT4_GROUP_INFO_IBITMAP_CORRUPT_BIT	3

/* Tests of individual bb_state bits; grp is a pointer to the group info. */
#define EXT4_MB_GRP_NEED_INIT(grp) \
	(test_bit(EXT4_GROUP_INFO_NEED_INIT_BIT, &((grp)->bb_state)))
#define EXT4_MB_GRP_BBITMAP_CORRUPT(grp) \
	(test_bit(EXT4_GROUP_INFO_BBITMAP_CORRUPT_BIT, &((grp)->bb_state)))
#define EXT4_MB_GRP_IBITMAP_CORRUPT(grp) \
	(test_bit(EXT4_GROUP_INFO_IBITMAP_CORRUPT_BIT, &((grp)->bb_state)))

/* Test, set and clear the "was trimmed" bit. */
#define EXT4_MB_GRP_WAS_TRIMMED(grp) \
	(test_bit(EXT4_GROUP_INFO_WAS_TRIMMED_BIT, &((grp)->bb_state)))
#define EXT4_MB_GRP_SET_TRIMMED(grp) \
	(set_bit(EXT4_GROUP_INFO_WAS_TRIMMED_BIT, &((grp)->bb_state)))
#define EXT4_MB_GRP_CLEAR_TRIMMED(grp) \
	(clear_bit(EXT4_GROUP_INFO_WAS_TRIMMED_BIT, &((grp)->bb_state)))
2915
/* Ceiling for the s_lock_busy counter bumped in ext4_lock_group(). */
#define EXT4_MAX_CONTENTION		8
/* ext4_fs_is_busy() reports busy once s_lock_busy exceeds this. */
#define EXT4_CONTENTION_THRESHOLD	2
2918
2919static inline spinlock_t *ext4_group_lock_ptr(struct super_block *sb,
2920                                              ext4_group_t group)
2921{
2922        return bgl_lock_ptr(EXT4_SB(sb)->s_blockgroup_lock, group);
2923}
2924
2925/*
2926 * Returns true if the filesystem is busy enough that attempts to
2927 * access the block group locks has run into contention.
2928 */
2929static inline int ext4_fs_is_busy(struct ext4_sb_info *sbi)
2930{
2931        return (atomic_read(&sbi->s_lock_busy) > EXT4_CONTENTION_THRESHOLD);
2932}
2933
2934static inline void ext4_lock_group(struct super_block *sb, ext4_group_t group)
2935{
2936        spinlock_t *lock = ext4_group_lock_ptr(sb, group);
2937        if (spin_trylock(lock))
2938                /*
2939                 * We're able to grab the lock right away, so drop the
2940                 * lock contention counter.
2941                 */
2942                atomic_add_unless(&EXT4_SB(sb)->s_lock_busy, -1, 0);
2943        else {
2944                /*
2945                 * The lock is busy, so bump the contention counter,
2946                 * and then wait on the spin lock.
2947                 */
2948                atomic_add_unless(&EXT4_SB(sb)->s_lock_busy, 1,
2949                                  EXT4_MAX_CONTENTION);
2950                spin_lock(lock);
2951        }
2952}
2953
2954static inline void ext4_unlock_group(struct super_block *sb,
2955                                        ext4_group_t group)
2956{
2957        spin_unlock(ext4_group_lock_ptr(sb, group));
2958}
2959
/*
 * Block validity checking.
 *
 * Both macros call ext4_check_blockref() with the caller's function name
 * and line number.  The first passes the data of buffer head bh viewed as
 * __le32 entries, with EXT4_ADDR_PER_BLOCK entries for the inode's
 * superblock; the second passes the inode's i_data with EXT4_NDIR_BLOCKS
 * entries.
 */
#define ext4_check_indirect_blockref(inode, bh) \
	ext4_check_blockref(__func__, __LINE__, inode, \
			    (__le32 *)(bh)->b_data, \
			    EXT4_ADDR_PER_BLOCK((inode)->i_sb))

#define ext4_ind_check_inode(inode) \
	ext4_check_blockref(__func__, __LINE__, inode, \
			    EXT4_I(inode)->i_data, \
			    EXT4_NDIR_BLOCKS)
2972
2973/*
2974 * Inodes and files operations
2975 */
2976
2977/* dir.c */
2978extern const struct file_operations ext4_dir_operations;
2979
2980/* file.c */
2981extern const struct inode_operations ext4_file_inode_operations;
2982extern const struct file_operations ext4_file_operations;
2983extern loff_t ext4_llseek(struct file *file, loff_t offset, int origin);
2984
2985/* inline.c */
2986extern int ext4_get_max_inline_size(struct inode *inode);
2987extern int ext4_find_inline_data_nolock(struct inode *inode);
2988extern int ext4_init_inline_data(handle_t *handle, struct inode *inode,
2989                                 unsigned int len);
2990extern int ext4_destroy_inline_data(handle_t *handle, struct inode *inode);
2991
2992extern int ext4_readpage_inline(struct inode *inode, struct page *page);
2993extern int ext4_try_to_write_inline_data(struct address_space *mapping,
2994                                         struct inode *inode,
2995                                         loff_t pos, unsigned len,
2996                                         unsigned flags,
2997                                         struct page **pagep);
2998extern int ext4_write_inline_data_end(struct inode *inode,
2999                                      loff_t pos, unsigned len,
3000                                      unsigned copied,
3001                                      struct page *page);
3002extern struct buffer_head *
3003ext4_journalled_write_inline_data(struct inode *inode,
3004                                  unsigned len,
3005                                  struct page *page);
3006extern int ext4_da_write_inline_data_begin(struct address_space *mapping,
3007                                           struct inode *inode,
3008                                           loff_t pos, unsigned len,
3009                                           unsigned flags,
3010                                           struct page **pagep,
3011                                           void **fsdata);
3012extern int ext4_da_write_inline_data_end(struct inode *inode, loff_t pos,
3013                                         unsigned len, unsigned copied,
3014                                         struct page *page);
3015extern int ext4_try_add_inline_entry(handle_t *handle,
3016                                     struct ext4_filename *fname,
3017                                     struct inode *dir, struct inode *inode);
3018extern int ext4_try_create_inline_dir(handle_t *handle,
3019                                      struct inode *parent,
3020                                      struct inode *inode);
3021extern int ext4_read_inline_dir(struct file *filp,
3022                                struct dir_context *ctx,
3023                                int *has_inline_data);
3024extern int htree_inlinedir_to_tree(struct file *dir_file,
3025                                   struct inode *dir, ext4_lblk_t block,
3026                                   struct dx_hash_info *hinfo,
3027                                   __u32 start_hash, __u32 start_minor_hash,
3028                                   int *has_inline_data);
3029extern struct buffer_head *ext4_find_inline_entry(struct inode *dir,
3030                                        struct ext4_filename *fname,
3031                                        const struct qstr *d_name,
3032                                        struct ext4_dir_entry_2 **res_dir,
3033                                        int *has_inline_data);
3034extern int ext4_delete_inline_entry(handle_t *handle,
3035                                    struct inode *dir,
3036                                    struct ext4_dir_entry_2 *de_del,
3037                                    struct buffer_head *bh,
3038                                    int *has_inline_data);
3039extern bool empty_inline_dir(struct inode *dir, int *has_inline_data);
3040extern struct buffer_head *ext4_get_first_inline_block(struct inode *inode,
3041                                        struct ext4_dir_entry_2 **parent_de,
3042                                        int *retval);
3043extern int ext4_inline_data_fiemap(struct inode *inode,
3044                                   struct fiemap_extent_info *fieinfo,
3045                                   int *has_inline, __u64 start, __u64 len);
3046extern int ext4_try_to_evict_inline_data(handle_t *handle,
3047                                         struct inode *inode,
3048                                         int needed);
3049extern void ext4_inline_data_truncate(struct inode *inode, int *has_inline);
3050
3051extern int ext4_convert_inline_data(struct inode *inode);
3052
3053static inline int ext4_has_inline_data(struct inode *inode)
3054{
3055        return ext4_test_inode_flag(inode, EXT4_INODE_INLINE_DATA) &&
3056               EXT4_I(inode)->i_inline_off;
3057}
3058
3059/* namei.c */
3060extern const struct inode_operations ext4_dir_inode_operations;
3061extern const struct inode_operations ext4_special_inode_operations;
3062extern struct dentry *ext4_get_parent(struct dentry *child);
3063extern struct ext4_dir_entry_2 *ext4_init_dot_dotdot(struct inode *inode,
3064                                 struct ext4_dir_entry_2 *de,
3065                                 int blocksize, int csum_size,
3066                                 unsigned int parent_ino, int dotdot_real_len);
3067extern void initialize_dirent_tail(struct ext4_dir_entry_tail *t,
3068                                   unsigned int blocksize);
3069extern int ext4_handle_dirty_dirent_node(handle_t *handle,
3070                                         struct inode *inode,
3071                                         struct buffer_head *bh);
3072#define S_SHIFT 12
3073static unsigned char ext4_type_by_mode[S_IFMT >> S_SHIFT] = {
3074        [S_IFREG >> S_SHIFT]    = EXT4_FT_REG_FILE,
3075        [S_IFDIR >> S_SHIFT]    = EXT4_FT_DIR,
3076        [S_IFCHR >> S_SHIFT]    = EXT4_FT_CHRDEV,
3077        [S_IFBLK >> S_SHIFT]    = EXT4_FT_BLKDEV,
3078        [S_IFIFO >> S_SHIFT]    = EXT4_FT_FIFO,
3079        [S_IFSOCK >> S_SHIFT]   = EXT4_FT_SOCK,
3080        [S_IFLNK >> S_SHIFT]    = EXT4_FT_SYMLINK,
3081};
3082
3083static inline void ext4_set_de_type(struct super_block *sb,
3084                                struct ext4_dir_entry_2 *de,
3085                                umode_t mode) {
3086        if (ext4_has_feature_filetype(sb))
3087                de->file_type = ext4_type_by_mode[(mode & S_IFMT)>>S_SHIFT];
3088}
3089
3090/* readpages.c */
3091extern int ext4_mpage_readpages(struct address_space *mapping,
3092                                struct list_head *pages, struct page *page,
3093                                unsigned nr_pages);
3094
3095/* symlink.c */
3096extern const struct inode_operations ext4_encrypted_symlink_inode_operations;
3097extern const struct inode_operations ext4_symlink_inode_operations;
3098extern const struct inode_operations ext4_fast_symlink_inode_operations;
3099
3100/* sysfs.c */
3101extern int ext4_register_sysfs(struct super_block *sb);
3102extern void ext4_unregister_sysfs(struct super_block *sb);
3103extern int __init ext4_init_sysfs(void);
3104extern void ext4_exit_sysfs(void);
3105
3106/* block_validity */
3107extern void ext4_release_system_zone(struct super_block *sb);
3108extern int ext4_setup_system_zone(struct super_block *sb);
3109extern int __init ext4_init_system_zone(void);
3110extern void ext4_exit_system_zone(void);
3111extern int ext4_data_block_valid(struct ext4_sb_info *sbi,
3112                                 ext4_fsblk_t start_blk,
3113                                 unsigned int count);
3114extern int ext4_check_blockref(const char *, unsigned int,
3115                               struct inode *, __le32 *, unsigned int);
3116
/* extents.c */
struct ext4_ext_path;
struct ext4_extent;

/*
 * Upper bound on the number of logical blocks in a file.  It follows
 * from ee_block in ext4_extent being an __le32.
 */
#define EXT_MAX_BLOCKS	0xffffffff
3126
3127extern int ext4_ext_tree_init(handle_t *handle, struct inode *);
3128extern int ext4_ext_writepage_trans_blocks(struct inode *, int);
3129extern int ext4_ext_index_trans_blocks(struct inode *inode, int extents);
3130extern int ext4_ext_map_blocks(handle_t *handle, struct inode *inode,
3131                               struct ext4_map_blocks *map, int flags);
3132extern void ext4_ext_truncate(handle_t *, struct inode *);
3133extern int ext4_ext_remove_space(struct inode *inode, ext4_lblk_t start,
3134                                 ext4_lblk_t end);
3135extern void ext4_ext_init(struct super_block *);
3136extern void ext4_ext_release(struct super_block *);
3137extern long ext4_fallocate(struct file *file, int mode, loff_t offset,
3138                          loff_t len);
3139extern int ext4_convert_unwritten_extents(handle_t *handle, struct inode *inode,
3140                                          loff_t offset, ssize_t len);
3141extern int ext4_map_blocks(handle_t *handle, struct inode *inode,
3142                           struct ext4_map_blocks *map, int flags);
3143extern int ext4_ext_calc_metadata_amount(struct inode *inode,
3144                                         ext4_lblk_t lblocks);
3145extern int ext4_ext_calc_credits_for_single_extent(struct inode *inode,
3146                                                   int num,
3147                                                   struct ext4_ext_path *path);
3148extern int ext4_can_extents_be_merged(struct inode *inode,
3149                                      struct ext4_extent *ex1,
3150                                      struct ext4_extent *ex2);
3151extern int ext4_ext_insert_extent(handle_t *, struct inode *,
3152                                  struct ext4_ext_path **,
3153                                  struct ext4_extent *, int);
3154extern struct ext4_ext_path *ext4_find_extent(struct inode *, ext4_lblk_t,
3155                                              struct ext4_ext_path **,
3156                                              int flags);
3157extern void ext4_ext_drop_refs(struct ext4_ext_path *);
3158extern int ext4_ext_check_inode(struct inode *inode);
3159extern int ext4_find_delalloc_range(struct inode *inode,
3160                                    ext4_lblk_t lblk_start,
3161                                    ext4_lblk_t lblk_end);
3162extern int ext4_find_delalloc_cluster(struct inode *inode, ext4_lblk_t lblk);
3163extern ext4_lblk_t ext4_ext_next_allocated_block(struct ext4_ext_path *path);
3164extern int ext4_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
3165                        __u64 start, __u64 len);
3166extern int ext4_ext_precache(struct inode *inode);
3167extern int ext4_collapse_range(struct inode *inode, loff_t offset, loff_t len);
3168extern int ext4_insert_range(struct inode *inode, loff_t offset, loff_t len);
3169extern int ext4_swap_extents(handle_t *handle, struct inode *inode1,
3170                                struct inode *inode2, ext4_lblk_t lblk1,
3171                             ext4_lblk_t lblk2,  ext4_lblk_t count,
3172                             int mark_unwritten,int *err);
3173
3174/* move_extent.c */
3175extern void ext4_double_down_write_data_sem(struct inode *first,
3176                                            struct inode *second);
3177extern void ext4_double_up_write_data_sem(struct inode *orig_inode,
3178                                          struct inode *donor_inode);
3179extern int ext4_move_extents(struct file *o_filp, struct file *d_filp,
3180                             __u64 start_orig, __u64 start_donor,
3181                             __u64 len, __u64 *moved_len);
3182
3183/* page-io.c */
3184extern int __init ext4_init_pageio(void);
3185extern void ext4_exit_pageio(void);
3186extern ext4_io_end_t *ext4_init_io_end(struct inode *inode, gfp_t flags);
3187extern ext4_io_end_t *ext4_get_io_end(ext4_io_end_t *io_end);
3188extern int ext4_put_io_end(ext4_io_end_t *io_end);
3189extern void ext4_put_io_end_defer(ext4_io_end_t *io_end);
3190extern void ext4_io_submit_init(struct ext4_io_submit *io,
3191                                struct writeback_control *wbc);
3192extern void ext4_end_io_rsv_work(struct work_struct *work);
3193extern void ext4_io_submit(struct ext4_io_submit *io);
3194extern int ext4_bio_write_page(struct ext4_io_submit *io,
3195                               struct page *page,
3196                               int len,
3197                               struct writeback_control *wbc,
3198                               bool keep_towrite);
3199
3200/* mmp.c */
3201extern int ext4_multi_mount_protect(struct super_block *, ext4_fsblk_t);
3202
/*
 * Extra buffer state bit used to tell whether a block or inode bitmap has
 * been properly initialized.  With uninit_bg, reading the block from disk
 * is not enough to call the bitmap uptodate; it must also be zeroed out.
 */
#define BH_BITMAP_UPTODATE	BH_JBDPrivateStart
3209
3210static inline int bitmap_uptodate(struct buffer_head *bh)
3211{
3212        return (buffer_uptodate(bh) &&
3213                        test_bit(BH_BITMAP_UPTODATE, &(bh)->b_state));
3214}
3215static inline void set_bitmap_uptodate(struct buffer_head *bh)
3216{
3217        set_bit(BH_BITMAP_UPTODATE, &(bh)->b_state);
3218}
3219
3220/*
3221 * Disable DIO read nolock optimization, so new dioreaders will be forced
3222 * to grab i_mutex
3223 */
3224static inline void ext4_inode_block_unlocked_dio(struct inode *inode)
3225{
3226        ext4_set_inode_state(inode, EXT4_STATE_DIOREAD_LOCK);
3227        smp_mb();
3228}
3229static inline void ext4_inode_resume_unlocked_dio(struct inode *inode)
3230{
3231        smp_mb();
3232        ext4_clear_inode_state(inode, EXT4_STATE_DIOREAD_LOCK);
3233}
3234
/* True when b lies in the closed interval [first, first + len - 1]. */
#define in_range(b, first, len) \
	((first) <= (b) && (b) <= (first) + (len) - 1)
3236
3237/* For ioend & aio unwritten conversion wait queues */
3238#define EXT4_WQ_HASH_SZ         37
3239#define ext4_ioend_wq(v)   (&ext4__ioend_wq[((unsigned long)(v)) %\
3240                                            EXT4_WQ_HASH_SZ])
3241extern wait_queue_head_t ext4__ioend_wq[EXT4_WQ_HASH_SZ];
3242
/* Resize begin/end pair and the EXT4_RESIZING constant. */
#define EXT4_RESIZING	0
int ext4_resize_begin(struct super_block *sb);
void ext4_resize_end(struct super_block *sb);
3246
3247static inline void ext4_set_io_unwritten_flag(struct inode *inode,
3248                                              struct ext4_io_end *io_end)
3249{
3250        if (!(io_end->flag & EXT4_IO_END_UNWRITTEN)) {
3251                io_end->flag |= EXT4_IO_END_UNWRITTEN;
3252                atomic_inc(&EXT4_I(inode)->i_unwritten);
3253        }
3254}
3255
3256static inline void ext4_clear_io_unwritten_flag(ext4_io_end_t *io_end)
3257{
3258        struct inode *inode = io_end->inode;
3259
3260        if (io_end->flag & EXT4_IO_END_UNWRITTEN) {
3261                io_end->flag &= ~EXT4_IO_END_UNWRITTEN;
3262                /* Wake up anyone waiting on unwritten extent conversion */
3263                if (atomic_dec_and_test(&EXT4_I(inode)->i_unwritten))
3264                        wake_up_all(ext4_ioend_wq(inode));
3265        }
3266}
3267
3268static inline bool ext4_aligned_io(struct inode *inode, loff_t off, loff_t len)
3269{
3270        int blksize = 1 << inode->i_blkbits;
3271
3272        return IS_ALIGNED(off, blksize) && IS_ALIGNED(len, blksize);
3273}
3274
3275#endif  /* __KERNEL__ */
3276
/* Bad CRC detected */
#define EFSBADCRC	EBADMSG
/* Filesystem is corrupted */
#define EFSCORRUPTED	EUCLEAN
3279
3280#endif  /* _EXT4_H */
3281