2018-06-06 02:42:14 +00:00
|
|
|
// SPDX-License-Identifier: GPL-2.0
|
2005-04-16 22:20:36 +00:00
|
|
|
/*
|
2005-11-02 03:58:39 +00:00
|
|
|
* Copyright (c) 2000-2005 Silicon Graphics, Inc.
|
|
|
|
* All Rights Reserved.
|
2005-04-16 22:20:36 +00:00
|
|
|
*/
|
|
|
|
#ifndef __XFS_MOUNT_H__
|
|
|
|
#define __XFS_MOUNT_H__
|
|
|
|
|
2012-06-14 14:22:15 +00:00
|
|
|
struct xlog;
|
2005-04-16 22:20:36 +00:00
|
|
|
struct xfs_inode;
|
2007-07-11 01:09:12 +00:00
|
|
|
struct xfs_mru_cache;
|
2008-10-30 06:38:26 +00:00
|
|
|
struct xfs_ail;
|
2009-06-08 13:33:32 +00:00
|
|
|
struct xfs_quotainfo;
|
2014-06-06 05:01:58 +00:00
|
|
|
struct xfs_da_geometry;
|
2021-06-02 00:48:24 +00:00
|
|
|
struct xfs_perag;
|
2009-06-08 13:33:32 +00:00
|
|
|
|
2011-01-04 00:35:03 +00:00
|
|
|
/* dynamic preallocation free space thresholds, 5% down to 1% */
|
|
|
|
enum {
|
|
|
|
XFS_LOWSP_1_PCNT = 0,
|
|
|
|
XFS_LOWSP_2_PCNT,
|
|
|
|
XFS_LOWSP_3_PCNT,
|
|
|
|
XFS_LOWSP_4_PCNT,
|
|
|
|
XFS_LOWSP_5_PCNT,
|
|
|
|
XFS_LOWSP_MAX,
|
|
|
|
};
|
|
|
|
|
2016-05-18 00:58:51 +00:00
|
|
|
/*
|
|
|
|
* Error Configuration
|
|
|
|
*
|
|
|
|
* Error classes define the subsystem the configuration belongs to.
|
|
|
|
* Error numbers define the errors that are configurable.
|
|
|
|
*/
|
|
|
|
enum {
|
2016-05-18 01:01:00 +00:00
|
|
|
XFS_ERR_METADATA,
|
2016-05-18 00:58:51 +00:00
|
|
|
XFS_ERR_CLASS_MAX,
|
|
|
|
};
|
|
|
|
enum {
|
2016-05-18 01:01:00 +00:00
|
|
|
XFS_ERR_DEFAULT,
|
2016-05-18 01:09:28 +00:00
|
|
|
XFS_ERR_EIO,
|
|
|
|
XFS_ERR_ENOSPC,
|
|
|
|
XFS_ERR_ENODEV,
|
2016-05-18 00:58:51 +00:00
|
|
|
XFS_ERR_ERRNO_MAX,
|
|
|
|
};
|
|
|
|
|
2016-05-18 01:08:15 +00:00
|
|
|
#define XFS_ERR_RETRY_FOREVER -1
|
|
|
|
|
2016-09-13 21:51:30 +00:00
|
|
|
/*
|
|
|
|
* Although retry_timeout is in jiffies which is normally an unsigned long,
|
|
|
|
* we limit the retry timeout to 86400 seconds, or one day. So even a
|
|
|
|
* signed 32-bit long is sufficient for a HZ value up to 24855. Making it
|
|
|
|
* signed lets us store the special "-1" value, meaning retry forever.
|
|
|
|
*/
|
2016-05-18 00:58:51 +00:00
|
|
|
struct xfs_error_cfg {
|
|
|
|
struct xfs_kobj kobj;
|
|
|
|
int max_retries;
|
2016-09-13 21:51:30 +00:00
|
|
|
long retry_timeout; /* in jiffies, -1 = infinite */
|
2016-05-18 00:58:51 +00:00
|
|
|
};
|
|
|
|
|
2021-08-06 18:05:39 +00:00
|
|
|
/*
|
|
|
|
* Per-cpu deferred inode inactivation GC lists.
|
|
|
|
*/
|
|
|
|
struct xfs_inodegc {
|
2023-09-11 15:39:03 +00:00
|
|
|
struct xfs_mount *mp;
|
2021-08-06 18:05:39 +00:00
|
|
|
struct llist_head list;
|
2022-06-16 14:44:31 +00:00
|
|
|
struct delayed_work work;
|
2023-06-05 04:48:15 +00:00
|
|
|
int error;
|
2021-08-06 18:05:39 +00:00
|
|
|
|
|
|
|
/* approximate count of inodes in the list */
|
|
|
|
unsigned int items;
|
2021-08-06 18:05:43 +00:00
|
|
|
unsigned int shrinker_hits;
|
2023-05-01 23:16:12 +00:00
|
|
|
unsigned int cpu;
|
2021-08-06 18:05:39 +00:00
|
|
|
};
|
|
|
|
|
2020-05-20 20:17:11 +00:00
|
|
|
/*
|
|
|
|
* The struct xfs_mount layout is optimised to separate read-mostly variables
|
|
|
|
* from variables that are frequently modified. We put the read-mostly variables
|
|
|
|
* first, then place all the other variables at the end.
|
|
|
|
*
|
|
|
|
* Typically, read-mostly variables are those that are set at mount time and
|
|
|
|
* never changed again, or only change rarely as a result of things like sysfs
|
|
|
|
* knobs being tweaked.
|
|
|
|
*/
|
2005-04-16 22:20:36 +00:00
|
|
|
typedef struct xfs_mount {
|
2020-05-20 20:17:11 +00:00
|
|
|
struct xfs_sb m_sb; /* copy of fs superblock */
|
2007-08-30 07:21:30 +00:00
|
|
|
struct super_block *m_super;
|
2008-10-30 06:38:26 +00:00
|
|
|
struct xfs_ail *m_ail; /* fs active log item list */
|
2005-04-16 22:20:36 +00:00
|
|
|
struct xfs_buf *m_sb_bp; /* buffer for superblock */
|
2005-11-02 00:44:33 +00:00
|
|
|
char *m_rtname; /* realtime device name */
|
|
|
|
char *m_logname; /* external log device name */
|
2014-06-06 05:01:58 +00:00
|
|
|
struct xfs_da_geometry *m_dir_geo; /* directory block geometry */
|
|
|
|
struct xfs_da_geometry *m_attr_geo; /* attribute block geometry */
|
2012-06-14 14:22:15 +00:00
|
|
|
struct xlog *m_log; /* log specific stuff */
|
2005-04-16 22:20:36 +00:00
|
|
|
struct xfs_inode *m_rbmip; /* pointer to bitmap inode */
|
|
|
|
struct xfs_inode *m_rsumip; /* pointer to summary inode */
|
|
|
|
struct xfs_inode *m_rootip; /* pointer to root directory */
|
|
|
|
struct xfs_quotainfo *m_quotainfo; /* disk quota information */
|
2024-02-22 20:42:44 +00:00
|
|
|
struct xfs_buftarg *m_ddev_targp; /* data device */
|
|
|
|
struct xfs_buftarg *m_logdev_targp;/* log device */
|
|
|
|
struct xfs_buftarg *m_rtdev_targp; /* rt device */
|
2021-08-06 18:05:39 +00:00
|
|
|
void __percpu *m_inodegc; /* percpu inodegc structures */
|
|
|
|
|
2020-05-20 20:17:11 +00:00
|
|
|
/*
|
|
|
|
* Optional cache of rt summary level per bitmap block with the
|
2023-10-16 17:41:55 +00:00
|
|
|
* invariant that m_rsum_cache[bbno] > the maximum i for which
|
|
|
|
* rsum[i][bbno] != 0, or 0 if rsum[i][bbno] == 0 for all i.
|
|
|
|
* Reads and writes are serialized by the rsumip inode lock.
|
2020-05-20 20:17:11 +00:00
|
|
|
*/
|
|
|
|
uint8_t *m_rsum_cache;
|
|
|
|
struct xfs_mru_cache *m_filestream; /* per-mount filestream data */
|
|
|
|
struct workqueue_struct *m_buf_workqueue;
|
|
|
|
struct workqueue_struct *m_unwritten_workqueue;
|
|
|
|
struct workqueue_struct *m_reclaim_workqueue;
|
|
|
|
struct workqueue_struct *m_sync_workqueue;
|
2021-08-06 18:05:39 +00:00
|
|
|
struct workqueue_struct *m_blockgc_wq;
|
|
|
|
struct workqueue_struct *m_inodegc_wq;
|
2020-05-20 20:17:11 +00:00
|
|
|
|
|
|
|
int m_bsize; /* fs logical block size */
|
2017-06-16 18:00:05 +00:00
|
|
|
uint8_t m_blkbit_log; /* blocklog + NBBY */
|
|
|
|
uint8_t m_blkbb_log; /* blocklog - BBSHIFT */
|
|
|
|
uint8_t m_agno_log; /* log #ag's */
|
2020-05-20 20:17:11 +00:00
|
|
|
uint8_t m_sectbb_log; /* sectlog - BBSHIFT */
|
2023-10-16 16:40:11 +00:00
|
|
|
int8_t m_rtxblklog; /* log2 of rextsize, if possible */
|
2005-04-16 22:20:36 +00:00
|
|
|
uint m_blockmask; /* sb_blocksize-1 */
|
|
|
|
uint m_blockwsize; /* sb_blocksize in words */
|
|
|
|
uint m_blockwmask; /* blockwsize-1 */
|
2008-10-30 06:11:19 +00:00
|
|
|
uint m_alloc_mxr[2]; /* max alloc btree records */
|
|
|
|
uint m_alloc_mnr[2]; /* min alloc btree records */
|
|
|
|
uint m_bmap_dmxr[2]; /* max bmap btree records */
|
|
|
|
uint m_bmap_dmnr[2]; /* min bmap btree records */
|
2016-08-03 01:36:07 +00:00
|
|
|
uint m_rmap_mxr[2]; /* max rmap btree records */
|
|
|
|
uint m_rmap_mnr[2]; /* min rmap btree records */
|
2016-10-03 16:11:18 +00:00
|
|
|
uint m_refc_mxr[2]; /* max refc btree records */
|
|
|
|
uint m_refc_mnr[2]; /* min refc btree records */
|
2021-10-13 17:02:19 +00:00
|
|
|
uint m_alloc_maxlevels; /* max alloc btree levels */
|
|
|
|
uint m_bm_maxlevels[2]; /* max bmap btree levels */
|
2016-08-03 01:36:07 +00:00
|
|
|
uint m_rmap_maxlevels; /* max rmap btree levels */
|
2016-10-03 16:11:18 +00:00
|
|
|
uint m_refc_maxlevels; /* max refcount btree level */
|
2021-09-16 19:27:34 +00:00
|
|
|
unsigned int m_agbtree_maxlevels; /* max level of all AG btrees */
|
2016-08-03 01:31:47 +00:00
|
|
|
xfs_extlen_t m_ag_prealloc_blocks; /* reserved ag blocks */
|
2016-08-03 01:38:24 +00:00
|
|
|
uint m_alloc_set_aside; /* space we can't use */
|
|
|
|
uint m_ag_max_usable; /* max space per AG */
|
2020-05-20 20:17:11 +00:00
|
|
|
int m_dalign; /* stripe unit */
|
|
|
|
int m_swidth; /* stripe width */
|
|
|
|
xfs_agnumber_t m_maxagi; /* highest inode alloc group */
|
|
|
|
uint m_allocsize_log;/* min write size log bytes */
|
|
|
|
uint m_allocsize_blocks; /* min write size blocks */
|
|
|
|
int m_logbufs; /* number of log buffers */
|
|
|
|
int m_logbsize; /* size of each log buffer */
|
|
|
|
uint m_rsumlevels; /* rt summary levels */
|
2024-08-30 22:37:15 +00:00
|
|
|
xfs_filblks_t m_rsumblocks; /* size of rt summary, FSBs */
|
2005-04-16 22:20:36 +00:00
|
|
|
int m_fixedfsid[2]; /* unchanged for life of FS */
|
|
|
|
uint m_qflags; /* quota status flags */
|
2021-08-19 01:46:26 +00:00
|
|
|
uint64_t m_features; /* active filesystem features */
|
2021-08-06 18:05:41 +00:00
|
|
|
uint64_t m_low_space[XFS_LOWSP_MAX];
|
|
|
|
uint64_t m_low_rtexts[XFS_LOWSP_MAX];
|
2023-10-16 16:40:11 +00:00
|
|
|
uint64_t m_rtxblkmask; /* rt extent block mask */
|
2020-05-20 20:17:11 +00:00
|
|
|
struct xfs_ino_geometry m_ino_geo; /* inode geometry */
|
2013-08-12 10:49:56 +00:00
|
|
|
struct xfs_trans_resv m_resv; /* precomputed res values */
|
2020-05-20 20:17:11 +00:00
|
|
|
/* low free space thresholds */
|
2021-08-06 18:05:39 +00:00
|
|
|
unsigned long m_opstate; /* dynamic state flags */
|
2020-05-20 20:17:11 +00:00
|
|
|
bool m_always_cow;
|
|
|
|
bool m_fail_unmount;
|
|
|
|
bool m_finobt_nores; /* no per-AG finobt resv. */
|
|
|
|
bool m_update_sb; /* sb needs update in mount */
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Bitsets of per-fs metadata that have been checked and/or are sick.
|
|
|
|
* Callers must hold m_sb_lock to access these two fields.
|
|
|
|
*/
|
|
|
|
uint8_t m_fs_checked;
|
|
|
|
uint8_t m_fs_sick;
|
|
|
|
/*
|
|
|
|
* Bitsets of rt metadata that have been checked and/or are sick.
|
|
|
|
* Callers must hold m_sb_lock to access these two fields.
|
|
|
|
*/
|
|
|
|
uint8_t m_rt_checked;
|
|
|
|
uint8_t m_rt_sick;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* End of read-mostly variables. Frequently written variables and locks
|
|
|
|
* should be placed below this comment from now on. The first variable
|
|
|
|
* here is marked as cacheline aligned so that it is separated from
|
|
|
|
* the read-mostly variables.
|
|
|
|
*/
|
|
|
|
|
|
|
|
spinlock_t ____cacheline_aligned m_sb_lock; /* sb counter lock */
|
|
|
|
struct percpu_counter m_icount; /* allocated inodes counter */
|
|
|
|
struct percpu_counter m_ifree; /* free inodes counter */
|
|
|
|
struct percpu_counter m_fdblocks; /* free block counter */
|
2022-04-11 20:49:42 +00:00
|
|
|
struct percpu_counter m_frextents; /* free rt extent counter */
|
|
|
|
|
2020-05-20 20:17:11 +00:00
|
|
|
/*
|
|
|
|
* Count of data device blocks reserved for delayed allocations,
|
|
|
|
* including indlen blocks. Does not include allocated CoW staging
|
|
|
|
* extents or anything related to the rt device.
|
|
|
|
*/
|
|
|
|
struct percpu_counter m_delalloc_blks;
|
2024-04-22 11:20:15 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* RT version of the above.
|
|
|
|
*/
|
|
|
|
struct percpu_counter m_delalloc_rtextents;
|
|
|
|
|
2021-04-28 22:05:50 +00:00
|
|
|
/*
|
|
|
|
* Global count of allocation btree blocks in use across all AGs. Only
|
|
|
|
* used when perag reservation is enabled. Helps prevent block
|
|
|
|
* reservation from attempting to reserve allocation btree blocks.
|
|
|
|
*/
|
|
|
|
atomic64_t m_allocbt_blks;
|
2020-05-20 20:17:11 +00:00
|
|
|
|
2024-08-29 04:08:40 +00:00
|
|
|
struct xarray m_perags; /* per-ag accounting info */
|
2017-06-16 18:00:05 +00:00
|
|
|
uint64_t m_resblks; /* total reserved blocks */
|
|
|
|
uint64_t m_resblks_avail;/* available reserved blocks */
|
|
|
|
uint64_t m_resblks_save; /* reserved blks @ remount,ro */
|
2011-04-08 02:45:07 +00:00
|
|
|
struct delayed_work m_reclaim_work; /* background inode reclaim */
|
2023-08-10 14:48:07 +00:00
|
|
|
struct dentry *m_debugfs; /* debugfs parent */
|
2014-07-14 22:07:01 +00:00
|
|
|
struct xfs_kobj m_kobj;
|
2016-05-18 00:58:51 +00:00
|
|
|
struct xfs_kobj m_error_kobj;
|
2016-05-18 01:01:00 +00:00
|
|
|
struct xfs_kobj m_error_meta_kobj;
|
2016-05-18 00:58:51 +00:00
|
|
|
struct xfs_error_cfg m_error_cfg[XFS_ERR_CLASS_MAX][XFS_ERR_ERRNO_MAX];
|
2015-10-12 07:21:19 +00:00
|
|
|
struct xstats m_stats; /* per-fs stats */
|
2023-08-10 14:48:07 +00:00
|
|
|
#ifdef CONFIG_XFS_ONLINE_SCRUB_STATS
|
|
|
|
struct xchk_stats *m_scrub_stats;
|
|
|
|
#endif
|
2020-05-20 20:17:11 +00:00
|
|
|
xfs_agnumber_t m_agfrotor; /* last ag where space found */
|
2023-02-12 22:14:52 +00:00
|
|
|
atomic_t m_agirotor; /* last ag dir inode alloced */
|
2012-02-29 09:53:48 +00:00
|
|
|
|
2021-08-06 18:05:43 +00:00
|
|
|
/* Memory shrinker to throttle and reprioritize inodegc */
|
2023-09-11 09:44:34 +00:00
|
|
|
struct shrinker *m_inodegc_shrinker;
|
2020-04-12 20:11:10 +00:00
|
|
|
/*
|
|
|
|
* Workqueue item so that we can coalesce multiple inode flush attempts
|
|
|
|
* into a single flush.
|
|
|
|
*/
|
|
|
|
struct work_struct m_flush_inodes_work;
|
2015-02-16 00:49:23 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Generation of the filesystem layout. This is incremented by each
|
|
|
|
* growfs, and used by the pNFS server to ensure the client updates
|
|
|
|
* its view of the block device once it gets a layout that might
|
|
|
|
* reference the newly added blocks. Does not need to be persistent
|
|
|
|
* as long as we only allow file system size increments, but if we
|
|
|
|
* ever support shrinks it would have to be persisted in addition
|
|
|
|
* to various other kinds of pain inflicted on the pNFS server.
|
|
|
|
*/
|
2017-06-16 18:00:05 +00:00
|
|
|
uint32_t m_generation;
|
2020-05-20 20:17:11 +00:00
|
|
|
struct mutex m_growlock; /* growfs mutex */
|
2016-03-15 00:42:44 +00:00
|
|
|
|
|
|
|
#ifdef DEBUG
|
2017-06-21 00:54:46 +00:00
|
|
|
/*
|
|
|
|
* Frequency with which errors are injected. Replaces xfs_etest; the
|
|
|
|
* value stored in here is the inverse of the frequency with which the
|
|
|
|
* error triggers. 1 = always, 2 = half the time, etc.
|
|
|
|
*/
|
|
|
|
unsigned int *m_errortag;
|
2017-06-21 00:54:47 +00:00
|
|
|
struct xfs_kobj m_errortag_kobj;
|
2016-03-15 00:42:44 +00:00
|
|
|
#endif
|
2023-09-11 15:39:03 +00:00
|
|
|
|
|
|
|
/* cpus that have inodes queued for inactivation */
|
|
|
|
struct cpumask m_inodegc_cpumask;
|
2024-02-22 20:30:59 +00:00
|
|
|
|
|
|
|
/* Hook to feed dirent updates to an active online repair. */
|
|
|
|
struct xfs_hooks m_dir_update_hooks;
|
2005-04-16 22:20:36 +00:00
|
|
|
} xfs_mount_t;
|
|
|
|
|
2019-06-05 18:19:34 +00:00
|
|
|
#define M_IGEO(mp) (&(mp)->m_ino_geo)
|
|
|
|
|
2021-08-19 01:46:26 +00:00
|
|
|
/*
|
|
|
|
* Flags for m_features.
|
|
|
|
*
|
|
|
|
* These are all the active features in the filesystem, regardless of how
|
|
|
|
* they are configured.
|
|
|
|
*/
|
|
|
|
#define XFS_FEAT_ATTR (1ULL << 0) /* xattrs present in fs */
|
|
|
|
#define XFS_FEAT_NLINK (1ULL << 1) /* 32 bit link counts */
|
|
|
|
#define XFS_FEAT_QUOTA (1ULL << 2) /* quota active */
|
|
|
|
#define XFS_FEAT_ALIGN (1ULL << 3) /* inode alignment */
|
|
|
|
#define XFS_FEAT_DALIGN (1ULL << 4) /* data alignment */
|
|
|
|
#define XFS_FEAT_LOGV2 (1ULL << 5) /* version 2 logs */
|
|
|
|
#define XFS_FEAT_SECTOR (1ULL << 6) /* sector size > 512 bytes */
|
|
|
|
#define XFS_FEAT_EXTFLG (1ULL << 7) /* unwritten extents */
|
|
|
|
#define XFS_FEAT_ASCIICI (1ULL << 8) /* ASCII only case-insens. */
|
|
|
|
#define XFS_FEAT_LAZYSBCOUNT (1ULL << 9) /* Superblk counters */
|
|
|
|
#define XFS_FEAT_ATTR2 (1ULL << 10) /* dynamic attr fork */
|
|
|
|
#define XFS_FEAT_PARENT (1ULL << 11) /* parent pointers */
|
|
|
|
#define XFS_FEAT_PROJID32 (1ULL << 12) /* 32 bit project id */
|
|
|
|
#define XFS_FEAT_CRC (1ULL << 13) /* metadata CRCs */
|
|
|
|
#define XFS_FEAT_V3INODES (1ULL << 14) /* Version 3 inodes */
|
|
|
|
#define XFS_FEAT_PQUOTINO (1ULL << 15) /* non-shared proj/grp quotas */
|
|
|
|
#define XFS_FEAT_FTYPE (1ULL << 16) /* inode type in dir */
|
|
|
|
#define XFS_FEAT_FINOBT (1ULL << 17) /* free inode btree */
|
|
|
|
#define XFS_FEAT_RMAPBT (1ULL << 18) /* reverse map btree */
|
|
|
|
#define XFS_FEAT_REFLINK (1ULL << 19) /* reflinked files */
|
|
|
|
#define XFS_FEAT_SPINODES (1ULL << 20) /* sparse inode chunks */
|
|
|
|
#define XFS_FEAT_META_UUID (1ULL << 21) /* metadata UUID */
|
|
|
|
#define XFS_FEAT_REALTIME (1ULL << 22) /* realtime device present */
|
|
|
|
#define XFS_FEAT_INOBTCNT (1ULL << 23) /* inobt block counts */
|
|
|
|
#define XFS_FEAT_BIGTIME (1ULL << 24) /* large timestamps */
|
|
|
|
#define XFS_FEAT_NEEDSREPAIR (1ULL << 25) /* needs xfs_repair */
|
2021-11-16 08:39:32 +00:00
|
|
|
#define XFS_FEAT_NREXT64 (1ULL << 26) /* large extent counters */
|
2024-04-15 21:54:15 +00:00
|
|
|
#define XFS_FEAT_EXCHANGE_RANGE (1ULL << 27) /* exchange range */
|
2021-08-19 01:46:26 +00:00
|
|
|
|
2021-08-19 01:46:51 +00:00
|
|
|
/* Mount features */
|
|
|
|
#define XFS_FEAT_NOATTR2 (1ULL << 48) /* disable attr2 creation */
|
|
|
|
#define XFS_FEAT_NOALIGN (1ULL << 49) /* ignore alignment */
|
|
|
|
#define XFS_FEAT_ALLOCSIZE (1ULL << 50) /* user specified allocation size */
|
|
|
|
#define XFS_FEAT_LARGE_IOSIZE (1ULL << 51) /* report large preferred
|
|
|
|
* I/O size in stat() */
|
|
|
|
#define XFS_FEAT_WSYNC (1ULL << 52) /* synchronous metadata ops */
|
|
|
|
#define XFS_FEAT_DIRSYNC (1ULL << 53) /* synchronous directory ops */
|
|
|
|
#define XFS_FEAT_DISCARD (1ULL << 54) /* discard unused blocks */
|
|
|
|
#define XFS_FEAT_GRPID (1ULL << 55) /* group-ID assigned from directory */
|
|
|
|
#define XFS_FEAT_SMALL_INUMS (1ULL << 56) /* user wants 32bit inodes */
|
|
|
|
#define XFS_FEAT_IKEEP (1ULL << 57) /* keep empty inode clusters*/
|
|
|
|
#define XFS_FEAT_SWALLOC (1ULL << 58) /* stripe width allocation */
|
|
|
|
#define XFS_FEAT_FILESTREAMS (1ULL << 59) /* use filestreams allocator */
|
|
|
|
#define XFS_FEAT_DAX_ALWAYS (1ULL << 60) /* DAX always enabled */
|
|
|
|
#define XFS_FEAT_DAX_NEVER (1ULL << 61) /* DAX never enabled */
|
|
|
|
#define XFS_FEAT_NORECOVERY (1ULL << 62) /* no recovery - dirty fs */
|
|
|
|
#define XFS_FEAT_NOUUID (1ULL << 63) /* ignore uuid during mount */
|
|
|
|
|
2021-08-19 01:46:26 +00:00
|
|
|
/*
 * Generate a static inline predicate xfs_has_<name>(mp) that reports whether
 * the XFS_FEAT_<NAME> bit is set in mp->m_features.  The masked 64-bit value
 * is converted to bool on return, so any set bit yields true.
 */
#define __XFS_HAS_FEAT(name, NAME) \
|
|
|
|
static inline bool xfs_has_ ## name (struct xfs_mount *mp) \
|
|
|
|
{ \
|
|
|
|
return mp->m_features & XFS_FEAT_ ## NAME; \
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Some features can be added dynamically so they need a set wrapper, too. */
|
|
|
|
/*
 * Expands to the xfs_has_<name>() predicate (via __XFS_HAS_FEAT) plus a
 * setter xfs_add_<name>(mp).  The setter ORs XFS_FEAT_<NAME> into
 * mp->m_features and then calls xfs_sb_version_add<name>() on &mp->m_sb,
 * the in-memory copy of the superblock.
 *
 * NOTE(review): the ';' after the nested __XFS_HAS_FEAT() expansion leaves
 * an empty declaration at file scope; compilers accept it but strict ISO C
 * (-Wpedantic) warns -- confirm whether it is worth dropping.
 */
#define __XFS_ADD_FEAT(name, NAME) \
|
|
|
|
__XFS_HAS_FEAT(name, NAME); \
|
|
|
|
static inline void xfs_add_ ## name (struct xfs_mount *mp) \
|
|
|
|
{ \
|
|
|
|
mp->m_features |= XFS_FEAT_ ## NAME; \
|
|
|
|
xfs_sb_version_add ## name(&mp->m_sb); \
|
|
|
|
}
|
|
|
|
|
2021-08-19 01:46:51 +00:00
|
|
|
/* Superblock features */
|
2021-08-19 01:46:26 +00:00
|
|
|
__XFS_ADD_FEAT(attr, ATTR)
|
|
|
|
__XFS_HAS_FEAT(nlink, NLINK)
|
|
|
|
__XFS_ADD_FEAT(quota, QUOTA)
|
|
|
|
__XFS_HAS_FEAT(dalign, DALIGN)
|
|
|
|
__XFS_HAS_FEAT(sector, SECTOR)
|
|
|
|
__XFS_HAS_FEAT(asciici, ASCIICI)
|
|
|
|
__XFS_HAS_FEAT(parent, PARENT)
|
|
|
|
__XFS_HAS_FEAT(ftype, FTYPE)
|
|
|
|
__XFS_HAS_FEAT(finobt, FINOBT)
|
|
|
|
__XFS_HAS_FEAT(rmapbt, RMAPBT)
|
|
|
|
__XFS_HAS_FEAT(reflink, REFLINK)
|
|
|
|
__XFS_HAS_FEAT(sparseinodes, SPINODES)
|
|
|
|
__XFS_HAS_FEAT(metauuid, META_UUID)
|
|
|
|
__XFS_HAS_FEAT(realtime, REALTIME)
|
2021-08-19 01:46:37 +00:00
|
|
|
__XFS_HAS_FEAT(inobtcounts, INOBTCNT)
|
|
|
|
__XFS_HAS_FEAT(bigtime, BIGTIME)
|
|
|
|
__XFS_HAS_FEAT(needsrepair, NEEDSREPAIR)
|
2021-11-16 08:39:32 +00:00
|
|
|
__XFS_HAS_FEAT(large_extent_counts, NREXT64)
|
2024-04-15 21:54:15 +00:00
|
|
|
__XFS_HAS_FEAT(exchange_range, EXCHANGE_RANGE)
|
2021-08-19 01:46:26 +00:00
|
|
|
|
2024-04-22 06:13:16 +00:00
|
|
|
/*
|
|
|
|
* Some features are always on for v5 file systems, allow the compiler to
|
|
|
|
* eliminate dead code when building without v4 support.
|
|
|
|
*/
|
|
|
|
/*
 * Generate xfs_has_<name>(mp).  When CONFIG_XFS_SUPPORT_V4 is not enabled the
 * left operand of the || is true, so the predicate returns true without
 * looking at mp; otherwise it tests XFS_FEAT_<NAME> in mp->m_features.
 */
#define __XFS_HAS_V4_FEAT(name, NAME) \
|
|
|
|
static inline bool xfs_has_ ## name (struct xfs_mount *mp) \
|
|
|
|
{ \
|
|
|
|
return !IS_ENABLED(CONFIG_XFS_SUPPORT_V4) || \
|
|
|
|
(mp->m_features & XFS_FEAT_ ## NAME); \
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Expands to the xfs_has_<name>() predicate (via __XFS_HAS_V4_FEAT) plus a
 * setter xfs_add_<name>(mp).  The setter does nothing unless
 * CONFIG_XFS_SUPPORT_V4 is enabled; in that case it ORs XFS_FEAT_<NAME> into
 * mp->m_features and calls xfs_sb_version_add<name>() on &mp->m_sb.
 *
 * NOTE(review): the ';' after the nested __XFS_HAS_V4_FEAT() expansion leaves
 * an empty declaration at file scope; compilers accept it but strict ISO C
 * (-Wpedantic) warns -- confirm whether it is worth dropping.
 */
#define __XFS_ADD_V4_FEAT(name, NAME) \
|
|
|
|
__XFS_HAS_V4_FEAT(name, NAME); \
|
|
|
|
static inline void xfs_add_ ## name (struct xfs_mount *mp) \
|
|
|
|
{ \
|
|
|
|
if (IS_ENABLED(CONFIG_XFS_SUPPORT_V4)) { \
|
|
|
|
mp->m_features |= XFS_FEAT_ ## NAME; \
|
|
|
|
xfs_sb_version_add ## name(&mp->m_sb); \
|
|
|
|
} \
|
|
|
|
}
|
|
|
|
|
|
|
|
__XFS_HAS_V4_FEAT(align, ALIGN)
|
|
|
|
__XFS_HAS_V4_FEAT(logv2, LOGV2)
|
|
|
|
__XFS_HAS_V4_FEAT(extflg, EXTFLG)
|
|
|
|
__XFS_HAS_V4_FEAT(lazysbcount, LAZYSBCOUNT)
|
|
|
|
__XFS_ADD_V4_FEAT(attr2, ATTR2)
|
|
|
|
__XFS_ADD_V4_FEAT(projid32, PROJID32)
|
|
|
|
__XFS_HAS_V4_FEAT(v3inodes, V3INODES)
|
|
|
|
__XFS_HAS_V4_FEAT(crc, CRC)
|
|
|
|
__XFS_HAS_V4_FEAT(pquotino, PQUOTINO)
|
|
|
|
|
2021-08-19 01:46:51 +00:00
|
|
|
/*
|
|
|
|
* Mount features
|
|
|
|
*
|
2021-08-19 01:46:52 +00:00
|
|
|
* These do not change dynamically - features that can come and go, such as 32
|
|
|
|
* bit inodes and read-only state, are kept as operational state rather than
|
2021-08-19 01:46:51 +00:00
|
|
|
* features.
|
|
|
|
*/
|
|
|
|
__XFS_HAS_FEAT(noattr2, NOATTR2)
|
|
|
|
__XFS_HAS_FEAT(noalign, NOALIGN)
|
|
|
|
__XFS_HAS_FEAT(allocsize, ALLOCSIZE)
|
|
|
|
__XFS_HAS_FEAT(large_iosize, LARGE_IOSIZE)
|
|
|
|
__XFS_HAS_FEAT(wsync, WSYNC)
|
|
|
|
__XFS_HAS_FEAT(dirsync, DIRSYNC)
|
|
|
|
__XFS_HAS_FEAT(discard, DISCARD)
|
|
|
|
__XFS_HAS_FEAT(grpid, GRPID)
|
|
|
|
__XFS_HAS_FEAT(small_inums, SMALL_INUMS)
|
|
|
|
__XFS_HAS_FEAT(ikeep, IKEEP)
|
|
|
|
__XFS_HAS_FEAT(swalloc, SWALLOC)
|
|
|
|
__XFS_HAS_FEAT(filestreams, FILESTREAMS)
|
|
|
|
__XFS_HAS_FEAT(dax_always, DAX_ALWAYS)
|
|
|
|
__XFS_HAS_FEAT(dax_never, DAX_NEVER)
|
|
|
|
__XFS_HAS_FEAT(norecovery, NORECOVERY)
|
|
|
|
__XFS_HAS_FEAT(nouuid, NOUUID)
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
/*
|
2021-08-19 01:46:52 +00:00
|
|
|
* Operational mount state flags
|
|
|
|
*
|
|
|
|
* Use these with atomic bit ops only!
|
2005-04-16 22:20:36 +00:00
|
|
|
*/
|
2021-08-19 01:46:52 +00:00
|
|
|
#define XFS_OPSTATE_UNMOUNTING 0 /* filesystem is unmounting */
|
|
|
|
#define XFS_OPSTATE_CLEAN 1 /* mount was clean */
|
|
|
|
#define XFS_OPSTATE_SHUTDOWN 2 /* stop all fs operations */
|
|
|
|
#define XFS_OPSTATE_INODE32 3 /* inode32 allocator active */
|
|
|
|
#define XFS_OPSTATE_READONLY 4 /* read-only fs */
|
2015-06-03 23:19:18 +00:00
|
|
|
|
2021-08-06 18:05:39 +00:00
|
|
|
/*
|
|
|
|
* If set, inactivation worker threads will be scheduled to process queued
|
|
|
|
* inodegc work. If not, queued inodes remain in memory waiting to be
|
|
|
|
* processed.
|
|
|
|
*/
|
2021-08-19 01:46:52 +00:00
|
|
|
#define XFS_OPSTATE_INODEGC_ENABLED 5
|
2021-08-06 18:05:42 +00:00
|
|
|
/*
|
|
|
|
* If set, background speculative prealloc gc worker threads will be scheduled
|
|
|
|
* to process queued blockgc work. If not, inodes retain their preallocations
|
|
|
|
* until explicitly deleted.
|
|
|
|
*/
|
2021-08-19 01:46:52 +00:00
|
|
|
#define XFS_OPSTATE_BLOCKGC_ENABLED 6
|
2021-08-06 18:05:39 +00:00
|
|
|
|
2022-05-27 00:31:34 +00:00
|
|
|
/* Kernel has logged a warning about online fsck being used on this fs. */
|
|
|
|
#define XFS_OPSTATE_WARNED_SCRUB 7
|
|
|
|
/* Kernel has logged a warning about shrink being used on this fs. */
|
|
|
|
#define XFS_OPSTATE_WARNED_SHRINK 8
|
2022-05-27 00:32:07 +00:00
|
|
|
/* Kernel has logged a warning about logged xattr updates being used. */
|
|
|
|
#define XFS_OPSTATE_WARNED_LARP 9
|
2023-09-11 15:39:08 +00:00
|
|
|
/* Mount time quotacheck is running */
|
|
|
|
#define XFS_OPSTATE_QUOTACHECK_RUNNING 10
|
xfs: only clear log incompat flags at clean unmount
While reviewing the online fsck patchset, someone spied the
xfs_swapext_can_use_without_log_assistance function and wondered why we
go through this inverted-bitmask dance to avoid setting the
XFS_SB_FEAT_INCOMPAT_LOG_SWAPEXT feature.
(The same principles apply to the logged extended attribute update
feature bit in the since-merged LARP series.)
The reason for this dance is that xfs_add_incompat_log_feature is an
expensive operation -- it forces the log, pushes the AIL, and then if
nobody's beaten us to it, sets the feature bit and issues a synchronous
write of the primary superblock. That could be a one-time cost
amortized over the life of the filesystem, but the log quiesce and cover
operations call xfs_clear_incompat_log_features to remove feature bits
opportunistically. On a moderately loaded filesystem this leads to us
cycling those bits on and off over and over, which hurts performance.
Why do we clear the log incompat bits? Back in ~2020 I think Dave and I
had a conversation on IRC[2] about what the log incompat bits represent.
IIRC in that conversation we decided that the log incompat bits protect
unrecovered log items so that old kernels won't try to recover them and
barf. Since a clean log has no protected log items, we could clear the
bits at cover/quiesce time.
As Dave Chinner pointed out in the thread, clearing log incompat bits at
unmount time has positive effects for golden root disk image generator
setups, since the generator could be running a newer kernel than what
gets written to the golden image -- if there are log incompat fields set
in the golden image that was generated by a newer kernel/OS image
builder then the provisioning host cannot mount the filesystem even
though the log is clean and recovery is unnecessary to mount the
filesystem.
Given that it's expensive to set log incompat bits, we really only want
to do that once per bit per mount. Therefore, I propose that we only
clear log incompat bits as part of writing a clean unmount record. Do
this by adding an operational state flag to the xfs mount that guards
whether or not the feature bit clearing can actually take place.
This eliminates the l_incompat_users rwsem that we use to protect a log
cleaning operation from clearing a feature bit that a frontend thread is
trying to set -- this lock adds another way to fail w.r.t. locking. For
the swapext series, I shard that into multiple locks just to work around
the lockdep complaints, and that's fugly.
Link: https://lore.kernel.org/linux-xfs/20240131230043.GA6180@frogsfrogsfrogs/
Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Reviewed-by: Dave Chinner <dchinner@redhat.com>
2024-04-15 21:54:06 +00:00
|
|
|
/* Do we want to clear log incompat flags? */
|
|
|
|
#define XFS_OPSTATE_UNSET_LOG_INCOMPAT 11
|
2024-04-22 16:47:25 +00:00
|
|
|
/* Filesystem can use logged extended attributes */
|
|
|
|
#define XFS_OPSTATE_USE_LARP 12
|
2022-05-27 00:31:34 +00:00
|
|
|
|
2021-08-06 18:05:39 +00:00
|
|
|
/*
 * Generate three static inline helpers operating on bit XFS_OPSTATE_<NAME>
 * of mp->m_opstate:
 *
 *   xfs_is_<name>(mp)    - returns the result of test_bit()
 *   xfs_clear_<name>(mp) - returns the result of test_and_clear_bit()
 *   xfs_set_<name>(mp)   - returns the result of test_and_set_bit()
 *
 * The clear/set helpers therefore report the value the bit had before the
 * call, not the value it has afterwards.
 */
#define __XFS_IS_OPSTATE(name, NAME) \
|
|
|
|
static inline bool xfs_is_ ## name (struct xfs_mount *mp) \
|
|
|
|
{ \
|
|
|
|
return test_bit(XFS_OPSTATE_ ## NAME, &mp->m_opstate); \
|
|
|
|
} \
|
|
|
|
static inline bool xfs_clear_ ## name (struct xfs_mount *mp) \
|
|
|
|
{ \
|
|
|
|
return test_and_clear_bit(XFS_OPSTATE_ ## NAME, &mp->m_opstate); \
|
|
|
|
} \
|
|
|
|
static inline bool xfs_set_ ## name (struct xfs_mount *mp) \
|
|
|
|
{ \
|
|
|
|
return test_and_set_bit(XFS_OPSTATE_ ## NAME, &mp->m_opstate); \
|
|
|
|
}
|
|
|
|
|
2021-08-19 01:46:52 +00:00
|
|
|
__XFS_IS_OPSTATE(unmounting, UNMOUNTING)
|
|
|
|
__XFS_IS_OPSTATE(clean, CLEAN)
|
|
|
|
__XFS_IS_OPSTATE(shutdown, SHUTDOWN)
|
|
|
|
__XFS_IS_OPSTATE(inode32, INODE32)
|
|
|
|
__XFS_IS_OPSTATE(readonly, READONLY)
|
2021-08-06 18:05:39 +00:00
|
|
|
__XFS_IS_OPSTATE(inodegc_enabled, INODEGC_ENABLED)
|
2021-08-06 18:05:42 +00:00
|
|
|
__XFS_IS_OPSTATE(blockgc_enabled, BLOCKGC_ENABLED)
|
2023-09-11 15:39:08 +00:00
|
|
|
#ifdef CONFIG_XFS_QUOTA
|
|
|
|
__XFS_IS_OPSTATE(quotacheck_running, QUOTACHECK_RUNNING)
|
|
|
|
#else
|
|
|
|
# define xfs_is_quotacheck_running(mp) (false)
|
|
|
|
#endif
|
xfs: only clear log incompat flags at clean unmount
While reviewing the online fsck patchset, someone spied the
xfs_swapext_can_use_without_log_assistance function and wondered why we
go through this inverted-bitmask dance to avoid setting the
XFS_SB_FEAT_INCOMPAT_LOG_SWAPEXT feature.
(The same principles apply to the logged extended attribute update
feature bit in the since-merged LARP series.)
The reason for this dance is that xfs_add_incompat_log_feature is an
expensive operation -- it forces the log, pushes the AIL, and then if
nobody's beaten us to it, sets the feature bit and issues a synchronous
write of the primary superblock. That could be a one-time cost
amortized over the life of the filesystem, but the log quiesce and cover
operations call xfs_clear_incompat_log_features to remove feature bits
opportunistically. On a moderately loaded filesystem this leads to us
cycling those bits on and off over and over, which hurts performance.
Why do we clear the log incompat bits? Back in ~2020 I think Dave and I
had a conversation on IRC[2] about what the log incompat bits represent.
IIRC in that conversation we decided that the log incompat bits protect
unrecovered log items so that old kernels won't try to recover them and
barf. Since a clean log has no protected log items, we could clear the
bits at cover/quiesce time.
As Dave Chinner pointed out in the thread, clearing log incompat bits at
unmount time has positive effects for golden root disk image generator
setups, since the generator could be running a newer kernel than what
gets written to the golden image -- if there are log incompat fields set
in the golden image that was generated by a newer kernel/OS image
builder then the provisioning host cannot mount the filesystem even
though the log is clean and recovery is unnecessary to mount the
filesystem.
Given that it's expensive to set log incompat bits, we really only want
to do that once per bit per mount. Therefore, I propose that we only
clear log incompat bits as part of writing a clean unmount record. Do
this by adding an operational state flag to the xfs mount that guards
whether or not the feature bit clearing can actually take place.
This eliminates the l_incompat_users rwsem that we use to protect a log
cleaning operation from clearing a feature bit that a frontend thread is
trying to set -- this lock adds another way to fail w.r.t. locking. For
the swapext series, I shard that into multiple locks just to work around
the lockdep complaints, and that's fugly.
Link: https://lore.kernel.org/linux-xfs/20240131230043.GA6180@frogsfrogsfrogs/
Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Reviewed-by: Dave Chinner <dchinner@redhat.com>
2024-04-15 21:54:06 +00:00
|
|
|
__XFS_IS_OPSTATE(done_with_log_incompat, UNSET_LOG_INCOMPAT)
|
2024-04-22 16:47:25 +00:00
|
|
|
__XFS_IS_OPSTATE(using_logged_xattrs, USE_LARP)
|
2021-08-06 18:05:39 +00:00
|
|
|
|
2022-05-27 00:31:34 +00:00
|
|
|
/*
 * Set bit @nr in mp->m_opstate and report whether this call was the one that
 * set it: returns true if the bit was clear beforehand, false if it was
 * already set.  Presumably used with the XFS_OPSTATE_WARNED_* bits so that
 * each warning is logged only once per mount -- confirm against callers.
 */
static inline bool
|
|
|
|
xfs_should_warn(struct xfs_mount *mp, long nr)
|
|
|
|
{
|
|
|
|
return !test_and_set_bit(nr, &mp->m_opstate);
|
|
|
|
}
|
|
|
|
|
2021-08-06 18:05:39 +00:00
|
|
|
/*
 * Initializer list pairing each operational-state bit mask
 * (1UL << XFS_OPSTATE_*) with a short human-readable label.
 * NOTE(review): presumably consumed by tracepoint flag printing
 * (e.g. __print_flags) -- confirm against the users of this macro.
 */
#define XFS_OPSTATE_STRINGS \
|
2021-08-19 01:46:52 +00:00
|
|
|
{ (1UL << XFS_OPSTATE_UNMOUNTING), "unmounting" }, \
|
|
|
|
{ (1UL << XFS_OPSTATE_CLEAN), "clean" }, \
|
|
|
|
{ (1UL << XFS_OPSTATE_SHUTDOWN), "shutdown" }, \
|
|
|
|
{ (1UL << XFS_OPSTATE_INODE32), "inode32" }, \
|
|
|
|
{ (1UL << XFS_OPSTATE_READONLY), "read_only" }, \
|
2021-08-06 18:05:42 +00:00
|
|
|
{ (1UL << XFS_OPSTATE_INODEGC_ENABLED), "inodegc" }, \
|
2022-05-27 00:31:34 +00:00
|
|
|
{ (1UL << XFS_OPSTATE_BLOCKGC_ENABLED), "blockgc" }, \
|
|
|
|
{ (1UL << XFS_OPSTATE_WARNED_SCRUB), "wscrub" }, \
|
2022-05-27 00:32:07 +00:00
|
|
|
{ (1UL << XFS_OPSTATE_WARNED_SHRINK), "wshrink" }, \
|
2023-09-11 15:39:08 +00:00
|
|
|
{ (1UL << XFS_OPSTATE_WARNED_LARP), "wlarp" }, \
|
xfs: only clear log incompat flags at clean unmount
While reviewing the online fsck patchset, someone spied the
xfs_swapext_can_use_without_log_assistance function and wondered why we
go through this inverted-bitmask dance to avoid setting the
XFS_SB_FEAT_INCOMPAT_LOG_SWAPEXT feature.
(The same principles apply to the logged extended attribute update
feature bit in the since-merged LARP series.)
The reason for this dance is that xfs_add_incompat_log_feature is an
expensive operation -- it forces the log, pushes the AIL, and then if
nobody's beaten us to it, sets the feature bit and issues a synchronous
write of the primary superblock. That could be a one-time cost
amortized over the life of the filesystem, but the log quiesce and cover
operations call xfs_clear_incompat_log_features to remove feature bits
opportunistically. On a moderately loaded filesystem this leads to us
cycling those bits on and off over and over, which hurts performance.
Why do we clear the log incompat bits? Back in ~2020 I think Dave and I
had a conversation on IRC[2] about what the log incompat bits represent.
IIRC in that conversation we decided that the log incompat bits protect
unrecovered log items so that old kernels won't try to recover them and
barf. Since a clean log has no protected log items, we could clear the
bits at cover/quiesce time.
As Dave Chinner pointed out in the thread, clearing log incompat bits at
unmount time has positive effects for golden root disk image generator
setups, since the generator could be running a newer kernel than what
gets written to the golden image -- if there are log incompat fields set
in the golden image that was generated by a newer kernel/OS image
builder then the provisioning host cannot mount the filesystem even
though the log is clean and recovery is unnecessary to mount the
filesystem.
Given that it's expensive to set log incompat bits, we really only want
to do that once per bit per mount. Therefore, I propose that we only
clear log incompat bits as part of writing a clean unmount record. Do
this by adding an operational state flag to the xfs mount that guards
whether or not the feature bit clearing can actually take place.
This eliminates the l_incompat_users rwsem that we use to protect a log
cleaning operation from clearing a feature bit that a frontend thread is
trying to set -- this lock adds another way to fail w.r.t. locking. For
the swapext series, I shard that into multiple locks just to work around
the lockdep complaints, and that's fugly.
Link: https://lore.kernel.org/linux-xfs/20240131230043.GA6180@frogsfrogsfrogs/
Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Reviewed-by: Dave Chinner <dchinner@redhat.com>
2024-04-15 21:54:06 +00:00
|
|
|
{ (1UL << XFS_OPSTATE_QUOTACHECK_RUNNING), "quotacheck" }, \
|
2024-04-22 16:47:25 +00:00
|
|
|
{ (1UL << XFS_OPSTATE_UNSET_LOG_INCOMPAT), "unset_log_incompat" }, \
|
|
|
|
{ (1UL << XFS_OPSTATE_USE_LARP), "logged_xattrs" }
|
2021-08-06 18:05:39 +00:00
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
/*
|
2005-05-05 20:28:29 +00:00
|
|
|
* Max and min values for mount-option defined I/O
|
|
|
|
* preallocation sizes.
|
2005-04-16 22:20:36 +00:00
|
|
|
*/
|
2005-05-05 20:28:29 +00:00
|
|
|
/* Both limits are log2 byte counts: 30 means 1 << 30 bytes. */
#define XFS_MAX_IO_LOG 30 /* 1G */
|
2005-04-16 22:20:36 +00:00
|
|
|
#define XFS_MIN_IO_LOG PAGE_SHIFT /* log2 of the page size, i.e. one page */
|
|
|
|
|
2022-04-21 00:47:38 +00:00
|
|
|
/*
 * Shutdown entry point.  @fname and @lnnum identify the call site; use the
 * xfs_force_shutdown() wrapper below so they are filled in automatically.
 */
void xfs_do_force_shutdown(struct xfs_mount *mp, uint32_t flags, char *fname,
|
2007-08-30 07:20:39 +00:00
|
|
|
int lnnum);
|
2005-04-16 22:20:36 +00:00
|
|
|
/* Call xfs_do_force_shutdown() with the caller's __FILE__ and __LINE__. */
#define xfs_force_shutdown(m,f) \
|
2007-08-30 07:20:39 +00:00
|
|
|
xfs_do_force_shutdown(m, f, __FILE__, __LINE__)
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2022-04-21 00:47:38 +00:00
|
|
|
/*
 * Shutdown reason flags.  Each reason occupies its own bit so that several
 * can be combined in a single uint32_t flags word.
 */
#define SHUTDOWN_META_IO_ERROR	(1u << 0) /* write attempt to metadata failed */
#define SHUTDOWN_LOG_IO_ERROR	(1u << 1) /* write attempt to the log failed */
#define SHUTDOWN_FORCE_UMOUNT	(1u << 2) /* shutdown from a forced unmount */
#define SHUTDOWN_CORRUPT_INCORE	(1u << 3) /* corrupt in-memory structures */
#define SHUTDOWN_CORRUPT_ONDISK	(1u << 4) /* corrupt metadata on device */
#define SHUTDOWN_DEVICE_REMOVED	(1u << 5) /* device removed underneath us */

/*
 * Initializer list pairing every SHUTDOWN_* flag with a short label.
 *
 * Every flag defined above must have an entry here, otherwise that reason
 * has no symbolic name when the flags word is decoded.  The existing labels
 * are kept unchanged; SHUTDOWN_CORRUPT_ONDISK previously had no entry.
 */
#define XFS_SHUTDOWN_STRINGS \
	{ SHUTDOWN_META_IO_ERROR,	"metadata_io" }, \
	{ SHUTDOWN_LOG_IO_ERROR,	"log_io" }, \
	{ SHUTDOWN_FORCE_UMOUNT,	"force_umount" }, \
	{ SHUTDOWN_CORRUPT_INCORE,	"corruption" }, \
	{ SHUTDOWN_CORRUPT_ONDISK,	"ondisk_corruption" }, \
	{ SHUTDOWN_DEVICE_REMOVED,	"device_removed" }
|
2021-08-11 00:00:54 +00:00
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
/*
|
|
|
|
* Flags for xfs_mountfs
|
|
|
|
*/
|
2006-03-31 03:04:17 +00:00
|
|
|
/*
 * NOTE(review): xfs_mountfs() as declared in this header takes only the
 * mount pointer, so the heading above looks stale.  Presumably this flag is
 * passed through the int argument of xfs_readsb() -- confirm with callers.
 */
#define XFS_MFSI_QUIET 0x40 /* Be silent if mount errors found */
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2005-11-02 03:38:42 +00:00
|
|
|
static inline xfs_agnumber_t
|
|
|
|
xfs_daddr_to_agno(struct xfs_mount *mp, xfs_daddr_t d)
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
2017-04-19 22:19:32 +00:00
|
|
|
xfs_rfsblock_t ld = XFS_BB_TO_FSBT(mp, d);
|
2005-11-02 03:38:42 +00:00
|
|
|
do_div(ld, mp->m_sb.sb_agblocks);
|
|
|
|
return (xfs_agnumber_t) ld;
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
|
|
|
|
2005-11-02 03:38:42 +00:00
|
|
|
static inline xfs_agblock_t
|
|
|
|
xfs_daddr_to_agbno(struct xfs_mount *mp, xfs_daddr_t d)
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
2017-04-19 22:19:32 +00:00
|
|
|
xfs_rfsblock_t ld = XFS_BB_TO_FSBT(mp, d);
|
2005-11-02 03:38:42 +00:00
|
|
|
return (xfs_agblock_t) do_div(ld, mp->m_sb.sb_agblocks);
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
|
|
|
|
2015-11-03 02:06:34 +00:00
|
|
|
extern void xfs_uuid_table_free(void);
|
2017-06-16 18:00:05 +00:00
|
|
|
extern uint64_t xfs_default_resblks(xfs_mount_t *mp);
|
2008-08-13 06:49:32 +00:00
|
|
|
extern int xfs_mountfs(xfs_mount_t *mp);
|
2008-08-13 06:49:57 +00:00
|
|
|
extern void xfs_unmountfs(xfs_mount_t *);
|
2015-02-23 10:24:37 +00:00
|
|
|
|
2021-08-06 18:05:40 +00:00
|
|
|
/*
|
|
|
|
* Deltas for the block count can vary from 1 to very large, but lock contention
|
|
|
|
* only occurs on frequent small block count updates such as in the delayed
|
|
|
|
* allocation path for buffered writes (page-at-a-time updates). Hence we set
|
|
|
|
* a large batch count (1024) to minimise global counter updates except when
|
|
|
|
* we get near to ENOSPC and we have to be very accurate with our updates.
|
|
|
|
*/
|
|
|
|
#define XFS_FDBLOCKS_BATCH 1024
|
|
|
|
|
xfs: don't include bnobt blocks when reserving free block pool
xfs_reserve_blocks controls the size of the user-visible free space
reserve pool. Given the difference between the current and requested
pool sizes, it will try to reserve free space from fdblocks. However,
the amount requested from fdblocks is also constrained by the amount of
space that we think xfs_mod_fdblocks will give us. If we forget to
subtract m_allocbt_blks before calling xfs_mod_fdblocks, it will
return ENOSPC and we'll hang the kernel at mount due to the infinite
loop.
In commit fd43cf600cf6, we decided that xfs_mod_fdblocks should not hand
out the "free space" used by the free space btrees, because some portion
of the free space btrees hold in reserve space for future btree
expansion. Unfortunately, xfs_reserve_blocks' estimation of the number
of blocks that it could request from xfs_mod_fdblocks was not updated to
include m_allocbt_blks, so if space is extremely low, the caller hangs.
Fix this by creating a function to estimate the number of blocks that
can be reserved from fdblocks, which needs to exclude the set-aside and
m_allocbt_blks.
Found by running xfs/306 (which formats a single-AG 20MB filesystem)
with an fstests configuration that specifies a 1k blocksize and a
specially crafted log size that will consume 7/8 of the space (17920
blocks, specifically) in that AG.
Cc: Brian Foster <bfoster@redhat.com>
Fixes: fd43cf600cf6 ("xfs: set aside allocation btree blocks from block reservation")
Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Brian Foster <bfoster@redhat.com>
Reviewed-by: Dave Chinner <dchinner@redhat.com>
2022-03-16 18:54:18 +00:00
|
|
|
/*
|
|
|
|
* Estimate the amount of free space that is not available to userspace and is
|
|
|
|
* not explicitly reserved from the incore fdblocks. This includes:
|
|
|
|
*
|
|
|
|
* - The minimum number of blocks needed to support splitting a bmap btree
|
|
|
|
* - The blocks currently in use by the freespace btrees because they record
|
|
|
|
* the actual blocks that will fill per-AG metadata space reservations
|
|
|
|
*/
|
|
|
|
static inline uint64_t
|
|
|
|
xfs_fdblocks_unavailable(
|
|
|
|
struct xfs_mount *mp)
|
|
|
|
{
|
|
|
|
return mp->m_alloc_set_aside + atomic64_read(&mp->m_allocbt_blks);
|
|
|
|
}
|
|
|
|
|
2024-04-22 11:20:12 +00:00
|
|
|
/*
 * Generic helpers that adjust one of the mount's per-cpu free space
 * counters by @delta.  The decrement can fail and returns an int status;
 * the increment returns nothing.
 */
int
xfs_dec_freecounter(
	struct xfs_mount	*mp,
	struct percpu_counter	*counter,
	uint64_t		delta,
	bool			rsvd);

void
xfs_add_freecounter(
	struct xfs_mount	*mp,
	struct percpu_counter	*counter,
	uint64_t		delta);
|
2022-04-11 20:49:42 +00:00
|
|
|
|
2024-04-22 11:20:12 +00:00
|
|
|
static inline int xfs_dec_fdblocks(struct xfs_mount *mp, uint64_t delta,
|
|
|
|
bool reserved)
|
2022-04-11 20:49:42 +00:00
|
|
|
{
|
2024-04-22 11:20:12 +00:00
|
|
|
return xfs_dec_freecounter(mp, &mp->m_fdblocks, delta, reserved);
|
2022-04-11 20:49:42 +00:00
|
|
|
}
|
|
|
|
|
2024-04-22 11:20:12 +00:00
|
|
|
static inline void xfs_add_fdblocks(struct xfs_mount *mp, uint64_t delta)
|
2022-04-11 20:49:42 +00:00
|
|
|
{
|
2024-04-22 11:20:12 +00:00
|
|
|
xfs_add_freecounter(mp, &mp->m_fdblocks, delta);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int xfs_dec_frextents(struct xfs_mount *mp, uint64_t delta)
|
|
|
|
{
|
|
|
|
return xfs_dec_freecounter(mp, &mp->m_frextents, delta, false);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void xfs_add_frextents(struct xfs_mount *mp, uint64_t delta)
|
|
|
|
{
|
|
|
|
xfs_add_freecounter(mp, &mp->m_frextents, delta);
|
2022-04-11 20:49:42 +00:00
|
|
|
}
|
2015-02-23 10:22:54 +00:00
|
|
|
|
2006-03-31 03:04:17 +00:00
|
|
|
extern int xfs_readsb(xfs_mount_t *, int);
|
2005-04-16 22:20:36 +00:00
|
|
|
extern void xfs_freesb(xfs_mount_t *);
|
2014-11-28 03:02:59 +00:00
|
|
|
extern bool xfs_fs_writable(struct xfs_mount *mp, int level);
|
2017-06-16 18:00:05 +00:00
|
|
|
extern int xfs_sb_validate_fsb_count(struct xfs_sb *, uint64_t);
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2010-02-17 19:36:13 +00:00
|
|
|
extern int xfs_dev_is_read_only(struct xfs_mount *, char *);
|
|
|
|
|
2011-01-04 00:35:03 +00:00
|
|
|
extern void xfs_set_low_space_thresholds(struct xfs_mount *);
|
|
|
|
|
2015-11-03 01:27:22 +00:00
|
|
|
int xfs_zero_extent(struct xfs_inode *ip, xfs_fsblock_t start_fsb,
|
|
|
|
xfs_off_t count_fsb);
|
|
|
|
|
2016-05-18 01:05:33 +00:00
|
|
|
struct xfs_error_cfg * xfs_error_get_cfg(struct xfs_mount *mp,
|
|
|
|
int error_class, int error);
|
2018-07-20 16:28:40 +00:00
|
|
|
void xfs_force_summary_recalc(struct xfs_mount *mp);
|
2021-08-08 15:27:12 +00:00
|
|
|
int xfs_add_incompat_log_feature(struct xfs_mount *mp, uint32_t feature);
|
|
|
|
bool xfs_clear_incompat_log_features(struct xfs_mount *mp);
|
2024-04-22 11:20:15 +00:00
|
|
|
void xfs_mod_delalloc(struct xfs_inode *ip, int64_t data_delta,
|
|
|
|
int64_t ind_delta);
|
2016-05-18 01:05:33 +00:00
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
#endif /* __XFS_MOUNT_H__ */
|