xfs_mount.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439
  // SPDX-License-Identifier: GPL-2.0
  /*
   * Copyright (c) 2000-2005 Silicon Graphics, Inc.
   * All Rights Reserved.
   */
  6. #ifndef __XFS_MOUNT_H__
  7. #define __XFS_MOUNT_H__
  /*
   * Forward declarations for types that this header only refers to through
   * pointers, so their full definitions are not needed here.
   */
  struct xlog;
  struct xfs_inode;
  struct xfs_mru_cache;
  struct xfs_nameops;
  struct xfs_ail;
  struct xfs_quotainfo;
  struct xfs_dir_ops;
  struct xfs_da_geometry;
  /*
   * Dynamic preallocation free space thresholds, 5% down to 1%.
   *
   * The values index the m_low_space[] array in struct xfs_mount;
   * XFS_LOWSP_MAX is the number of thresholds and sizes that array.
   */
  enum {
      XFS_LOWSP_1_PCNT = 0,
      XFS_LOWSP_2_PCNT,
      XFS_LOWSP_3_PCNT,
      XFS_LOWSP_4_PCNT,
      XFS_LOWSP_5_PCNT,
      XFS_LOWSP_MAX,
  };
  /*
   * Error Configuration
   *
   * Error classes define the subsystem the configuration belongs to.
   * Error numbers define the errors that are configurable.
   *
   * XFS_ERR_CLASS_MAX counts the classes and sizes the first dimension of
   * m_error_cfg[][] in struct xfs_mount.
   */
  enum {
      XFS_ERR_METADATA,
      XFS_ERR_CLASS_MAX,
  };
  /*
   * Configurable error numbers within an error class.
   *
   * XFS_ERR_ERRNO_MAX counts the entries and sizes the second dimension of
   * m_error_cfg[][] in struct xfs_mount.
   */
  enum {
      XFS_ERR_DEFAULT,
      XFS_ERR_EIO,
      XFS_ERR_ENOSPC,
      XFS_ERR_ENODEV,
      XFS_ERR_ERRNO_MAX,
  };
  /* Special retry value meaning "retry forever"; parenthesized so it expands safely. */
  #define XFS_ERR_RETRY_FOREVER   (-1)
  43. /*
  44. * Although retry_timeout is in jiffies which is normally an unsigned long,
  45. * we limit the retry timeout to 86400 seconds, or one day. So even a
  46. * signed 32-bit long is sufficient for a HZ value up to 24855. Making it
  47. * signed lets us store the special "-1" value, meaning retry forever.
  48. */
  49. struct xfs_error_cfg {
  50. struct xfs_kobj kobj;
  51. int max_retries;
  52. long retry_timeout; /* in jiffies, -1 = infinite */
  53. };
  54. typedef struct xfs_mount {
  55. struct super_block *m_super;
  56. xfs_tid_t m_tid; /* next unused tid for fs */
  57. struct xfs_ail *m_ail; /* fs active log item list */
  58. struct xfs_sb m_sb; /* copy of fs superblock */
  59. spinlock_t m_sb_lock; /* sb counter lock */
  60. struct percpu_counter m_icount; /* allocated inodes counter */
  61. struct percpu_counter m_ifree; /* free inodes counter */
  62. struct percpu_counter m_fdblocks; /* free block counter */
  63. struct xfs_buf *m_sb_bp; /* buffer for superblock */
  64. char *m_fsname; /* filesystem name */
  65. int m_fsname_len; /* strlen of fs name */
  66. char *m_rtname; /* realtime device name */
  67. char *m_logname; /* external log device name */
  68. int m_bsize; /* fs logical block size */
  69. xfs_agnumber_t m_agfrotor; /* last ag where space found */
  70. xfs_agnumber_t m_agirotor; /* last ag dir inode alloced */
  71. spinlock_t m_agirotor_lock;/* .. and lock protecting it */
  72. xfs_agnumber_t m_maxagi; /* highest inode alloc group */
  73. uint m_readio_log; /* min read size log bytes */
  74. uint m_readio_blocks; /* min read size blocks */
  75. uint m_writeio_log; /* min write size log bytes */
  76. uint m_writeio_blocks; /* min write size blocks */
  77. struct xfs_da_geometry *m_dir_geo; /* directory block geometry */
  78. struct xfs_da_geometry *m_attr_geo; /* attribute block geometry */
  79. struct xlog *m_log; /* log specific stuff */
  80. int m_logbufs; /* number of log buffers */
  81. int m_logbsize; /* size of each log buffer */
  82. uint m_rsumlevels; /* rt summary levels */
  83. uint m_rsumsize; /* size of rt summary, bytes */
  84. struct xfs_inode *m_rbmip; /* pointer to bitmap inode */
  85. struct xfs_inode *m_rsumip; /* pointer to summary inode */
  86. struct xfs_inode *m_rootip; /* pointer to root directory */
  87. struct xfs_quotainfo *m_quotainfo; /* disk quota information */
  88. xfs_buftarg_t *m_ddev_targp; /* saves taking the address */
  89. xfs_buftarg_t *m_logdev_targp;/* ptr to log device */
  90. xfs_buftarg_t *m_rtdev_targp; /* ptr to rt device */
  91. uint8_t m_blkbit_log; /* blocklog + NBBY */
  92. uint8_t m_blkbb_log; /* blocklog - BBSHIFT */
  93. uint8_t m_agno_log; /* log #ag's */
  94. uint8_t m_agino_log; /* #bits for agino in inum */
  95. uint m_inode_cluster_size;/* min inode buf size */
  96. uint m_blockmask; /* sb_blocksize-1 */
  97. uint m_blockwsize; /* sb_blocksize in words */
  98. uint m_blockwmask; /* blockwsize-1 */
  99. uint m_alloc_mxr[2]; /* max alloc btree records */
  100. uint m_alloc_mnr[2]; /* min alloc btree records */
  101. uint m_bmap_dmxr[2]; /* max bmap btree records */
  102. uint m_bmap_dmnr[2]; /* min bmap btree records */
  103. uint m_inobt_mxr[2]; /* max inobt btree records */
  104. uint m_inobt_mnr[2]; /* min inobt btree records */
  105. uint m_rmap_mxr[2]; /* max rmap btree records */
  106. uint m_rmap_mnr[2]; /* min rmap btree records */
  107. uint m_refc_mxr[2]; /* max refc btree records */
  108. uint m_refc_mnr[2]; /* min refc btree records */
  109. uint m_ag_maxlevels; /* XFS_AG_MAXLEVELS */
  110. uint m_bm_maxlevels[2]; /* XFS_BM_MAXLEVELS */
  111. uint m_in_maxlevels; /* max inobt btree levels. */
  112. uint m_rmap_maxlevels; /* max rmap btree levels */
  113. uint m_refc_maxlevels; /* max refcount btree level */
  114. xfs_extlen_t m_ag_prealloc_blocks; /* reserved ag blocks */
  115. uint m_alloc_set_aside; /* space we can't use */
  116. uint m_ag_max_usable; /* max space per AG */
  117. struct radix_tree_root m_perag_tree; /* per-ag accounting info */
  118. spinlock_t m_perag_lock; /* lock for m_perag_tree */
  119. struct mutex m_growlock; /* growfs mutex */
  120. int m_fixedfsid[2]; /* unchanged for life of FS */
  121. uint64_t m_flags; /* global mount flags */
  122. bool m_finobt_nores; /* no per-AG finobt resv. */
  123. int m_ialloc_inos; /* inodes in inode allocation */
  124. int m_ialloc_blks; /* blocks in inode allocation */
  125. int m_ialloc_min_blks;/* min blocks in sparse inode
  126. * allocation */
  127. int m_inoalign_mask;/* mask sb_inoalignmt if used */
  128. uint m_qflags; /* quota status flags */
  129. struct xfs_trans_resv m_resv; /* precomputed res values */
  130. uint64_t m_maxicount; /* maximum inode count */
  131. uint64_t m_resblks; /* total reserved blocks */
  132. uint64_t m_resblks_avail;/* available reserved blocks */
  133. uint64_t m_resblks_save; /* reserved blks @ remount,ro */
  134. int m_dalign; /* stripe unit */
  135. int m_swidth; /* stripe width */
  136. int m_sinoalign; /* stripe unit inode alignment */
  137. uint8_t m_sectbb_log; /* sectlog - BBSHIFT */
  138. const struct xfs_nameops *m_dirnameops; /* vector of dir name ops */
  139. const struct xfs_dir_ops *m_dir_inode_ops; /* vector of dir inode ops */
  140. const struct xfs_dir_ops *m_nondir_inode_ops; /* !dir inode ops */
  141. uint m_chsize; /* size of next field */
  142. atomic_t m_active_trans; /* number trans frozen */
  143. struct xfs_mru_cache *m_filestream; /* per-mount filestream data */
  144. struct delayed_work m_reclaim_work; /* background inode reclaim */
  145. struct delayed_work m_eofblocks_work; /* background eof blocks
  146. trimming */
  147. struct delayed_work m_cowblocks_work; /* background cow blocks
  148. trimming */
  149. bool m_update_sb; /* sb needs update in mount */
  150. int64_t m_low_space[XFS_LOWSP_MAX];
  151. /* low free space thresholds */
  152. struct xfs_kobj m_kobj;
  153. struct xfs_kobj m_error_kobj;
  154. struct xfs_kobj m_error_meta_kobj;
  155. struct xfs_error_cfg m_error_cfg[XFS_ERR_CLASS_MAX][XFS_ERR_ERRNO_MAX];
  156. struct xstats m_stats; /* per-fs stats */
  157. struct workqueue_struct *m_buf_workqueue;
  158. struct workqueue_struct *m_data_workqueue;
  159. struct workqueue_struct *m_unwritten_workqueue;
  160. struct workqueue_struct *m_cil_workqueue;
  161. struct workqueue_struct *m_reclaim_workqueue;
  162. struct workqueue_struct *m_log_workqueue;
  163. struct workqueue_struct *m_eofblocks_workqueue;
  164. struct workqueue_struct *m_sync_workqueue;
  165. /*
  166. * Generation of the filesysyem layout. This is incremented by each
  167. * growfs, and used by the pNFS server to ensure the client updates
  168. * its view of the block device once it gets a layout that might
  169. * reference the newly added blocks. Does not need to be persistent
  170. * as long as we only allow file system size increments, but if we
  171. * ever support shrinks it would have to be persisted in addition
  172. * to various other kinds of pain inflicted on the pNFS server.
  173. */
  174. uint32_t m_generation;
  175. bool m_fail_unmount;
  176. #ifdef DEBUG
  177. /*
  178. * Frequency with which errors are injected. Replaces xfs_etest; the
  179. * value stored in here is the inverse of the frequency with which the
  180. * error triggers. 1 = always, 2 = half the time, etc.
  181. */
  182. unsigned int *m_errortag;
  183. struct xfs_kobj m_errortag_kobj;
  184. #endif
  185. } xfs_mount_t;
  /*
   * Flags for m_flags.
   *
   * m_flags is a uint64_t, so every flag is built from a 1ULL shift.  The
   * unused bit positions in the sequence below are intentional gaps and
   * are preserved as-is.
   */

  /* for nfs - all metadata ops must be synchronous except for space allocations */
  #define XFS_MOUNT_WSYNC         (1ULL << 0)
  #define XFS_MOUNT_UNMOUNTING    (1ULL << 1)   /* filesystem is unmounting */
  #define XFS_MOUNT_BAD_SUMMARY   (1ULL << 2)   /* summary counters are bad */
  #define XFS_MOUNT_WAS_CLEAN     (1ULL << 3)
  /* atomic stop of all filesystem operations, typically for disk errors in metadata */
  #define XFS_MOUNT_FS_SHUTDOWN   (1ULL << 4)
  #define XFS_MOUNT_DISCARD       (1ULL << 5)   /* discard unused blocks */
  #define XFS_MOUNT_NOALIGN       (1ULL << 7)   /* turn off stripe alignment allocations */
  #define XFS_MOUNT_ATTR2         (1ULL << 8)   /* allow use of attr2 format */
  #define XFS_MOUNT_GRPID         (1ULL << 9)   /* group-ID assigned from directory */
  #define XFS_MOUNT_NORECOVERY    (1ULL << 10)  /* no recovery - dirty fs */
  #define XFS_MOUNT_DFLT_IOSIZE   (1ULL << 12)  /* set default i/o size */
  #define XFS_MOUNT_SMALL_INUMS   (1ULL << 14)  /* user wants 32bit inodes */
  #define XFS_MOUNT_32BITINODES   (1ULL << 15)  /* inode32 allocator active */
  #define XFS_MOUNT_NOUUID        (1ULL << 16)  /* ignore uuid during mount */
  #define XFS_MOUNT_IKEEP         (1ULL << 18)  /* keep empty inode clusters */
  #define XFS_MOUNT_SWALLOC       (1ULL << 19)  /* turn on stripe width allocation */
  #define XFS_MOUNT_RDONLY        (1ULL << 20)  /* read-only fs */
  #define XFS_MOUNT_DIRSYNC       (1ULL << 21)  /* synchronous directory ops */
  /* don't report large preferred I/O size in stat() */
  #define XFS_MOUNT_COMPAT_IOSIZE (1ULL << 22)
  #define XFS_MOUNT_FILESTREAMS   (1ULL << 24)  /* enable the filestreams allocator */
  #define XFS_MOUNT_NOATTR2       (1ULL << 25)  /* disable use of attr2 format */

  #define XFS_MOUNT_DAX           (1ULL << 62)  /* TEST ONLY! */
  /*
   * Default minimum read and write sizes, expressed as log2 of the size
   * in bytes.
   */
  #define XFS_READIO_LOG_LARGE    16
  #define XFS_WRITEIO_LOG_LARGE   16

  /*
   * Max and min values for mount-option defined I/O
   * preallocation sizes.
   */
  #define XFS_MAX_IO_LOG          30  /* 1G */
  #define XFS_MIN_IO_LOG          PAGE_SHIFT

  /*
   * Synchronous read and write sizes.  This should be
   * better for NFSv2 wsync filesystems.
   */
  #define XFS_WSYNC_READIO_LOG    15  /* 32k */
  #define XFS_WSYNC_WRITEIO_LOG   14  /* 16k */
  236. /*
  237. * Allow large block sizes to be reported to userspace programs if the
  238. * "largeio" mount option is used.
  239. *
  240. * If compatibility mode is specified, simply return the basic unit of caching
  241. * so that we don't get inefficient read/modify/write I/O from user apps.
  242. * Otherwise....
  243. *
  244. * If the underlying volume is a stripe, then return the stripe width in bytes
  245. * as the recommended I/O size. It is not a stripe and we've set a default
  246. * buffered I/O size, return that, otherwise return the compat default.
  247. */
  248. static inline unsigned long
  249. xfs_preferred_iosize(xfs_mount_t *mp)
  250. {
  251. if (mp->m_flags & XFS_MOUNT_COMPAT_IOSIZE)
  252. return PAGE_SIZE;
  253. return (mp->m_swidth ?
  254. (mp->m_swidth << mp->m_sb.sb_blocklog) :
  255. ((mp->m_flags & XFS_MOUNT_DFLT_IOSIZE) ?
  256. (1 << (int)max(mp->m_readio_log, mp->m_writeio_log)) :
  257. PAGE_SIZE));
  258. }
  /*
   * Mount state predicates.  Each yields the masked m_flags bit (non-zero
   * when set), not a normalized 0/1 value.
   */
  #define XFS_LAST_UNMOUNT_WAS_CLEAN(mp) \
      ((mp)->m_flags & XFS_MOUNT_WAS_CLEAN)
  #define XFS_FORCED_SHUTDOWN(mp) \
      ((mp)->m_flags & XFS_MOUNT_FS_SHUTDOWN)
  /*
   * Forced shutdown entry point.  Callers normally use xfs_force_shutdown(),
   * which supplies the caller's __FILE__ and __LINE__ as fname and lnnum.
   */
  void xfs_do_force_shutdown(struct xfs_mount *mp, int flags, char *fname,
                             int lnnum);
  #define xfs_force_shutdown(m, f) \
      xfs_do_force_shutdown((m), (f), __FILE__, __LINE__)

  /* Values passed as the flags argument above. */
  #define SHUTDOWN_META_IO_ERROR  0x0001  /* write attempt to metadata failed */
  #define SHUTDOWN_LOG_IO_ERROR   0x0002  /* write attempt to the log failed */
  #define SHUTDOWN_FORCE_UMOUNT   0x0004  /* shutdown from a forced unmount */
  #define SHUTDOWN_CORRUPT_INCORE 0x0008  /* corrupt in-memory data structures */
  #define SHUTDOWN_REMOTE_REQ     0x0010  /* shutdown came from remote cell */
  #define SHUTDOWN_DEVICE_REQ     0x0020  /* failed all paths to the device */
  /*
   * Flags for xfs_mountfs
   */
  #define XFS_MFSI_QUIET  0x40    /* Be silent if mount errors found */
  276. static inline xfs_agnumber_t
  277. xfs_daddr_to_agno(struct xfs_mount *mp, xfs_daddr_t d)
  278. {
  279. xfs_rfsblock_t ld = XFS_BB_TO_FSBT(mp, d);
  280. do_div(ld, mp->m_sb.sb_agblocks);
  281. return (xfs_agnumber_t) ld;
  282. }
  283. static inline xfs_agblock_t
  284. xfs_daddr_to_agbno(struct xfs_mount *mp, xfs_daddr_t d)
  285. {
  286. xfs_rfsblock_t ld = XFS_BB_TO_FSBT(mp, d);
  287. return (xfs_agblock_t) do_div(ld, mp->m_sb.sb_agblocks);
  288. }
  /*
   * Per-AG block reservation data structures.
   *
   * Reservation types; xfs_perag_resv() maps the METADATA and RMAPBT types
   * to their per-AG reservation structures.
   */
  enum xfs_ag_resv_type {
      XFS_AG_RESV_NONE = 0,
      XFS_AG_RESV_AGFL,
      XFS_AG_RESV_METADATA,
      XFS_AG_RESV_RMAPBT,
  };
  296. struct xfs_ag_resv {
  297. /* number of blocks originally reserved here */
  298. xfs_extlen_t ar_orig_reserved;
  299. /* number of blocks reserved here */
  300. xfs_extlen_t ar_reserved;
  301. /* number of blocks originally asked for */
  302. xfs_extlen_t ar_asked;
  303. };
  304. /*
  305. * Per-ag incore structure, copies of information in agf and agi, to improve the
  306. * performance of allocation group selection.
  307. */
  308. typedef struct xfs_perag {
  309. struct xfs_mount *pag_mount; /* owner filesystem */
  310. xfs_agnumber_t pag_agno; /* AG this structure belongs to */
  311. atomic_t pag_ref; /* perag reference count */
  312. char pagf_init; /* this agf's entry is initialized */
  313. char pagi_init; /* this agi's entry is initialized */
  314. char pagf_metadata; /* the agf is preferred to be metadata */
  315. char pagi_inodeok; /* The agi is ok for inodes */
  316. uint8_t pagf_levels[XFS_BTNUM_AGF];
  317. /* # of levels in bno & cnt btree */
  318. bool pagf_agflreset; /* agfl requires reset before use */
  319. uint32_t pagf_flcount; /* count of blocks in freelist */
  320. xfs_extlen_t pagf_freeblks; /* total free blocks */
  321. xfs_extlen_t pagf_longest; /* longest free space */
  322. uint32_t pagf_btreeblks; /* # of blocks held in AGF btrees */
  323. xfs_agino_t pagi_freecount; /* number of free inodes */
  324. xfs_agino_t pagi_count; /* number of allocated inodes */
  325. /*
  326. * Inode allocation search lookup optimisation.
  327. * If the pagino matches, the search for new inodes
  328. * doesn't need to search the near ones again straight away
  329. */
  330. xfs_agino_t pagl_pagino;
  331. xfs_agino_t pagl_leftrec;
  332. xfs_agino_t pagl_rightrec;
  333. spinlock_t pagb_lock; /* lock for pagb_tree */
  334. struct rb_root pagb_tree; /* ordered tree of busy extents */
  335. unsigned int pagb_gen; /* generation count for pagb_tree */
  336. wait_queue_head_t pagb_wait; /* woken when pagb_gen changes */
  337. atomic_t pagf_fstrms; /* # of filestreams active in this AG */
  338. spinlock_t pag_ici_lock; /* incore inode cache lock */
  339. struct radix_tree_root pag_ici_root; /* incore inode cache root */
  340. int pag_ici_reclaimable; /* reclaimable inodes */
  341. struct mutex pag_ici_reclaim_lock; /* serialisation point */
  342. unsigned long pag_ici_reclaim_cursor; /* reclaim restart point */
  343. /* buffer cache index */
  344. spinlock_t pag_buf_lock; /* lock for pag_buf_hash */
  345. struct rhashtable pag_buf_hash;
  346. /* for rcu-safe freeing */
  347. struct rcu_head rcu_head;
  348. int pagb_count; /* pagb slots in use */
  349. /* Blocks reserved for all kinds of metadata. */
  350. struct xfs_ag_resv pag_meta_resv;
  351. /* Blocks reserved for the reverse mapping btree. */
  352. struct xfs_ag_resv pag_rmapbt_resv;
  353. /* reference count */
  354. uint8_t pagf_refcount_level;
  355. } xfs_perag_t;
  356. static inline struct xfs_ag_resv *
  357. xfs_perag_resv(
  358. struct xfs_perag *pag,
  359. enum xfs_ag_resv_type type)
  360. {
  361. switch (type) {
  362. case XFS_AG_RESV_METADATA:
  363. return &pag->pag_meta_resv;
  364. case XFS_AG_RESV_RMAPBT:
  365. return &pag->pag_rmapbt_resv;
  366. default:
  367. return NULL;
  368. }
  369. }
  370. int xfs_buf_hash_init(xfs_perag_t *pag);
  371. void xfs_buf_hash_destroy(xfs_perag_t *pag);
  372. extern void xfs_uuid_table_free(void);
  373. extern int xfs_log_sbcount(xfs_mount_t *);
  374. extern uint64_t xfs_default_resblks(xfs_mount_t *mp);
  375. extern int xfs_mountfs(xfs_mount_t *mp);
  376. extern int xfs_initialize_perag(xfs_mount_t *mp, xfs_agnumber_t agcount,
  377. xfs_agnumber_t *maxagi);
  378. extern void xfs_unmountfs(xfs_mount_t *);
  379. extern int xfs_mod_icount(struct xfs_mount *mp, int64_t delta);
  380. extern int xfs_mod_ifree(struct xfs_mount *mp, int64_t delta);
  381. extern int xfs_mod_fdblocks(struct xfs_mount *mp, int64_t delta,
  382. bool reserved);
  383. extern int xfs_mod_frextents(struct xfs_mount *mp, int64_t delta);
  384. extern struct xfs_buf *xfs_getsb(xfs_mount_t *, int);
  385. extern int xfs_readsb(xfs_mount_t *, int);
  386. extern void xfs_freesb(xfs_mount_t *);
  387. extern bool xfs_fs_writable(struct xfs_mount *mp, int level);
  388. extern int xfs_sb_validate_fsb_count(struct xfs_sb *, uint64_t);
  389. extern int xfs_dev_is_read_only(struct xfs_mount *, char *);
  390. extern void xfs_set_low_space_thresholds(struct xfs_mount *);
  391. int xfs_zero_extent(struct xfs_inode *ip, xfs_fsblock_t start_fsb,
  392. xfs_off_t count_fsb);
  393. struct xfs_error_cfg * xfs_error_get_cfg(struct xfs_mount *mp,
  394. int error_class, int error);
  395. void xfs_force_summary_recalc(struct xfs_mount *mp);
  396. #endif /* __XFS_MOUNT_H__ */