xfs_log_rlimit.c 7.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (c) 2013 Jie Liu.
  4. * All Rights Reserved.
  5. */
  6. #include "xfs.h"
  7. #include "xfs_fs.h"
  8. #include "xfs_shared.h"
  9. #include "xfs_format.h"
  10. #include "xfs_log_format.h"
  11. #include "xfs_trans_resv.h"
  12. #include "xfs_mount.h"
  13. #include "xfs_da_format.h"
  14. #include "xfs_trans_space.h"
  15. #include "xfs_da_btree.h"
  16. #include "xfs_bmap_btree.h"
  17. #include "xfs_trace.h"
  18. /*
  19. * Shortly after enabling the large extents count feature in 2023, longstanding
  20. * bugs were found in the code that computes the minimum log size. Luckily,
  21. * the bugs resulted in over-estimates of that size, so there's no impact to
  22. * existing users. However, we don't want to reduce the minimum log size
  23. * because that can create the situation where a newer mkfs writes a new
  24. * filesystem that an older kernel won't mount.
  25. *
  26. * Several years prior, we also discovered that the transaction reservations
  27. * for rmap and reflink operations were unnecessarily large. That was fixed,
  28. * but the minimum log size computation was left alone to avoid the
  29. * compatibility problems noted above. Fix that too.
  30. *
  31. * Therefore, we only may correct the computation starting with filesystem
  32. * features that didn't exist in 2023. In other words, only turn this on if
  33. * the filesystem has parent pointers.
  34. *
  35. * This function can be called before the XFS_HAS_* flags have been set up,
  36. * (e.g. mkfs) so we must check the ondisk superblock.
  37. */
  38. static inline bool
  39. xfs_want_minlogsize_fixes(
  40. struct xfs_sb *sb)
  41. {
  42. return xfs_sb_is_v5(sb) &&
  43. xfs_sb_has_incompat_feature(sb, XFS_SB_FEAT_INCOMPAT_PARENT);
  44. }
  45. /*
  46. * Calculate the maximum length in bytes that would be required for a local
  47. * attribute value as large attributes out of line are not logged.
  48. */
  49. STATIC int
  50. xfs_log_calc_max_attrsetm_res(
  51. struct xfs_mount *mp)
  52. {
  53. int size;
  54. int nblks;
  55. size = xfs_attr_leaf_entsize_local_max(mp->m_attr_geo->blksize) -
  56. MAXNAMELEN - 1;
  57. nblks = XFS_DAENTER_SPACE_RES(mp, XFS_ATTR_FORK);
  58. nblks += XFS_B_TO_FSB(mp, size);
  59. /*
  60. * If the feature set is new enough, correct a unit conversion error in
  61. * the xattr transaction reservation code that resulted in oversized
  62. * minimum log size computations.
  63. */
  64. if (xfs_want_minlogsize_fixes(&mp->m_sb))
  65. size = XFS_B_TO_FSB(mp, size);
  66. nblks += XFS_NEXTENTADD_SPACE_RES(mp, size, XFS_ATTR_FORK);
  67. return M_RES(mp)->tr_attrsetm.tr_logres +
  68. M_RES(mp)->tr_attrsetrt.tr_logres * nblks;
  69. }
  70. /*
  71. * Compute an alternate set of log reservation sizes for use exclusively with
  72. * minimum log size calculations.
  73. */
  74. static void
  75. xfs_log_calc_trans_resv_for_minlogblocks(
  76. struct xfs_mount *mp,
  77. struct xfs_trans_resv *resv)
  78. {
  79. unsigned int rmap_maxlevels = mp->m_rmap_maxlevels;
  80. /*
  81. * If the feature set is new enough, drop the oversized minimum log
  82. * size computation introduced by the original reflink code.
  83. */
  84. if (xfs_want_minlogsize_fixes(&mp->m_sb)) {
  85. xfs_trans_resv_calc(mp, resv);
  86. return;
  87. }
  88. /*
  89. * In the early days of rmap+reflink, we always set the rmap maxlevels
  90. * to 9 even if the AG was small enough that it would never grow to
  91. * that height. Transaction reservation sizes influence the minimum
  92. * log size calculation, which influences the size of the log that mkfs
  93. * creates. Use the old value here to ensure that newly formatted
  94. * small filesystems will mount on older kernels.
  95. */
  96. if (xfs_has_rmapbt(mp) && xfs_has_reflink(mp))
  97. mp->m_rmap_maxlevels = XFS_OLD_REFLINK_RMAP_MAXLEVELS;
  98. xfs_trans_resv_calc(mp, resv);
  99. if (xfs_has_reflink(mp)) {
  100. /*
  101. * In the early days of reflink, typical log operation counts
  102. * were greatly overestimated.
  103. */
  104. resv->tr_write.tr_logcount = XFS_WRITE_LOG_COUNT_REFLINK;
  105. resv->tr_itruncate.tr_logcount =
  106. XFS_ITRUNCATE_LOG_COUNT_REFLINK;
  107. resv->tr_qm_dqalloc.tr_logcount = XFS_WRITE_LOG_COUNT_REFLINK;
  108. } else if (xfs_has_rmapbt(mp)) {
  109. /*
  110. * In the early days of non-reflink rmap, the impact of rmapbt
  111. * updates on log counts were not taken into account at all.
  112. */
  113. resv->tr_write.tr_logcount = XFS_WRITE_LOG_COUNT;
  114. resv->tr_itruncate.tr_logcount = XFS_ITRUNCATE_LOG_COUNT;
  115. resv->tr_qm_dqalloc.tr_logcount = XFS_WRITE_LOG_COUNT;
  116. }
  117. /*
  118. * In the early days of reflink, we did not use deferred refcount
  119. * update log items, so log reservations must be recomputed using the
  120. * old calculations.
  121. */
  122. resv->tr_write.tr_logres =
  123. xfs_calc_write_reservation_minlogsize(mp);
  124. resv->tr_itruncate.tr_logres =
  125. xfs_calc_itruncate_reservation_minlogsize(mp);
  126. resv->tr_qm_dqalloc.tr_logres =
  127. xfs_calc_qm_dqalloc_reservation_minlogsize(mp);
  128. /* Put everything back the way it was. This goes at the end. */
  129. mp->m_rmap_maxlevels = rmap_maxlevels;
  130. }
  131. /*
  132. * Iterate over the log space reservation table to figure out and return
  133. * the maximum one in terms of the pre-calculated values which were done
  134. * at mount time.
  135. */
  136. void
  137. xfs_log_get_max_trans_res(
  138. struct xfs_mount *mp,
  139. struct xfs_trans_res *max_resp)
  140. {
  141. struct xfs_trans_resv resv = {};
  142. struct xfs_trans_res *resp;
  143. struct xfs_trans_res *end_resp;
  144. unsigned int i;
  145. int log_space = 0;
  146. int attr_space;
  147. attr_space = xfs_log_calc_max_attrsetm_res(mp);
  148. xfs_log_calc_trans_resv_for_minlogblocks(mp, &resv);
  149. resp = (struct xfs_trans_res *)&resv;
  150. end_resp = (struct xfs_trans_res *)(&resv + 1);
  151. for (i = 0; resp < end_resp; i++, resp++) {
  152. int tmp = resp->tr_logcount > 1 ?
  153. resp->tr_logres * resp->tr_logcount :
  154. resp->tr_logres;
  155. trace_xfs_trans_resv_calc_minlogsize(mp, i, resp);
  156. if (log_space < tmp) {
  157. log_space = tmp;
  158. *max_resp = *resp; /* struct copy */
  159. }
  160. }
  161. if (attr_space > log_space) {
  162. *max_resp = resv.tr_attrsetm; /* struct copy */
  163. max_resp->tr_logres = attr_space;
  164. }
  165. trace_xfs_log_get_max_trans_res(mp, max_resp);
  166. }
  167. /*
  168. * Calculate the minimum valid log size for the given superblock configuration.
  169. * Used to calculate the minimum log size at mkfs time, and to determine if
  170. * the log is large enough or not at mount time. Returns the minimum size in
  171. * filesystem block size units.
  172. */
  173. int
  174. xfs_log_calc_minimum_size(
  175. struct xfs_mount *mp)
  176. {
  177. struct xfs_trans_res tres = {0};
  178. int max_logres;
  179. int min_logblks = 0;
  180. int lsunit = 0;
  181. xfs_log_get_max_trans_res(mp, &tres);
  182. max_logres = xfs_log_calc_unit_res(mp, tres.tr_logres);
  183. if (tres.tr_logcount > 1)
  184. max_logres *= tres.tr_logcount;
  185. if (xfs_has_logv2(mp) && mp->m_sb.sb_logsunit > 1)
  186. lsunit = BTOBB(mp->m_sb.sb_logsunit);
  187. /*
  188. * Two factors should be taken into account for calculating the minimum
  189. * log space.
  190. * 1) The fundamental limitation is that no single transaction can be
  191. * larger than half size of the log.
  192. *
  193. * From mkfs.xfs, this is considered by the XFS_MIN_LOG_FACTOR
  194. * define, which is set to 3. That means we can definitely fit
  195. * maximally sized 2 transactions in the log. We'll use this same
  196. * value here.
  197. *
  198. * 2) If the lsunit option is specified, a transaction requires 2 LSU
  199. * for the reservation because there are two log writes that can
  200. * require padding - the transaction data and the commit record which
  201. * are written separately and both can require padding to the LSU.
  202. * Consider that we can have an active CIL reservation holding 2*LSU,
  203. * but the CIL is not over a push threshold, in this case, if we
  204. * don't have enough log space for at one new transaction, which
  205. * includes another 2*LSU in the reservation, we will run into dead
  206. * loop situation in log space grant procedure. i.e.
  207. * xlog_grant_head_wait().
  208. *
  209. * Hence the log size needs to be able to contain two maximally sized
  210. * and padded transactions, which is (2 * (2 * LSU + maxlres)).
  211. *
  212. * Also, the log size should be a multiple of the log stripe unit, round
  213. * it up to lsunit boundary if lsunit is specified.
  214. */
  215. if (lsunit) {
  216. min_logblks = roundup_64(BTOBB(max_logres), lsunit) +
  217. 2 * lsunit;
  218. } else
  219. min_logblks = BTOBB(max_logres) + 2 * BBSIZE;
  220. min_logblks *= XFS_MIN_LOG_FACTOR;
  221. return XFS_BB_TO_FSB(mp, min_logblks);
  222. }