Loading...
// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (c) 2013 Jie Liu.
 * All Rights Reserved.
 */
6#include "xfs.h"
7#include "xfs_fs.h"
8#include "xfs_shared.h"
9#include "xfs_format.h"
10#include "xfs_log_format.h"
11#include "xfs_trans_resv.h"
12#include "xfs_mount.h"
13#include "xfs_da_format.h"
14#include "xfs_trans_space.h"
15#include "xfs_da_btree.h"
16#include "xfs_bmap_btree.h"
17#include "xfs_trace.h"
18
19/*
20 * Calculate the maximum length in bytes that would be required for a local
21 * attribute value as large attributes out of line are not logged.
22 */
23STATIC int
24xfs_log_calc_max_attrsetm_res(
25 struct xfs_mount *mp)
26{
27 int size;
28 int nblks;
29
30 size = xfs_attr_leaf_entsize_local_max(mp->m_attr_geo->blksize) -
31 MAXNAMELEN - 1;
32 nblks = XFS_DAENTER_SPACE_RES(mp, XFS_ATTR_FORK);
33 nblks += XFS_B_TO_FSB(mp, size);
34 nblks += XFS_NEXTENTADD_SPACE_RES(mp, size, XFS_ATTR_FORK);
35
36 return M_RES(mp)->tr_attrsetm.tr_logres +
37 M_RES(mp)->tr_attrsetrt.tr_logres * nblks;
38}
39
40/*
41 * Compute an alternate set of log reservation sizes for use exclusively with
42 * minimum log size calculations.
43 */
44static void
45xfs_log_calc_trans_resv_for_minlogblocks(
46 struct xfs_mount *mp,
47 struct xfs_trans_resv *resv)
48{
49 unsigned int rmap_maxlevels = mp->m_rmap_maxlevels;
50
51 /*
52 * In the early days of rmap+reflink, we always set the rmap maxlevels
53 * to 9 even if the AG was small enough that it would never grow to
54 * that height. Transaction reservation sizes influence the minimum
55 * log size calculation, which influences the size of the log that mkfs
56 * creates. Use the old value here to ensure that newly formatted
57 * small filesystems will mount on older kernels.
58 */
59 if (xfs_has_rmapbt(mp) && xfs_has_reflink(mp))
60 mp->m_rmap_maxlevels = XFS_OLD_REFLINK_RMAP_MAXLEVELS;
61
62 xfs_trans_resv_calc(mp, resv);
63
64 if (xfs_has_reflink(mp)) {
65 /*
66 * In the early days of reflink, typical log operation counts
67 * were greatly overestimated.
68 */
69 resv->tr_write.tr_logcount = XFS_WRITE_LOG_COUNT_REFLINK;
70 resv->tr_itruncate.tr_logcount =
71 XFS_ITRUNCATE_LOG_COUNT_REFLINK;
72 resv->tr_qm_dqalloc.tr_logcount = XFS_WRITE_LOG_COUNT_REFLINK;
73 } else if (xfs_has_rmapbt(mp)) {
74 /*
75 * In the early days of non-reflink rmap, the impact of rmapbt
76 * updates on log counts were not taken into account at all.
77 */
78 resv->tr_write.tr_logcount = XFS_WRITE_LOG_COUNT;
79 resv->tr_itruncate.tr_logcount = XFS_ITRUNCATE_LOG_COUNT;
80 resv->tr_qm_dqalloc.tr_logcount = XFS_WRITE_LOG_COUNT;
81 }
82
83 /*
84 * In the early days of reflink, we did not use deferred refcount
85 * update log items, so log reservations must be recomputed using the
86 * old calculations.
87 */
88 resv->tr_write.tr_logres =
89 xfs_calc_write_reservation_minlogsize(mp);
90 resv->tr_itruncate.tr_logres =
91 xfs_calc_itruncate_reservation_minlogsize(mp);
92 resv->tr_qm_dqalloc.tr_logres =
93 xfs_calc_qm_dqalloc_reservation_minlogsize(mp);
94
95 /* Put everything back the way it was. This goes at the end. */
96 mp->m_rmap_maxlevels = rmap_maxlevels;
97}
98
99/*
100 * Iterate over the log space reservation table to figure out and return
101 * the maximum one in terms of the pre-calculated values which were done
102 * at mount time.
103 */
104void
105xfs_log_get_max_trans_res(
106 struct xfs_mount *mp,
107 struct xfs_trans_res *max_resp)
108{
109 struct xfs_trans_resv resv = {};
110 struct xfs_trans_res *resp;
111 struct xfs_trans_res *end_resp;
112 unsigned int i;
113 int log_space = 0;
114 int attr_space;
115
116 attr_space = xfs_log_calc_max_attrsetm_res(mp);
117
118 xfs_log_calc_trans_resv_for_minlogblocks(mp, &resv);
119
120 resp = (struct xfs_trans_res *)&resv;
121 end_resp = (struct xfs_trans_res *)(&resv + 1);
122 for (i = 0; resp < end_resp; i++, resp++) {
123 int tmp = resp->tr_logcount > 1 ?
124 resp->tr_logres * resp->tr_logcount :
125 resp->tr_logres;
126
127 trace_xfs_trans_resv_calc_minlogsize(mp, i, resp);
128 if (log_space < tmp) {
129 log_space = tmp;
130 *max_resp = *resp; /* struct copy */
131 }
132 }
133
134 if (attr_space > log_space) {
135 *max_resp = resv.tr_attrsetm; /* struct copy */
136 max_resp->tr_logres = attr_space;
137 }
138 trace_xfs_log_get_max_trans_res(mp, max_resp);
139}
140
141/*
142 * Calculate the minimum valid log size for the given superblock configuration.
143 * Used to calculate the minimum log size at mkfs time, and to determine if
144 * the log is large enough or not at mount time. Returns the minimum size in
145 * filesystem block size units.
146 */
147int
148xfs_log_calc_minimum_size(
149 struct xfs_mount *mp)
150{
151 struct xfs_trans_res tres = {0};
152 int max_logres;
153 int min_logblks = 0;
154 int lsunit = 0;
155
156 xfs_log_get_max_trans_res(mp, &tres);
157
158 max_logres = xfs_log_calc_unit_res(mp, tres.tr_logres);
159 if (tres.tr_logcount > 1)
160 max_logres *= tres.tr_logcount;
161
162 if (xfs_has_logv2(mp) && mp->m_sb.sb_logsunit > 1)
163 lsunit = BTOBB(mp->m_sb.sb_logsunit);
164
165 /*
166 * Two factors should be taken into account for calculating the minimum
167 * log space.
168 * 1) The fundamental limitation is that no single transaction can be
169 * larger than half size of the log.
170 *
171 * From mkfs.xfs, this is considered by the XFS_MIN_LOG_FACTOR
172 * define, which is set to 3. That means we can definitely fit
173 * maximally sized 2 transactions in the log. We'll use this same
174 * value here.
175 *
176 * 2) If the lsunit option is specified, a transaction requires 2 LSU
177 * for the reservation because there are two log writes that can
178 * require padding - the transaction data and the commit record which
179 * are written separately and both can require padding to the LSU.
180 * Consider that we can have an active CIL reservation holding 2*LSU,
181 * but the CIL is not over a push threshold, in this case, if we
182 * don't have enough log space for at one new transaction, which
183 * includes another 2*LSU in the reservation, we will run into dead
184 * loop situation in log space grant procedure. i.e.
185 * xlog_grant_head_wait().
186 *
187 * Hence the log size needs to be able to contain two maximally sized
188 * and padded transactions, which is (2 * (2 * LSU + maxlres)).
189 *
190 * Also, the log size should be a multiple of the log stripe unit, round
191 * it up to lsunit boundary if lsunit is specified.
192 */
193 if (lsunit) {
194 min_logblks = roundup_64(BTOBB(max_logres), lsunit) +
195 2 * lsunit;
196 } else
197 min_logblks = BTOBB(max_logres) + 2 * BBSIZE;
198 min_logblks *= XFS_MIN_LOG_FACTOR;
199
200 return XFS_BB_TO_FSB(mp, min_logblks);
201}
// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (c) 2013 Jie Liu.
 * All Rights Reserved.
 */
6#include "xfs.h"
7#include "xfs_fs.h"
8#include "xfs_shared.h"
9#include "xfs_format.h"
10#include "xfs_log_format.h"
11#include "xfs_trans_resv.h"
12#include "xfs_mount.h"
13#include "xfs_da_format.h"
14#include "xfs_trans_space.h"
15#include "xfs_da_btree.h"
16#include "xfs_bmap_btree.h"
17#include "xfs_trace.h"
18
19/*
20 * Shortly after enabling the large extents count feature in 2023, longstanding
21 * bugs were found in the code that computes the minimum log size. Luckily,
22 * the bugs resulted in over-estimates of that size, so there's no impact to
23 * existing users. However, we don't want to reduce the minimum log size
24 * because that can create the situation where a newer mkfs writes a new
25 * filesystem that an older kernel won't mount.
26 *
27 * Several years prior, we also discovered that the transaction reservations
28 * for rmap and reflink operations were unnecessarily large. That was fixed,
29 * but the minimum log size computation was left alone to avoid the
30 * compatibility problems noted above. Fix that too.
31 *
32 * Therefore, we only may correct the computation starting with filesystem
33 * features that didn't exist in 2023. In other words, only turn this on if
34 * the filesystem has parent pointers.
35 *
36 * This function can be called before the XFS_HAS_* flags have been set up,
37 * (e.g. mkfs) so we must check the ondisk superblock.
38 */
39static inline bool
40xfs_want_minlogsize_fixes(
41 struct xfs_sb *sb)
42{
43 return xfs_sb_is_v5(sb) &&
44 xfs_sb_has_incompat_feature(sb, XFS_SB_FEAT_INCOMPAT_PARENT);
45}
46
47/*
48 * Calculate the maximum length in bytes that would be required for a local
49 * attribute value as large attributes out of line are not logged.
50 */
51STATIC int
52xfs_log_calc_max_attrsetm_res(
53 struct xfs_mount *mp)
54{
55 int size;
56 int nblks;
57
58 size = xfs_attr_leaf_entsize_local_max(mp->m_attr_geo->blksize) -
59 MAXNAMELEN - 1;
60 nblks = XFS_DAENTER_SPACE_RES(mp, XFS_ATTR_FORK);
61 nblks += XFS_B_TO_FSB(mp, size);
62
63 /*
64 * If the feature set is new enough, correct a unit conversion error in
65 * the xattr transaction reservation code that resulted in oversized
66 * minimum log size computations.
67 */
68 if (xfs_want_minlogsize_fixes(&mp->m_sb))
69 size = XFS_B_TO_FSB(mp, size);
70
71 nblks += XFS_NEXTENTADD_SPACE_RES(mp, size, XFS_ATTR_FORK);
72
73 return M_RES(mp)->tr_attrsetm.tr_logres +
74 M_RES(mp)->tr_attrsetrt.tr_logres * nblks;
75}
76
77/*
78 * Compute an alternate set of log reservation sizes for use exclusively with
79 * minimum log size calculations.
80 */
81static void
82xfs_log_calc_trans_resv_for_minlogblocks(
83 struct xfs_mount *mp,
84 struct xfs_trans_resv *resv)
85{
86 unsigned int rmap_maxlevels = mp->m_rmap_maxlevels;
87
88 /*
89 * If the feature set is new enough, drop the oversized minimum log
90 * size computation introduced by the original reflink code.
91 */
92 if (xfs_want_minlogsize_fixes(&mp->m_sb)) {
93 xfs_trans_resv_calc(mp, resv);
94 return;
95 }
96
97 /*
98 * In the early days of rmap+reflink, we always set the rmap maxlevels
99 * to 9 even if the AG was small enough that it would never grow to
100 * that height. Transaction reservation sizes influence the minimum
101 * log size calculation, which influences the size of the log that mkfs
102 * creates. Use the old value here to ensure that newly formatted
103 * small filesystems will mount on older kernels.
104 */
105 if (xfs_has_rmapbt(mp) && xfs_has_reflink(mp))
106 mp->m_rmap_maxlevels = XFS_OLD_REFLINK_RMAP_MAXLEVELS;
107
108 xfs_trans_resv_calc(mp, resv);
109
110 if (xfs_has_reflink(mp)) {
111 /*
112 * In the early days of reflink, typical log operation counts
113 * were greatly overestimated.
114 */
115 resv->tr_write.tr_logcount = XFS_WRITE_LOG_COUNT_REFLINK;
116 resv->tr_itruncate.tr_logcount =
117 XFS_ITRUNCATE_LOG_COUNT_REFLINK;
118 resv->tr_qm_dqalloc.tr_logcount = XFS_WRITE_LOG_COUNT_REFLINK;
119 } else if (xfs_has_rmapbt(mp)) {
120 /*
121 * In the early days of non-reflink rmap, the impact of rmapbt
122 * updates on log counts were not taken into account at all.
123 */
124 resv->tr_write.tr_logcount = XFS_WRITE_LOG_COUNT;
125 resv->tr_itruncate.tr_logcount = XFS_ITRUNCATE_LOG_COUNT;
126 resv->tr_qm_dqalloc.tr_logcount = XFS_WRITE_LOG_COUNT;
127 }
128
129 /*
130 * In the early days of reflink, we did not use deferred refcount
131 * update log items, so log reservations must be recomputed using the
132 * old calculations.
133 */
134 resv->tr_write.tr_logres =
135 xfs_calc_write_reservation_minlogsize(mp);
136 resv->tr_itruncate.tr_logres =
137 xfs_calc_itruncate_reservation_minlogsize(mp);
138 resv->tr_qm_dqalloc.tr_logres =
139 xfs_calc_qm_dqalloc_reservation_minlogsize(mp);
140
141 /* Put everything back the way it was. This goes at the end. */
142 mp->m_rmap_maxlevels = rmap_maxlevels;
143}
144
145/*
146 * Iterate over the log space reservation table to figure out and return
147 * the maximum one in terms of the pre-calculated values which were done
148 * at mount time.
149 */
150void
151xfs_log_get_max_trans_res(
152 struct xfs_mount *mp,
153 struct xfs_trans_res *max_resp)
154{
155 struct xfs_trans_resv resv = {};
156 struct xfs_trans_res *resp;
157 struct xfs_trans_res *end_resp;
158 unsigned int i;
159 int log_space = 0;
160 int attr_space;
161
162 attr_space = xfs_log_calc_max_attrsetm_res(mp);
163
164 xfs_log_calc_trans_resv_for_minlogblocks(mp, &resv);
165
166 resp = (struct xfs_trans_res *)&resv;
167 end_resp = (struct xfs_trans_res *)(&resv + 1);
168 for (i = 0; resp < end_resp; i++, resp++) {
169 int tmp = resp->tr_logcount > 1 ?
170 resp->tr_logres * resp->tr_logcount :
171 resp->tr_logres;
172
173 trace_xfs_trans_resv_calc_minlogsize(mp, i, resp);
174 if (log_space < tmp) {
175 log_space = tmp;
176 *max_resp = *resp; /* struct copy */
177 }
178 }
179
180 if (attr_space > log_space) {
181 *max_resp = resv.tr_attrsetm; /* struct copy */
182 max_resp->tr_logres = attr_space;
183 }
184 trace_xfs_log_get_max_trans_res(mp, max_resp);
185}
186
187/*
188 * Calculate the minimum valid log size for the given superblock configuration.
189 * Used to calculate the minimum log size at mkfs time, and to determine if
190 * the log is large enough or not at mount time. Returns the minimum size in
191 * filesystem block size units.
192 */
193int
194xfs_log_calc_minimum_size(
195 struct xfs_mount *mp)
196{
197 struct xfs_trans_res tres = {0};
198 int max_logres;
199 int min_logblks = 0;
200 int lsunit = 0;
201
202 xfs_log_get_max_trans_res(mp, &tres);
203
204 max_logres = xfs_log_calc_unit_res(mp, tres.tr_logres);
205 if (tres.tr_logcount > 1)
206 max_logres *= tres.tr_logcount;
207
208 if (xfs_has_logv2(mp) && mp->m_sb.sb_logsunit > 1)
209 lsunit = BTOBB(mp->m_sb.sb_logsunit);
210
211 /*
212 * Two factors should be taken into account for calculating the minimum
213 * log space.
214 * 1) The fundamental limitation is that no single transaction can be
215 * larger than half size of the log.
216 *
217 * From mkfs.xfs, this is considered by the XFS_MIN_LOG_FACTOR
218 * define, which is set to 3. That means we can definitely fit
219 * maximally sized 2 transactions in the log. We'll use this same
220 * value here.
221 *
222 * 2) If the lsunit option is specified, a transaction requires 2 LSU
223 * for the reservation because there are two log writes that can
224 * require padding - the transaction data and the commit record which
225 * are written separately and both can require padding to the LSU.
226 * Consider that we can have an active CIL reservation holding 2*LSU,
227 * but the CIL is not over a push threshold, in this case, if we
228 * don't have enough log space for at one new transaction, which
229 * includes another 2*LSU in the reservation, we will run into dead
230 * loop situation in log space grant procedure. i.e.
231 * xlog_grant_head_wait().
232 *
233 * Hence the log size needs to be able to contain two maximally sized
234 * and padded transactions, which is (2 * (2 * LSU + maxlres)).
235 *
236 * Also, the log size should be a multiple of the log stripe unit, round
237 * it up to lsunit boundary if lsunit is specified.
238 */
239 if (lsunit) {
240 min_logblks = roundup_64(BTOBB(max_logres), lsunit) +
241 2 * lsunit;
242 } else
243 min_logblks = BTOBB(max_logres) + 2 * BBSIZE;
244 min_logblks *= XFS_MIN_LOG_FACTOR;
245
246 return XFS_BB_TO_FSB(mp, min_logblks);
247}