blob: a2e1df488df04a305d2a8eca84327a2461e158bf [file] [log] [blame]
David Teiglandb3b94fa2006-01-16 16:50:04 +00001/*
2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
Bob Petersonda6dd402007-12-11 18:49:21 -06003 * Copyright (C) 2004-2007 Red Hat, Inc. All rights reserved.
David Teiglandb3b94fa2006-01-16 16:50:04 +00004 *
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
Steven Whitehousee9fc2aa2006-09-01 11:05:15 -04007 * of the GNU General Public License version 2.
David Teiglandb3b94fa2006-01-16 16:50:04 +00008 */
9
10#include <linux/sched.h>
11#include <linux/slab.h>
12#include <linux/spinlock.h>
13#include <linux/completion.h>
14#include <linux/buffer_head.h>
Steven Whitehouse5c676f62006-02-27 17:23:27 -050015#include <linux/gfs2_ondisk.h>
Steven Whitehouse71b86f52006-03-28 14:14:04 -050016#include <linux/crc32.h>
Bob Petersonc1696fb2018-01-17 00:01:33 +010017#include <linux/crc32c.h>
Steven Whitehousea25311c2006-11-23 11:06:35 -050018#include <linux/delay.h>
Steven Whitehouseec69b182007-11-09 10:01:41 +000019#include <linux/kthread.h>
20#include <linux/freezer.h>
Steven Whitehouse254db572008-09-26 10:23:22 +010021#include <linux/bio.h>
Steven Whitehouse885bcec2014-02-03 09:57:29 +000022#include <linux/blkdev.h>
Steven Whitehouse4667a0e2011-04-18 14:18:09 +010023#include <linux/writeback.h>
Bob Peterson4a36d082012-02-14 14:49:57 -050024#include <linux/list_sort.h>
David Teiglandb3b94fa2006-01-16 16:50:04 +000025
26#include "gfs2.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050027#include "incore.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000028#include "bmap.h"
29#include "glock.h"
30#include "log.h"
31#include "lops.h"
32#include "meta_io.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050033#include "util.h"
Steven Whitehouse71b86f52006-03-28 14:14:04 -050034#include "dir.h"
Steven Whitehouse63997772009-06-12 08:49:20 +010035#include "trace_gfs2.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000036
David Teiglandb3b94fa2006-01-16 16:50:04 +000037/**
38 * gfs2_struct2blk - compute stuff
39 * @sdp: the filesystem
40 * @nstruct: the number of structures
41 * @ssize: the size of the structures
42 *
43 * Compute the number of log descriptor blocks needed to hold a certain number
44 * of structures of a certain size.
45 *
46 * Returns: the number of blocks needed (minimum is always 1)
47 */
48
49unsigned int gfs2_struct2blk(struct gfs2_sbd *sdp, unsigned int nstruct,
50 unsigned int ssize)
51{
52 unsigned int blks;
53 unsigned int first, second;
54
55 blks = 1;
Steven Whitehousefaa31ce2006-09-13 11:13:27 -040056 first = (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_log_descriptor)) / ssize;
David Teiglandb3b94fa2006-01-16 16:50:04 +000057
58 if (nstruct > first) {
Steven Whitehouse568f4c92006-02-27 12:00:42 -050059 second = (sdp->sd_sb.sb_bsize -
60 sizeof(struct gfs2_meta_header)) / ssize;
Steven Whitehouse5c676f62006-02-27 17:23:27 -050061 blks += DIV_ROUND_UP(nstruct - first, second);
David Teiglandb3b94fa2006-01-16 16:50:04 +000062 }
63
64 return blks;
65}
66
Steven Whitehouseddacfaf2006-10-03 11:10:41 -040067/**
Steven Whitehouse1e1a3d02007-08-27 09:45:26 +010068 * gfs2_remove_from_ail - Remove an entry from the ail lists, updating counters
69 * @mapping: The associated mapping (maybe NULL)
70 * @bd: The gfs2_bufdata to remove
71 *
Steven Whitehousec618e872011-03-14 12:40:29 +000072 * The ail lock _must_ be held when calling this function
Steven Whitehouse1e1a3d02007-08-27 09:45:26 +010073 *
74 */
75
Bob Peterson9bc980c2018-03-02 06:59:44 -070076static void gfs2_remove_from_ail(struct gfs2_bufdata *bd)
Steven Whitehouse1e1a3d02007-08-27 09:45:26 +010077{
Benjamin Marzinski16ca9412013-04-05 20:31:46 -050078 bd->bd_tr = NULL;
Steven Whitehouse1ad38c42007-09-03 11:01:33 +010079 list_del_init(&bd->bd_ail_st_list);
80 list_del_init(&bd->bd_ail_gl_list);
Steven Whitehouse1e1a3d02007-08-27 09:45:26 +010081 atomic_dec(&bd->bd_gl->gl_ail_count);
Steven Whitehouse1e1a3d02007-08-27 09:45:26 +010082 brelse(bd->bd_bh);
83}
84
85/**
 * gfs2_ail1_start_one - Start I/O on a part of the AIL
 * @sdp: the filesystem
 * @wbc: The writeback control structure
 * @tr: the transaction whose tr_ail1_list is scanned
 * @withdraw: set to true when a non-busy buffer is found not uptodate and
 *            SDF_AIL1_IO_ERROR was not already set; never cleared here
 *
 * Must be entered with sd_ail_lock held. The lock is dropped and re-taken
 * around the call to generic_writepages(), so the list may have changed by
 * the time this function returns 1.
 *
 * Returns: 1 if writeback was issued (lock dropped) and @wbc still has
 *          nr_to_write budget left, 0 otherwise
 */
92
Steven Whitehouse4f1de012011-04-26 10:23:56 +010093static int gfs2_ail1_start_one(struct gfs2_sbd *sdp,
94 struct writeback_control *wbc,
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +010095 struct gfs2_trans *tr,
96 bool *withdraw)
Dave Chinnerd6a079e2011-03-11 11:52:25 +000097__releases(&sdp->sd_ail_lock)
98__acquires(&sdp->sd_ail_lock)
Steven Whitehouseddacfaf2006-10-03 11:10:41 -040099{
Steven Whitehouse5ac048b2011-03-30 16:25:51 +0100100 struct gfs2_glock *gl = NULL;
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100101 struct address_space *mapping;
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400102 struct gfs2_bufdata *bd, *s;
103 struct buffer_head *bh;
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400104
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500105 list_for_each_entry_safe_reverse(bd, s, &tr->tr_ail1_list, bd_ail_st_list) {
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100106 bh = bd->bd_bh;
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400107
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500108 gfs2_assert(sdp, bd->bd_tr == tr);
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400109
 /*
  * Buffer is not busy: report an I/O error once per filesystem (guarded
  * by SDF_AIL1_IO_ERROR) if it is not uptodate, then move it to this
  * transaction's ail2 list.
  */
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100110 if (!buffer_busy(bh)) {
Bob Petersonb524abc2018-10-04 10:21:07 -0500111 if (!buffer_uptodate(bh) &&
112 !test_and_set_bit(SDF_AIL1_IO_ERROR,
113 &sdp->sd_flags)) {
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100114 gfs2_io_error_bh(sdp, bh);
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100115 *withdraw = true;
116 }
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500117 list_move(&bd->bd_ail_st_list, &tr->tr_ail2_list);
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100118 continue;
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400119 }
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100120
121 if (!buffer_dirty(bh))
122 continue;
 /* Skip buffers belonging to the glock remembered from the previous dirty buffer */
123 if (gl == bd->bd_gl)
124 continue;
125 gl = bd->bd_gl;
 /* Re-queue at the head of ail1; the scan runs from the tail */
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500126 list_move(&bd->bd_ail_st_list, &tr->tr_ail1_list);
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100127 mapping = bh->b_page->mapping;
Steven Whitehouse4f1de012011-04-26 10:23:56 +0100128 if (!mapping)
129 continue;
 /* Writeback is issued without the spin lock held */
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100130 spin_unlock(&sdp->sd_ail_lock);
131 generic_writepages(mapping, wbc);
132 spin_lock(&sdp->sd_ail_lock);
 /* Budget exhausted: stop and return 0; otherwise tell the caller to rescan */
133 if (wbc->nr_to_write <= 0)
134 break;
Steven Whitehouse4f1de012011-04-26 10:23:56 +0100135 return 1;
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100136 }
Steven Whitehouse4f1de012011-04-26 10:23:56 +0100137
138 return 0;
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100139}
140
141
142/**
143 * gfs2_ail1_flush - start writeback of some ail1 entries
144 * @sdp: The super block
145 * @wbc: The writeback control structure
146 *
147 * Writes back some ail1 entries, according to the limits in the
148 * writeback control structure
149 */
150
151void gfs2_ail1_flush(struct gfs2_sbd *sdp, struct writeback_control *wbc)
152{
153 struct list_head *head = &sdp->sd_ail1_list;
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500154 struct gfs2_trans *tr;
Steven Whitehouse885bcec2014-02-03 09:57:29 +0000155 struct blk_plug plug;
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100156 bool withdraw = false;
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100157
Steven Whitehousec83ae9c2011-04-18 14:18:38 +0100158 trace_gfs2_ail_flush(sdp, wbc, 1);
Steven Whitehouse885bcec2014-02-03 09:57:29 +0000159 blk_start_plug(&plug);
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100160 spin_lock(&sdp->sd_ail_lock);
Steven Whitehouse4f1de012011-04-26 10:23:56 +0100161restart:
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500162 list_for_each_entry_reverse(tr, head, tr_list) {
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100163 if (wbc->nr_to_write <= 0)
164 break;
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100165 if (gfs2_ail1_start_one(sdp, wbc, tr, &withdraw))
Steven Whitehouse4f1de012011-04-26 10:23:56 +0100166 goto restart;
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100167 }
168 spin_unlock(&sdp->sd_ail_lock);
Steven Whitehouse885bcec2014-02-03 09:57:29 +0000169 blk_finish_plug(&plug);
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100170 if (withdraw)
171 gfs2_lm_withdraw(sdp, NULL);
Steven Whitehousec83ae9c2011-04-18 14:18:38 +0100172 trace_gfs2_ail_flush(sdp, wbc, 0);
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100173}
174
175/**
176 * gfs2_ail1_start - start writeback of all ail1 entries
177 * @sdp: The superblock
178 */
179
180static void gfs2_ail1_start(struct gfs2_sbd *sdp)
181{
182 struct writeback_control wbc = {
183 .sync_mode = WB_SYNC_NONE,
184 .nr_to_write = LONG_MAX,
185 .range_start = 0,
186 .range_end = LLONG_MAX,
187 };
188
189 return gfs2_ail1_flush(sdp, &wbc);
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400190}
191
192/**
193 * gfs2_ail1_empty_one - Check whether or not a trans in the AIL has been synced
194 * @sdp: the filesystem
195 * @ai: the AIL entry
196 *
197 */
198
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100199static void gfs2_ail1_empty_one(struct gfs2_sbd *sdp, struct gfs2_trans *tr,
200 bool *withdraw)
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400201{
202 struct gfs2_bufdata *bd, *s;
203 struct buffer_head *bh;
204
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500205 list_for_each_entry_safe_reverse(bd, s, &tr->tr_ail1_list,
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400206 bd_ail_st_list) {
207 bh = bd->bd_bh;
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500208 gfs2_assert(sdp, bd->bd_tr == tr);
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100209 if (buffer_busy(bh))
210 continue;
Bob Petersonb524abc2018-10-04 10:21:07 -0500211 if (!buffer_uptodate(bh) &&
212 !test_and_set_bit(SDF_AIL1_IO_ERROR, &sdp->sd_flags)) {
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400213 gfs2_io_error_bh(sdp, bh);
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100214 *withdraw = true;
215 }
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500216 list_move(&bd->bd_ail_st_list, &tr->tr_ail2_list);
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400217 }
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400218}
219
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100220/**
221 * gfs2_ail1_empty - Try to empty the ail1 lists
222 * @sdp: The superblock
223 *
224 * Tries to empty the ail1 lists, starting with the oldest first
225 */
David Teiglandb3b94fa2006-01-16 16:50:04 +0000226
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100227static int gfs2_ail1_empty(struct gfs2_sbd *sdp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000228{
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500229 struct gfs2_trans *tr, *s;
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500230 int oldest_tr = 1;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000231 int ret;
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100232 bool withdraw = false;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000233
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000234 spin_lock(&sdp->sd_ail_lock);
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500235 list_for_each_entry_safe_reverse(tr, s, &sdp->sd_ail1_list, tr_list) {
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100236 gfs2_ail1_empty_one(sdp, tr, &withdraw);
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500237 if (list_empty(&tr->tr_ail1_list) && oldest_tr)
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500238 list_move(&tr->tr_list, &sdp->sd_ail2_list);
Steven Whitehouse4667a0e2011-04-18 14:18:09 +0100239 else
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500240 oldest_tr = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000241 }
David Teiglandb3b94fa2006-01-16 16:50:04 +0000242 ret = list_empty(&sdp->sd_ail1_list);
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000243 spin_unlock(&sdp->sd_ail_lock);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000244
Andreas Gruenbacher9e1a9ec2018-06-07 11:56:46 +0100245 if (withdraw)
246 gfs2_lm_withdraw(sdp, "fatal: I/O error(s)\n");
247
David Teiglandb3b94fa2006-01-16 16:50:04 +0000248 return ret;
249}
250
Steven Whitehouse26b06a62011-05-21 19:21:07 +0100251static void gfs2_ail1_wait(struct gfs2_sbd *sdp)
252{
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500253 struct gfs2_trans *tr;
Steven Whitehouse26b06a62011-05-21 19:21:07 +0100254 struct gfs2_bufdata *bd;
255 struct buffer_head *bh;
256
257 spin_lock(&sdp->sd_ail_lock);
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500258 list_for_each_entry_reverse(tr, &sdp->sd_ail1_list, tr_list) {
259 list_for_each_entry(bd, &tr->tr_ail1_list, bd_ail_st_list) {
Steven Whitehouse26b06a62011-05-21 19:21:07 +0100260 bh = bd->bd_bh;
261 if (!buffer_locked(bh))
262 continue;
263 get_bh(bh);
264 spin_unlock(&sdp->sd_ail_lock);
265 wait_on_buffer(bh);
266 brelse(bh);
267 return;
268 }
269 }
270 spin_unlock(&sdp->sd_ail_lock);
271}
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400272
273/**
274 * gfs2_ail2_empty_one - Check whether or not a trans in the AIL has been synced
275 * @sdp: the filesystem
276 * @ai: the AIL entry
277 *
278 */
279
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500280static void gfs2_ail2_empty_one(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400281{
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500282 struct list_head *head = &tr->tr_ail2_list;
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400283 struct gfs2_bufdata *bd;
284
285 while (!list_empty(head)) {
286 bd = list_entry(head->prev, struct gfs2_bufdata,
287 bd_ail_st_list);
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500288 gfs2_assert(sdp, bd->bd_tr == tr);
Steven Whitehousef91a0d32007-10-15 16:29:05 +0100289 gfs2_remove_from_ail(bd);
Steven Whitehouseddacfaf2006-10-03 11:10:41 -0400290 }
291}
292
David Teiglandb3b94fa2006-01-16 16:50:04 +0000293static void ail2_empty(struct gfs2_sbd *sdp, unsigned int new_tail)
294{
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500295 struct gfs2_trans *tr, *safe;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000296 unsigned int old_tail = sdp->sd_log_tail;
297 int wrap = (new_tail < old_tail);
298 int a, b, rm;
299
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000300 spin_lock(&sdp->sd_ail_lock);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000301
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500302 list_for_each_entry_safe(tr, safe, &sdp->sd_ail2_list, tr_list) {
303 a = (old_tail <= tr->tr_first);
304 b = (tr->tr_first < new_tail);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000305 rm = (wrap) ? (a || b) : (a && b);
306 if (!rm)
307 continue;
308
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500309 gfs2_ail2_empty_one(sdp, tr);
310 list_del(&tr->tr_list);
311 gfs2_assert_warn(sdp, list_empty(&tr->tr_ail1_list));
312 gfs2_assert_warn(sdp, list_empty(&tr->tr_ail2_list));
313 kfree(tr);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000314 }
315
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000316 spin_unlock(&sdp->sd_ail_lock);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000317}
318
319/**
Benjamin Marzinski24972552014-05-01 22:26:55 -0500320 * gfs2_log_release - Release a given number of log blocks
321 * @sdp: The GFS2 superblock
322 * @blks: The number of blocks
323 *
324 */
325
326void gfs2_log_release(struct gfs2_sbd *sdp, unsigned int blks)
327{
328
329 atomic_add(blks, &sdp->sd_log_blks_free);
330 trace_gfs2_log_blocks(sdp, blks);
331 gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <=
332 sdp->sd_jdesc->jd_blocks);
333 up_read(&sdp->sd_log_flush_lock);
334}
335
336/**
 * gfs2_log_reserve - Make a log reservation
 * @sdp: The GFS2 superblock
 * @blks: The number of blocks to reserve
 *
 * Note that we never give out the last few blocks of the journal. That's
 * due to the fact that there is a small number of header blocks
 * associated with each log flush. The exact number can't be known until
 * flush time, so we ensure that we have just enough free blocks at all
 * times to avoid running out during a log flush.
 *
 * We no longer flush the log here, instead we wake up logd to do that
 * for us. To avoid the thundering herd and to ensure that we deal fairly
 * with queued waiters, we use an exclusive wait. This means that when we
 * get woken with enough journal space to get our reservation, we need to
 * wake the next waiter on the list.
 *
 * On success the read side of sd_log_flush_lock is left held. On the
 * -EROFS path the reservation and the lock are both given back through
 * gfs2_log_release() before returning.
 *
 * Returns: 0 on success, -EINVAL if @blks is zero or larger than the
 *          journal, -EROFS if SDF_JOURNAL_LIVE is not set
 */
355
356int gfs2_log_reserve(struct gfs2_sbd *sdp, unsigned int blks)
357{
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600358 int ret = 0;
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500359 unsigned reserved_blks = 7 * (4096 / sdp->sd_vfs->s_blocksize);
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500360 unsigned wanted = blks + reserved_blks;
361 DEFINE_WAIT(wait);
362 int did_wait = 0;
363 unsigned int free_blocks;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000364
365 if (gfs2_assert_warn(sdp, blks) ||
366 gfs2_assert_warn(sdp, blks <= sdp->sd_jdesc->jd_blocks))
367 return -EINVAL;
 /* Counted as "needed" until the reservation below succeeds */
Bob Petersonf07b3522017-01-05 16:01:45 -0500368 atomic_add(blks, &sdp->sd_log_blks_needed);
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500369retry:
370 free_blocks = atomic_read(&sdp->sd_log_blks_free);
371 if (unlikely(free_blocks <= wanted)) {
 /* Not enough room: poke logd and sleep until the free count exceeds wanted */
372 do {
373 prepare_to_wait_exclusive(&sdp->sd_log_waitq, &wait,
374 TASK_UNINTERRUPTIBLE);
375 wake_up(&sdp->sd_logd_waitq);
376 did_wait = 1;
377 if (atomic_read(&sdp->sd_log_blks_free) <= wanted)
378 io_schedule();
379 free_blocks = atomic_read(&sdp->sd_log_blks_free);
380 } while(free_blocks <= wanted);
381 finish_wait(&sdp->sd_log_waitq, &wait);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000382 }
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600383 atomic_inc(&sdp->sd_reserving_log);
 /*
  * Take the blocks only if the free count is still the value sampled
  * above; otherwise undo the sd_reserving_log bump and start over.
  */
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500384 if (atomic_cmpxchg(&sdp->sd_log_blks_free, free_blocks,
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600385 free_blocks - blks) != free_blocks) {
386 if (atomic_dec_and_test(&sdp->sd_reserving_log))
387 wake_up(&sdp->sd_reserving_log_wait);
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500388 goto retry;
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600389 }
Bob Petersonf07b3522017-01-05 16:01:45 -0500390 atomic_sub(blks, &sdp->sd_log_blks_needed);
Steven Whitehouse63997772009-06-12 08:49:20 +0100391 trace_gfs2_log_blocks(sdp, -blks);
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500392
393 /*
394 * If we waited, then so might others, wake them up _after_ we get
395 * our share of the log.
396 */
397 if (unlikely(did_wait))
398 wake_up(&sdp->sd_log_waitq);
Steven Whitehouse484adff2006-03-29 09:12:12 -0500399
400 down_read(&sdp->sd_log_flush_lock);
 /* Journal is not live: hand the blocks and the lock straight back */
Benjamin Marzinski24972552014-05-01 22:26:55 -0500401 if (unlikely(!test_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags))) {
402 gfs2_log_release(sdp, blks);
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600403 ret = -EROFS;
Benjamin Marzinski24972552014-05-01 22:26:55 -0500404 }
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600405 if (atomic_dec_and_test(&sdp->sd_reserving_log))
406 wake_up(&sdp->sd_reserving_log_wait);
407 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000408}
409
David Teiglandb3b94fa2006-01-16 16:50:04 +0000410/**
411 * log_distance - Compute distance between two journal blocks
412 * @sdp: The GFS2 superblock
413 * @newer: The most recent journal block of the pair
414 * @older: The older journal block of the pair
415 *
416 * Compute the distance (in the journal direction) between two
417 * blocks in the journal
418 *
419 * Returns: the distance in blocks
420 */
421
Steven Whitehousefaa31ce2006-09-13 11:13:27 -0400422static inline unsigned int log_distance(struct gfs2_sbd *sdp, unsigned int newer,
David Teiglandb3b94fa2006-01-16 16:50:04 +0000423 unsigned int older)
424{
425 int dist;
426
427 dist = newer - older;
428 if (dist < 0)
429 dist += sdp->sd_jdesc->jd_blocks;
430
431 return dist;
432}
433
Robert Peterson2332c442007-06-18 14:50:20 -0500434/**
435 * calc_reserved - Calculate the number of blocks to reserve when
436 * refunding a transaction's unused buffers.
437 * @sdp: The GFS2 superblock
438 *
439 * This is complex. We need to reserve room for all our currently used
440 * metadata buffers (e.g. normal file I/O rewriting file time stamps) and
441 * all our journaled data buffers for journaled files (e.g. files in the
442 * meta_fs like rindex, or files for which chattr +j was done.)
443 * If we don't reserve enough space, gfs2_log_refund and gfs2_log_flush
444 * will count it as free space (sd_log_blks_free) and corruption will follow.
445 *
446 * We can have metadata bufs and jdata bufs in the same journal. So each
447 * type gets its own log header, for which we need to reserve a block.
448 * In fact, each type has the potential for needing more than one header
449 * in cases where we have more buffers than will fit on a journal page.
450 * Metadata journal entries take up half the space of journaled buffer entries.
451 * Thus, metadata entries have buf_limit (502) and journaled buffers have
452 * databuf_limit (251) before they cause a wrap around.
453 *
454 * Also, we need to reserve blocks for revoke journal entries and one for an
455 * overall header for the lot.
456 *
457 * Returns: the number of blocks reserved
458 */
459static unsigned int calc_reserved(struct gfs2_sbd *sdp)
460{
461 unsigned int reserved = 0;
Steven Whitehouse022ef4f2014-02-21 21:55:33 +0000462 unsigned int mbuf;
463 unsigned int dbuf;
464 struct gfs2_trans *tr = sdp->sd_log_tr;
Robert Peterson2332c442007-06-18 14:50:20 -0500465
Steven Whitehouse022ef4f2014-02-21 21:55:33 +0000466 if (tr) {
467 mbuf = tr->tr_num_buf_new - tr->tr_num_buf_rm;
468 dbuf = tr->tr_num_databuf_new - tr->tr_num_databuf_rm;
469 reserved = mbuf + dbuf;
470 /* Account for header blocks */
471 reserved += DIV_ROUND_UP(mbuf, buf_limit(sdp));
472 reserved += DIV_ROUND_UP(dbuf, databuf_limit(sdp));
473 }
Robert Peterson2332c442007-06-18 14:50:20 -0500474
Benjamin Marzinski2e95e3f2010-03-10 18:10:19 -0600475 if (sdp->sd_log_commited_revoke > 0)
Steven Whitehouse022ef4f2014-02-21 21:55:33 +0000476 reserved += gfs2_struct2blk(sdp, sdp->sd_log_commited_revoke,
Robert Peterson2332c442007-06-18 14:50:20 -0500477 sizeof(u64));
Robert Peterson2332c442007-06-18 14:50:20 -0500478 /* One for the overall header */
479 if (reserved)
480 reserved++;
481 return reserved;
482}
483
David Teiglandb3b94fa2006-01-16 16:50:04 +0000484static unsigned int current_tail(struct gfs2_sbd *sdp)
485{
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500486 struct gfs2_trans *tr;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000487 unsigned int tail;
488
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000489 spin_lock(&sdp->sd_ail_lock);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000490
Steven Whitehousefaa31ce2006-09-13 11:13:27 -0400491 if (list_empty(&sdp->sd_ail1_list)) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000492 tail = sdp->sd_log_head;
Steven Whitehousefaa31ce2006-09-13 11:13:27 -0400493 } else {
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500494 tr = list_entry(sdp->sd_ail1_list.prev, struct gfs2_trans,
495 tr_list);
496 tail = tr->tr_first;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000497 }
498
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000499 spin_unlock(&sdp->sd_ail_lock);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000500
501 return tail;
502}
503
Robert Peterson2332c442007-06-18 14:50:20 -0500504static void log_pull_tail(struct gfs2_sbd *sdp, unsigned int new_tail)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000505{
506 unsigned int dist = log_distance(sdp, new_tail, sdp->sd_log_tail);
507
508 ail2_empty(sdp, new_tail);
509
Steven Whitehousefd041f02007-11-08 14:55:03 +0000510 atomic_add(dist, &sdp->sd_log_blks_free);
Steven Whitehouse63997772009-06-12 08:49:20 +0100511 trace_gfs2_log_blocks(sdp, dist);
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500512 gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <=
513 sdp->sd_jdesc->jd_blocks);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000514
515 sdp->sd_log_tail = new_tail;
516}
517
David Teiglandb3b94fa2006-01-16 16:50:04 +0000518
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000519static void log_flush_wait(struct gfs2_sbd *sdp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000520{
Steven Whitehouse16615be2007-09-17 10:59:52 +0100521 DEFINE_WAIT(wait);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000522
Steven Whitehouse16615be2007-09-17 10:59:52 +0100523 if (atomic_read(&sdp->sd_log_in_flight)) {
524 do {
525 prepare_to_wait(&sdp->sd_log_flush_wait, &wait,
526 TASK_UNINTERRUPTIBLE);
527 if (atomic_read(&sdp->sd_log_in_flight))
528 io_schedule();
529 } while(atomic_read(&sdp->sd_log_in_flight));
530 finish_wait(&sdp->sd_log_flush_wait, &wait);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000531 }
David Teiglandb3b94fa2006-01-16 16:50:04 +0000532}
533
Steven Whitehouse45138992013-01-28 09:30:07 +0000534static int ip_cmp(void *priv, struct list_head *a, struct list_head *b)
Bob Peterson4a36d082012-02-14 14:49:57 -0500535{
Steven Whitehouse45138992013-01-28 09:30:07 +0000536 struct gfs2_inode *ipa, *ipb;
Bob Peterson4a36d082012-02-14 14:49:57 -0500537
Steven Whitehouse45138992013-01-28 09:30:07 +0000538 ipa = list_entry(a, struct gfs2_inode, i_ordered);
539 ipb = list_entry(b, struct gfs2_inode, i_ordered);
Bob Peterson4a36d082012-02-14 14:49:57 -0500540
Steven Whitehouse45138992013-01-28 09:30:07 +0000541 if (ipa->i_no_addr < ipb->i_no_addr)
Bob Peterson4a36d082012-02-14 14:49:57 -0500542 return -1;
Steven Whitehouse45138992013-01-28 09:30:07 +0000543 if (ipa->i_no_addr > ipb->i_no_addr)
Bob Peterson4a36d082012-02-14 14:49:57 -0500544 return 1;
545 return 0;
546}
547
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100548static void gfs2_ordered_write(struct gfs2_sbd *sdp)
549{
Steven Whitehouse45138992013-01-28 09:30:07 +0000550 struct gfs2_inode *ip;
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100551 LIST_HEAD(written);
552
Steven Whitehouse45138992013-01-28 09:30:07 +0000553 spin_lock(&sdp->sd_ordered_lock);
Andreas Gruenbachera5b1d3f2019-04-05 12:16:14 +0100554 list_sort(NULL, &sdp->sd_log_ordered, &ip_cmp);
555 while (!list_empty(&sdp->sd_log_ordered)) {
556 ip = list_entry(sdp->sd_log_ordered.next, struct gfs2_inode, i_ordered);
Abhi Das1f23bc72017-12-22 07:55:31 -0600557 if (ip->i_inode.i_mapping->nrpages == 0) {
558 test_and_clear_bit(GIF_ORDERED, &ip->i_flags);
559 list_del(&ip->i_ordered);
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100560 continue;
Abhi Das1f23bc72017-12-22 07:55:31 -0600561 }
562 list_move(&ip->i_ordered, &written);
Steven Whitehouse45138992013-01-28 09:30:07 +0000563 spin_unlock(&sdp->sd_ordered_lock);
564 filemap_fdatawrite(ip->i_inode.i_mapping);
565 spin_lock(&sdp->sd_ordered_lock);
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100566 }
Andreas Gruenbachera5b1d3f2019-04-05 12:16:14 +0100567 list_splice(&written, &sdp->sd_log_ordered);
Steven Whitehouse45138992013-01-28 09:30:07 +0000568 spin_unlock(&sdp->sd_ordered_lock);
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100569}
570
571static void gfs2_ordered_wait(struct gfs2_sbd *sdp)
572{
Steven Whitehouse45138992013-01-28 09:30:07 +0000573 struct gfs2_inode *ip;
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100574
Steven Whitehouse45138992013-01-28 09:30:07 +0000575 spin_lock(&sdp->sd_ordered_lock);
Andreas Gruenbachera5b1d3f2019-04-05 12:16:14 +0100576 while (!list_empty(&sdp->sd_log_ordered)) {
577 ip = list_entry(sdp->sd_log_ordered.next, struct gfs2_inode, i_ordered);
Steven Whitehouse45138992013-01-28 09:30:07 +0000578 list_del(&ip->i_ordered);
579 WARN_ON(!test_and_clear_bit(GIF_ORDERED, &ip->i_flags));
580 if (ip->i_inode.i_mapping->nrpages == 0)
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100581 continue;
Steven Whitehouse45138992013-01-28 09:30:07 +0000582 spin_unlock(&sdp->sd_ordered_lock);
583 filemap_fdatawait(ip->i_inode.i_mapping);
584 spin_lock(&sdp->sd_ordered_lock);
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100585 }
Steven Whitehouse45138992013-01-28 09:30:07 +0000586 spin_unlock(&sdp->sd_ordered_lock);
587}
588
589void gfs2_ordered_del_inode(struct gfs2_inode *ip)
590{
591 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
592
593 spin_lock(&sdp->sd_ordered_lock);
594 if (test_and_clear_bit(GIF_ORDERED, &ip->i_flags))
595 list_del(&ip->i_ordered);
596 spin_unlock(&sdp->sd_ordered_lock);
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100597}
598
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500599void gfs2_add_revoke(struct gfs2_sbd *sdp, struct gfs2_bufdata *bd)
600{
601 struct buffer_head *bh = bd->bd_bh;
602 struct gfs2_glock *gl = bd->bd_gl;
603
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500604 bh->b_private = NULL;
605 bd->bd_blkno = bh->b_blocknr;
Bob Peterson9290a9a2013-12-10 12:06:35 -0500606 gfs2_remove_from_ail(bd); /* drops ref on bh */
607 bd->bd_bh = NULL;
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500608 sdp->sd_log_num_revoke++;
Bob Peterson73118ca2019-04-05 04:41:38 +0100609 if (!test_bit(GLF_REVOKES, &gl->gl_flags)) {
610 set_bit(GLF_REVOKES, &gl->gl_flags);
Andreas Gruenbacher9287c642019-04-04 21:11:11 +0100611 gfs2_glock_hold(gl);
Bob Peterson73118ca2019-04-05 04:41:38 +0100612 }
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500613 set_bit(GLF_LFLUSH, &gl->gl_flags);
Andreas Gruenbachera5b1d3f2019-04-05 12:16:14 +0100614 list_add(&bd->bd_list, &sdp->sd_log_revokes);
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500615}
616
/**
 * gfs2_write_revokes - queue revokes for ail2 buffers while there is room
 * @sdp: The GFS2 superblock
 *
 * After trying to empty ail1, looks through the tr_ail2_list of every
 * transaction still on sd_ail1_list for a buffer whose bd_list is empty.
 * If there is one, works out how many more revoke entries fit into the
 * revoke block(s) already needed for sd_log_num_revoke and calls
 * gfs2_add_revoke() on such buffers until that room is used up.
 *
 * When no revokes were pending on entry, one log block (two if
 * sd_log_blks_reserved is zero) is taken from sd_log_blks_free up front and
 * given back at the end if still no revoke was added.
 */
617void gfs2_write_revokes(struct gfs2_sbd *sdp)
618{
619 struct gfs2_trans *tr;
620 struct gfs2_bufdata *bd, *tmp;
621 int have_revokes = 0;
 /* Number of u64 entries that fit after a log descriptor in one block */
622 int max_revokes = (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_log_descriptor)) / sizeof(u64);
623
624 gfs2_ail1_empty(sdp);
625 spin_lock(&sdp->sd_ail_lock);
 /* First pass: is there any candidate at all? */
Bob Petersonc9e58fb2018-10-15 12:17:30 -0500626 list_for_each_entry_reverse(tr, &sdp->sd_ail1_list, tr_list) {
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500627 list_for_each_entry(bd, &tr->tr_ail2_list, bd_ail_st_list) {
628 if (list_empty(&bd->bd_list)) {
629 have_revokes = 1;
630 goto done;
631 }
632 }
633 }
634done:
635 spin_unlock(&sdp->sd_ail_lock);
636 if (have_revokes == 0)
637 return;
 /*
  * Grow the capacity one continuation block (meta header + u64 entries)
  * at a time until it covers the revokes already pending, then keep only
  * the spare room.
  */
638 while (sdp->sd_log_num_revoke > max_revokes)
639 max_revokes += (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_meta_header)) / sizeof(u64);
640 max_revokes -= sdp->sd_log_num_revoke;
 /* No revoke block accounted for yet: take one provisionally */
641 if (!sdp->sd_log_num_revoke) {
642 atomic_dec(&sdp->sd_log_blks_free);
643 /* If no blocks have been reserved, we need to also
644 * reserve a block for the header */
645 if (!sdp->sd_log_blks_reserved)
646 atomic_dec(&sdp->sd_log_blks_free);
647 }
648 gfs2_log_lock(sdp);
649 spin_lock(&sdp->sd_ail_lock);
 /* Second pass: queue revokes until the spare room runs out */
Bob Petersonc9e58fb2018-10-15 12:17:30 -0500650 list_for_each_entry_reverse(tr, &sdp->sd_ail1_list, tr_list) {
Benjamin Marzinski5d054962013-06-14 11:38:29 -0500651 list_for_each_entry_safe(bd, tmp, &tr->tr_ail2_list, bd_ail_st_list) {
652 if (max_revokes == 0)
653 goto out_of_blocks;
654 if (!list_empty(&bd->bd_list))
655 continue;
656 gfs2_add_revoke(sdp, bd);
657 max_revokes--;
658 }
659 }
660out_of_blocks:
661 spin_unlock(&sdp->sd_ail_lock);
662 gfs2_log_unlock(sdp);
663
 /* Nothing was queued after all: return the provisional block(s) */
664 if (!sdp->sd_log_num_revoke) {
665 atomic_inc(&sdp->sd_log_blks_free);
666 if (!sdp->sd_log_blks_reserved)
667 atomic_inc(&sdp->sd_log_blks_free);
668 }
669}
670
David Teiglandb3b94fa2006-01-16 16:50:04 +0000671/**
Bob Peterson7c70b892019-03-25 09:34:19 -0600672 * gfs2_write_log_header - Write a journal log header buffer at lblock
Bob Peterson588bff92017-12-18 12:48:29 -0600673 * @sdp: The GFS2 superblock
Bob Petersonc1696fb2018-01-17 00:01:33 +0100674 * @jd: journal descriptor of the journal to which we are writing
Bob Peterson588bff92017-12-18 12:48:29 -0600675 * @seq: sequence number
676 * @tail: tail of the log
Bob Peterson7c70b892019-03-25 09:34:19 -0600677 * @lblock: value for lh_blkno (block number relative to start of journal)
Bob Petersonc1696fb2018-01-17 00:01:33 +0100678 * @flags: log header flags GFS2_LOG_HEAD_*
Bob Peterson588bff92017-12-18 12:48:29 -0600679 * @op_flags: flags to pass to the bio
680 *
681 * Returns: the initialized log buffer descriptor
682 */
683
Bob Petersonc1696fb2018-01-17 00:01:33 +0100684void gfs2_write_log_header(struct gfs2_sbd *sdp, struct gfs2_jdesc *jd,
Bob Peterson7c70b892019-03-25 09:34:19 -0600685 u64 seq, u32 tail, u32 lblock, u32 flags,
686 int op_flags)
Bob Peterson588bff92017-12-18 12:48:29 -0600687{
688 struct gfs2_log_header *lh;
Bob Petersonc1696fb2018-01-17 00:01:33 +0100689 u32 hash, crc;
Bob Peterson588bff92017-12-18 12:48:29 -0600690 struct page *page = mempool_alloc(gfs2_page_pool, GFP_NOIO);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100691 struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
692 struct timespec64 tv;
693 struct super_block *sb = sdp->sd_vfs;
Bob Peterson7c70b892019-03-25 09:34:19 -0600694 u64 dblock;
Bob Peterson588bff92017-12-18 12:48:29 -0600695
696 lh = page_address(page);
697 clear_page(lh);
698
699 lh->lh_header.mh_magic = cpu_to_be32(GFS2_MAGIC);
700 lh->lh_header.mh_type = cpu_to_be32(GFS2_METATYPE_LH);
701 lh->lh_header.__pad0 = cpu_to_be64(0);
702 lh->lh_header.mh_format = cpu_to_be32(GFS2_FORMAT_LH);
703 lh->lh_header.mh_jid = cpu_to_be32(sdp->sd_jdesc->jd_jid);
704 lh->lh_sequence = cpu_to_be64(seq);
705 lh->lh_flags = cpu_to_be32(flags);
706 lh->lh_tail = cpu_to_be32(tail);
Bob Peterson7c70b892019-03-25 09:34:19 -0600707 lh->lh_blkno = cpu_to_be32(lblock);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100708 hash = ~crc32(~0, lh, LH_V1_SIZE);
Bob Peterson588bff92017-12-18 12:48:29 -0600709 lh->lh_hash = cpu_to_be32(hash);
710
Arnd Bergmannee9c7f92018-06-20 15:15:24 -0500711 ktime_get_coarse_real_ts64(&tv);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100712 lh->lh_nsec = cpu_to_be32(tv.tv_nsec);
713 lh->lh_sec = cpu_to_be64(tv.tv_sec);
Bob Peterson7c70b892019-03-25 09:34:19 -0600714 if (!list_empty(&jd->extent_list))
715 dblock = gfs2_log_bmap(sdp);
716 else {
717 int ret = gfs2_lblk_to_dblk(jd->jd_inode, lblock, &dblock);
718 if (gfs2_assert_withdraw(sdp, ret == 0))
719 return;
720 }
721 lh->lh_addr = cpu_to_be64(dblock);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100722 lh->lh_jinode = cpu_to_be64(GFS2_I(jd->jd_inode)->i_no_addr);
723
724 /* We may only write local statfs, quota, etc., when writing to our
725 own journal. The values are left 0 when recovering a journal
726 different from our own. */
727 if (!(flags & GFS2_LOG_HEAD_RECOVERY)) {
728 lh->lh_statfs_addr =
729 cpu_to_be64(GFS2_I(sdp->sd_sc_inode)->i_no_addr);
730 lh->lh_quota_addr =
731 cpu_to_be64(GFS2_I(sdp->sd_qc_inode)->i_no_addr);
732
733 spin_lock(&sdp->sd_statfs_spin);
734 lh->lh_local_total = cpu_to_be64(l_sc->sc_total);
735 lh->lh_local_free = cpu_to_be64(l_sc->sc_free);
736 lh->lh_local_dinodes = cpu_to_be64(l_sc->sc_dinodes);
737 spin_unlock(&sdp->sd_statfs_spin);
738 }
739
740 BUILD_BUG_ON(offsetof(struct gfs2_log_header, lh_crc) != LH_V1_SIZE);
741
742 crc = crc32c(~0, (void *)lh + LH_V1_SIZE + 4,
743 sb->s_blocksize - LH_V1_SIZE - 4);
744 lh->lh_crc = cpu_to_be32(crc);
745
Bob Peterson7c70b892019-03-25 09:34:19 -0600746 gfs2_log_write(sdp, page, sb->s_blocksize, 0, dblock);
Abhi Dasf4686c22019-05-02 14:17:40 -0500747 gfs2_log_submit_bio(&sdp->sd_log_bio, REQ_OP_WRITE | op_flags);
Bob Peterson588bff92017-12-18 12:48:29 -0600748 log_flush_wait(sdp);
749}
750
751/**
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000752 * log_write_header - Get and initialize a journal header buffer
753 * @sdp: The GFS2 superblock
Bob Petersonc1696fb2018-01-17 00:01:33 +0100754 * @flags: The log header flags, including log header origin
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000755 *
756 * Returns: the initialized log buffer descriptor
757 */
758
Steven Whitehousefdb76a42012-04-02 15:34:36 +0100759static void log_write_header(struct gfs2_sbd *sdp, u32 flags)
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000760{
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000761 unsigned int tail;
Jan Kara0f0b9b62017-05-02 13:14:13 +0200762 int op_flags = REQ_PREFLUSH | REQ_FUA | REQ_META | REQ_SYNC;
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600763 enum gfs2_freeze_state state = atomic_read(&sdp->sd_freeze_state);
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000764
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600765 gfs2_assert_withdraw(sdp, (state != SFS_FROZEN));
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000766 tail = current_tail(sdp);
767
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000768 if (test_bit(SDF_NOBARRIERS, &sdp->sd_flags)) {
769 gfs2_ordered_wait(sdp);
770 log_flush_wait(sdp);
Christoph Hellwig70fd7612016-11-01 07:40:10 -0600771 op_flags = REQ_SYNC | REQ_META | REQ_PRIO;
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000772 }
Steven Whitehousee8c92ed2012-04-16 09:28:31 +0100773 sdp->sd_log_idle = (tail == sdp->sd_log_flush_head);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100774 gfs2_write_log_header(sdp, sdp->sd_jdesc, sdp->sd_log_sequence++, tail,
Bob Peterson7c70b892019-03-25 09:34:19 -0600775 sdp->sd_log_flush_head, flags, op_flags);
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000776
777 if (sdp->sd_log_tail != tail)
778 log_pull_tail(sdp, tail);
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000779}
780
781/**
Steven Whitehouseb09e5932006-04-07 11:17:32 -0400782 * gfs2_log_flush - flush incore transaction(s)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000783 * @sdp: the filesystem
784 * @gl: The glock structure to flush. If NULL, flush the whole incore log
Bob Peterson805c09072018-01-08 10:34:17 -0500785 * @flags: The log header flags: GFS2_LOG_HEAD_FLUSH_* and debug flags
David Teiglandb3b94fa2006-01-16 16:50:04 +0000786 *
787 */
788
Bob Petersonc1696fb2018-01-17 00:01:33 +0100789void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl, u32 flags)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000790{
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500791 struct gfs2_trans *tr;
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600792 enum gfs2_freeze_state state = atomic_read(&sdp->sd_freeze_state);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000793
Steven Whitehouse484adff2006-03-29 09:12:12 -0500794 down_write(&sdp->sd_log_flush_lock);
Steven Whitehousef55ab262006-02-21 12:51:39 +0000795
Steven Whitehouse2bcd6102007-11-08 14:25:12 +0000796 /* Log might have been flushed while we waited for the flush lock */
797 if (gl && !test_bit(GLF_LFLUSH, &gl->gl_flags)) {
798 up_write(&sdp->sd_log_flush_lock);
799 return;
Steven Whitehousef55ab262006-02-21 12:51:39 +0000800 }
Bob Peterson805c09072018-01-08 10:34:17 -0500801 trace_gfs2_log_flush(sdp, 1, flags);
Steven Whitehousef55ab262006-02-21 12:51:39 +0000802
Bob Petersonc1696fb2018-01-17 00:01:33 +0100803 if (flags & GFS2_LOG_HEAD_FLUSH_SHUTDOWN)
Benjamin Marzinski400ac522015-12-09 07:46:33 -0600804 clear_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags);
805
Steven Whitehouseb1ab1e42014-02-25 11:52:20 +0000806 sdp->sd_log_flush_head = sdp->sd_log_head;
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500807 tr = sdp->sd_log_tr;
808 if (tr) {
809 sdp->sd_log_tr = NULL;
810 INIT_LIST_HEAD(&tr->tr_ail1_list);
811 INIT_LIST_HEAD(&tr->tr_ail2_list);
Steven Whitehouseb1ab1e42014-02-25 11:52:20 +0000812 tr->tr_first = sdp->sd_log_flush_head;
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600813 if (unlikely (state == SFS_FROZEN))
814 gfs2_assert_withdraw(sdp, !tr->tr_num_buf_new && !tr->tr_num_databuf_new);
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500815 }
David Teiglandb3b94fa2006-01-16 16:50:04 +0000816
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600817 if (unlikely(state == SFS_FROZEN))
818 gfs2_assert_withdraw(sdp, !sdp->sd_log_num_revoke);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000819 gfs2_assert_withdraw(sdp,
820 sdp->sd_log_num_revoke == sdp->sd_log_commited_revoke);
821
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100822 gfs2_ordered_write(sdp);
Steven Whitehoused69a3c62014-02-21 15:22:35 +0000823 lops_before_commit(sdp, tr);
Abhi Dasf4686c22019-05-02 14:17:40 -0500824 gfs2_log_submit_bio(&sdp->sd_log_bio, REQ_OP_WRITE);
Steven Whitehoused7b616e2007-09-02 10:48:13 +0100825
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000826 if (sdp->sd_log_head != sdp->sd_log_flush_head) {
Bob Peterson428fd952014-03-12 10:34:16 -0400827 log_flush_wait(sdp);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100828 log_write_header(sdp, flags);
Steven Whitehouse34cc1782012-03-09 10:45:56 +0000829 } else if (sdp->sd_log_tail != current_tail(sdp) && !sdp->sd_log_idle){
Steven Whitehousefd041f02007-11-08 14:55:03 +0000830 atomic_dec(&sdp->sd_log_blks_free); /* Adjust for unreserved buffer */
Steven Whitehouse63997772009-06-12 08:49:20 +0100831 trace_gfs2_log_blocks(sdp, -1);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100832 log_write_header(sdp, flags);
Robert Peterson2332c442007-06-18 14:50:20 -0500833 }
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500834 lops_after_commit(sdp, tr);
Steven Whitehousefe1a6982006-10-11 13:34:59 -0400835
836 gfs2_log_lock(sdp);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000837 sdp->sd_log_head = sdp->sd_log_flush_head;
Steven Whitehousefaa31ce2006-09-13 11:13:27 -0400838 sdp->sd_log_blks_reserved = 0;
Steven Whitehousefaa31ce2006-09-13 11:13:27 -0400839 sdp->sd_log_commited_revoke = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000840
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000841 spin_lock(&sdp->sd_ail_lock);
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500842 if (tr && !list_empty(&tr->tr_ail1_list)) {
843 list_add(&tr->tr_list, &sdp->sd_ail1_list);
844 tr = NULL;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000845 }
Dave Chinnerd6a079e2011-03-11 11:52:25 +0000846 spin_unlock(&sdp->sd_ail_lock);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000847 gfs2_log_unlock(sdp);
Benjamin Marzinski24972552014-05-01 22:26:55 -0500848
Bob Petersonc1696fb2018-01-17 00:01:33 +0100849 if (!(flags & GFS2_LOG_HEAD_FLUSH_NORMAL)) {
Benjamin Marzinski24972552014-05-01 22:26:55 -0500850 if (!sdp->sd_log_idle) {
851 for (;;) {
852 gfs2_ail1_start(sdp);
853 gfs2_ail1_wait(sdp);
854 if (gfs2_ail1_empty(sdp))
855 break;
856 }
857 atomic_dec(&sdp->sd_log_blks_free); /* Adjust for unreserved buffer */
858 trace_gfs2_log_blocks(sdp, -1);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100859 log_write_header(sdp, flags);
Benjamin Marzinski24972552014-05-01 22:26:55 -0500860 sdp->sd_log_head = sdp->sd_log_flush_head;
861 }
Bob Petersonc1696fb2018-01-17 00:01:33 +0100862 if (flags & (GFS2_LOG_HEAD_FLUSH_SHUTDOWN |
863 GFS2_LOG_HEAD_FLUSH_FREEZE))
Benjamin Marzinski24972552014-05-01 22:26:55 -0500864 gfs2_log_shutdown(sdp);
Bob Petersonc1696fb2018-01-17 00:01:33 +0100865 if (flags & GFS2_LOG_HEAD_FLUSH_FREEZE)
Benjamin Marzinski2e60d762014-11-13 20:42:04 -0600866 atomic_set(&sdp->sd_freeze_state, SFS_FROZEN);
Benjamin Marzinski24972552014-05-01 22:26:55 -0500867 }
868
Bob Peterson805c09072018-01-08 10:34:17 -0500869 trace_gfs2_log_flush(sdp, 0, flags);
Steven Whitehouse484adff2006-03-29 09:12:12 -0500870 up_write(&sdp->sd_log_flush_lock);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000871
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500872 kfree(tr);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000873}
874
Steven Whitehoused69a3c62014-02-21 15:22:35 +0000875/**
876 * gfs2_merge_trans - Merge a new transaction into a cached transaction
877 * @old: Original transaction to be expanded
878 * @new: New transaction to be merged
879 */
880
881static void gfs2_merge_trans(struct gfs2_trans *old, struct gfs2_trans *new)
882{
Bob Peterson9862ca02017-01-25 12:50:47 -0500883 WARN_ON_ONCE(!test_bit(TR_ATTACHED, &old->tr_flags));
Steven Whitehoused69a3c62014-02-21 15:22:35 +0000884
885 old->tr_num_buf_new += new->tr_num_buf_new;
886 old->tr_num_databuf_new += new->tr_num_databuf_new;
887 old->tr_num_buf_rm += new->tr_num_buf_rm;
888 old->tr_num_databuf_rm += new->tr_num_databuf_rm;
889 old->tr_num_revoke += new->tr_num_revoke;
890 old->tr_num_revoke_rm += new->tr_num_revoke_rm;
891
892 list_splice_tail_init(&new->tr_databuf, &old->tr_databuf);
893 list_splice_tail_init(&new->tr_buf, &old->tr_buf);
894}
895
David Teiglandb3b94fa2006-01-16 16:50:04 +0000896static void log_refund(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
897{
Robert Peterson2332c442007-06-18 14:50:20 -0500898 unsigned int reserved;
Steven Whitehouseac39aad2008-01-10 14:49:43 +0000899 unsigned int unused;
Steven Whitehouse022ef4f2014-02-21 21:55:33 +0000900 unsigned int maxres;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000901
902 gfs2_log_lock(sdp);
903
Steven Whitehoused69a3c62014-02-21 15:22:35 +0000904 if (sdp->sd_log_tr) {
905 gfs2_merge_trans(sdp->sd_log_tr, tr);
906 } else if (tr->tr_num_buf_new || tr->tr_num_databuf_new) {
Bob Peterson9862ca02017-01-25 12:50:47 -0500907 gfs2_assert_withdraw(sdp, test_bit(TR_ALLOCED, &tr->tr_flags));
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500908 sdp->sd_log_tr = tr;
Bob Peterson9862ca02017-01-25 12:50:47 -0500909 set_bit(TR_ATTACHED, &tr->tr_flags);
Benjamin Marzinski16ca9412013-04-05 20:31:46 -0500910 }
Steven Whitehouse022ef4f2014-02-21 21:55:33 +0000911
912 sdp->sd_log_commited_revoke += tr->tr_num_revoke - tr->tr_num_revoke_rm;
913 reserved = calc_reserved(sdp);
914 maxres = sdp->sd_log_blks_reserved + tr->tr_reserved;
915 gfs2_assert_withdraw(sdp, maxres >= reserved);
916 unused = maxres - reserved;
917 atomic_add(unused, &sdp->sd_log_blks_free);
918 trace_gfs2_log_blocks(sdp, unused);
919 gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <=
920 sdp->sd_jdesc->jd_blocks);
921 sdp->sd_log_blks_reserved = reserved;
922
David Teiglandb3b94fa2006-01-16 16:50:04 +0000923 gfs2_log_unlock(sdp);
924}
925
926/**
927 * gfs2_log_commit - Commit a transaction to the log
928 * @sdp: the filesystem
929 * @tr: the transaction
930 *
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500931 * We wake up gfs2_logd if the number of pinned blocks exceed thresh1
932 * or the total number of used blocks (pinned blocks plus AIL blocks)
933 * is greater than thresh2.
934 *
935 * At mount time thresh1 is 1/3rd of journal size, thresh2 is 2/3rd of
936 * journal size.
937 *
David Teiglandb3b94fa2006-01-16 16:50:04 +0000938 * Returns: errno
939 */
940
941void gfs2_log_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
942{
943 log_refund(sdp, tr);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000944
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500945 if (atomic_read(&sdp->sd_log_pinned) > atomic_read(&sdp->sd_log_thresh1) ||
946 ((sdp->sd_jdesc->jd_blocks - atomic_read(&sdp->sd_log_blks_free)) >
947 atomic_read(&sdp->sd_log_thresh2)))
948 wake_up(&sdp->sd_logd_waitq);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000949}
950
951/**
952 * gfs2_log_shutdown - write a shutdown header into a journal
953 * @sdp: the filesystem
954 *
955 */
956
957void gfs2_log_shutdown(struct gfs2_sbd *sdp)
958{
David Teiglandb3b94fa2006-01-16 16:50:04 +0000959 gfs2_assert_withdraw(sdp, !sdp->sd_log_blks_reserved);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000960 gfs2_assert_withdraw(sdp, !sdp->sd_log_num_revoke);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000961 gfs2_assert_withdraw(sdp, list_empty(&sdp->sd_ail1_list));
962
963 sdp->sd_log_flush_head = sdp->sd_log_head;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000964
Bob Peterson805c09072018-01-08 10:34:17 -0500965 log_write_header(sdp, GFS2_LOG_HEAD_UNMOUNT | GFS2_LFC_SHUTDOWN);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000966
Steven Whitehousea74604b2006-04-21 15:10:46 -0400967 gfs2_assert_warn(sdp, sdp->sd_log_head == sdp->sd_log_tail);
968 gfs2_assert_warn(sdp, list_empty(&sdp->sd_ail2_list));
David Teiglandb3b94fa2006-01-16 16:50:04 +0000969
970 sdp->sd_log_head = sdp->sd_log_flush_head;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000971 sdp->sd_log_tail = sdp->sd_log_head;
Steven Whitehousea25311c2006-11-23 11:06:35 -0500972}
973
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500974static inline int gfs2_jrnl_flush_reqd(struct gfs2_sbd *sdp)
975{
Bob Petersonf07b3522017-01-05 16:01:45 -0500976 return (atomic_read(&sdp->sd_log_pinned) +
977 atomic_read(&sdp->sd_log_blks_needed) >=
978 atomic_read(&sdp->sd_log_thresh1));
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500979}
980
981static inline int gfs2_ail_flush_reqd(struct gfs2_sbd *sdp)
982{
983 unsigned int used_blocks = sdp->sd_jdesc->jd_blocks - atomic_read(&sdp->sd_log_blks_free);
Abhi Dasb066a4eeb2017-08-04 12:15:32 -0500984
985 if (test_and_clear_bit(SDF_FORCE_AIL_FLUSH, &sdp->sd_flags))
986 return 1;
987
Bob Petersonf07b3522017-01-05 16:01:45 -0500988 return used_blocks + atomic_read(&sdp->sd_log_blks_needed) >=
989 atomic_read(&sdp->sd_log_thresh2);
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -0500990}
Steven Whitehouseec69b182007-11-09 10:01:41 +0000991
992/**
993 * gfs2_logd - Update log tail as Active Items get flushed to in-place blocks
994 * @sdp: Pointer to GFS2 superblock
995 *
996 * Also, periodically check to make sure that we're using the most recent
997 * journal index.
998 */
999
1000int gfs2_logd(void *data)
1001{
1002 struct gfs2_sbd *sdp = data;
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -05001003 unsigned long t = 1;
1004 DEFINE_WAIT(wait);
Bob Petersonb63f5e82017-01-06 22:14:28 -05001005 bool did_flush;
Steven Whitehouseec69b182007-11-09 10:01:41 +00001006
1007 while (!kthread_should_stop()) {
Steven Whitehouseec69b182007-11-09 10:01:41 +00001008
Bob Peterson942b0cd2017-08-16 11:30:06 -05001009 /* Check for errors writing to the journal */
1010 if (sdp->sd_log_error) {
1011 gfs2_lm_withdraw(sdp,
1012 "GFS2: fsid=%s: error %d: "
1013 "withdrawing the file system to "
1014 "prevent further damage.\n",
1015 sdp->sd_fsname, sdp->sd_log_error);
1016 }
1017
Bob Petersonb63f5e82017-01-06 22:14:28 -05001018 did_flush = false;
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -05001019 if (gfs2_jrnl_flush_reqd(sdp) || t == 0) {
Steven Whitehouse4667a0e2011-04-18 14:18:09 +01001020 gfs2_ail1_empty(sdp);
Bob Peterson805c09072018-01-08 10:34:17 -05001021 gfs2_log_flush(sdp, NULL, GFS2_LOG_HEAD_FLUSH_NORMAL |
1022 GFS2_LFC_LOGD_JFLUSH_REQD);
Bob Petersonb63f5e82017-01-06 22:14:28 -05001023 did_flush = true;
Steven Whitehouseec69b182007-11-09 10:01:41 +00001024 }
1025
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -05001026 if (gfs2_ail_flush_reqd(sdp)) {
1027 gfs2_ail1_start(sdp);
Steven Whitehouse26b06a62011-05-21 19:21:07 +01001028 gfs2_ail1_wait(sdp);
Steven Whitehouse4667a0e2011-04-18 14:18:09 +01001029 gfs2_ail1_empty(sdp);
Bob Peterson805c09072018-01-08 10:34:17 -05001030 gfs2_log_flush(sdp, NULL, GFS2_LOG_HEAD_FLUSH_NORMAL |
1031 GFS2_LFC_LOGD_AIL_FLUSH_REQD);
Bob Petersonb63f5e82017-01-06 22:14:28 -05001032 did_flush = true;
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -05001033 }
1034
Bob Petersonb63f5e82017-01-06 22:14:28 -05001035 if (!gfs2_ail_flush_reqd(sdp) || did_flush)
Steven Whitehouse26b06a62011-05-21 19:21:07 +01001036 wake_up(&sdp->sd_log_waitq);
1037
Steven Whitehouseec69b182007-11-09 10:01:41 +00001038 t = gfs2_tune_get(sdp, gt_logd_secs) * HZ;
Tejun Heoa0acae02011-11-21 12:32:22 -08001039
1040 try_to_freeze();
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -05001041
1042 do {
1043 prepare_to_wait(&sdp->sd_logd_waitq, &wait,
Steven Whitehouse5f487492010-09-09 14:45:00 +01001044 TASK_INTERRUPTIBLE);
Benjamin Marzinski5e687ea2010-05-04 14:29:16 -05001045 if (!gfs2_ail_flush_reqd(sdp) &&
1046 !gfs2_jrnl_flush_reqd(sdp) &&
1047 !kthread_should_stop())
1048 t = schedule_timeout(t);
1049 } while(t && !gfs2_ail_flush_reqd(sdp) &&
1050 !gfs2_jrnl_flush_reqd(sdp) &&
1051 !kthread_should_stop());
1052 finish_wait(&sdp->sd_logd_waitq, &wait);
Steven Whitehouseec69b182007-11-09 10:01:41 +00001053 }
1054
1055 return 0;
1056}
1057