blob: 1852ed9de7fd56bf9f0d9b41d96a29e5a3e66cac [file] [log] [blame]
/* SPDX-License-Identifier: GPL-2.0 */
/*
 * Copyright (C) 2007 Oracle.  All rights reserved.
 */
5
David Sterba9888c342018-04-03 19:16:55 +02006#ifndef BTRFS_TRANSACTION_H
7#define BTRFS_TRANSACTION_H
Elena Reshetova9b64f572017-03-03 10:55:11 +02008
9#include <linux/refcount.h>
Chris Mason31f3c992007-04-30 15:25:45 -040010#include "btrfs_inode.h"
Chris Mason56bec292009-03-13 10:10:06 -040011#include "delayed-ref.h"
Arne Jansenbed92ea2012-06-28 18:03:02 +020012#include "ctree.h"
Chris Masone089f052007-03-16 16:20:31 -040013
/*
 * States a transaction can be in, numbered from 0 in declaration order.
 * TRANS_STATE_MAX comes last, so its value equals the number of states
 * declared before it.
 */
enum btrfs_trans_state {
	TRANS_STATE_RUNNING,
	TRANS_STATE_COMMIT_START,
	TRANS_STATE_COMMIT_DOING,
	TRANS_STATE_UNBLOCKED,
	TRANS_STATE_SUPER_COMMITTED,
	TRANS_STATE_COMPLETED,
	TRANS_STATE_MAX,
};
23
/*
 * Small consecutive integers - presumably bit numbers for
 * btrfs_transaction::flags (used with set_bit/test_bit); TODO confirm
 * against the callers.
 */
#define BTRFS_TRANS_HAVE_FREE_BGS	0
#define BTRFS_TRANS_DIRTY_BG_RUN	1
#define BTRFS_TRANS_CACHE_ENOSPC	2
Josef Bacik3204d332015-09-24 10:46:10 -040027
Chris Mason79154b12007-03-22 15:59:16 -040028struct btrfs_transaction {
29 u64 transid;
Chris Masonb7ec40d2009-03-12 20:12:45 -040030 /*
Miao Xie0860adf2013-05-15 07:48:27 +000031 * total external writers(USERSPACE/START/ATTACH) in this
32 * transaction, it must be zero before the transaction is
33 * being committed
34 */
35 atomic_t num_extwriters;
36 /*
Chris Masonb7ec40d2009-03-12 20:12:45 -040037 * total writers in this transaction, it must be zero before the
38 * transaction can end
39 */
Josef Bacik13c5a932011-04-11 15:45:29 -040040 atomic_t num_writers;
Elena Reshetova9b64f572017-03-03 10:55:11 +020041 refcount_t use_count;
Chris Masonb7ec40d2009-03-12 20:12:45 -040042
Josef Bacik3204d332015-09-24 10:46:10 -040043 unsigned long flags;
Zhao Lei13212b52015-02-12 14:18:17 +080044
Miao Xie4a9d8bd2013-05-17 03:53:43 +000045 /* Be protected by fs_info->trans_lock when we want to change it. */
46 enum btrfs_trans_state state;
David Sterba5302e082017-11-08 01:54:33 +010047 int aborted;
Chris Mason8fd17792007-04-19 21:01:03 -040048 struct list_head list;
Chris Masond1310b22008-01-24 16:13:08 -050049 struct extent_io_tree dirty_pages;
Allen Paisa9444422018-06-12 17:18:25 +053050 time64_t start_time;
Chris Mason79154b12007-03-22 15:59:16 -040051 wait_queue_head_t writer_wait;
52 wait_queue_head_t commit_wait;
Chris Mason3063d292008-01-08 15:46:30 -050053 struct list_head pending_snapshots;
Nikolay Borisovbbbf7242019-03-25 14:31:22 +020054 struct list_head dev_update_list;
Josef Bacik9e351cc2014-03-13 15:42:13 -040055 struct list_head switch_commits;
Josef Bacikce93ec52014-11-17 15:45:48 -050056 struct list_head dirty_bgs;
Nikolay Borisov45ae2c12018-02-08 18:25:18 +020057
58 /*
59 * There is no explicit lock which protects io_bgs, rather its
60 * consistency is implied by the fact that all the sites which modify
61 * it do so under some form of transaction critical section, namely:
62 *
63 * - btrfs_start_dirty_block_groups - This function can only ever be
64 * run by one of the transaction committers. Refer to
65 * BTRFS_TRANS_DIRTY_BG_RUN usage in btrfs_commit_transaction
66 *
67 * - btrfs_write_dirty_blockgroups - this is called by
68 * commit_cowonly_roots from transaction critical section
69 * (TRANS_STATE_COMMIT_DOING)
70 *
71 * - btrfs_cleanup_dirty_bgs - called on transaction abort
72 */
Chris Mason1bbc6212015-04-06 12:46:08 -070073 struct list_head io_bgs;
Josef Bacik2b9dbef2015-09-15 10:07:04 -040074 struct list_head dropped_roots;
Nikolay Borisovfe119a62020-01-20 16:09:18 +020075 struct extent_io_tree pinned_extents;
Chris Mason1bbc6212015-04-06 12:46:08 -070076
77 /*
78 * we need to make sure block group deletion doesn't race with
79 * free space cache writeout. This mutex keeps them from stomping
80 * on each other
81 */
82 struct mutex cache_write_mutex;
Josef Bacikce93ec52014-11-17 15:45:48 -050083 spinlock_t dirty_bgs_lock;
Filipe Manana348a0012015-11-27 12:16:16 +000084 /* Protected by spin lock fs_info->unused_bgs_lock. */
Jeff Mahoneye33e17e2015-06-15 09:41:19 -040085 struct list_head deleted_bgs;
Josef Bacik2b9dbef2015-09-15 10:07:04 -040086 spinlock_t dropped_roots_lock;
Chris Mason56bec292009-03-13 10:10:06 -040087 struct btrfs_delayed_ref_root delayed_refs;
Jeff Mahoneyab8d0fc2016-09-20 10:05:02 -040088 struct btrfs_fs_info *fs_info;
Filipe Manana48778172020-08-11 12:43:58 +010089
90 /*
91 * Number of ordered extents the transaction must wait for before
92 * committing. These are ordered extents started by a fast fsync.
93 */
94 atomic_t pending_ordered;
95 wait_queue_head_t pending_wait;
Naohiro Aotad35751562021-02-04 19:21:54 +090096
97 spinlock_t releasing_ebs_lock;
98 struct list_head releasing_ebs;
Chris Mason79154b12007-03-22 15:59:16 -040099};
100
/*
 * Transaction handle type flags.
 *
 * The __TRANS_* names are single-bit values; the TRANS_* names below are
 * built from them.  TRANS_START and TRANS_JOIN additionally carry
 * __TRANS_FREEZABLE, the other types do not.
 */
#define __TRANS_FREEZABLE	(1U << 0)

#define __TRANS_START		(1U << 9)
#define __TRANS_ATTACH		(1U << 10)
#define __TRANS_JOIN		(1U << 11)
#define __TRANS_JOIN_NOLOCK	(1U << 12)
#define __TRANS_DUMMY		(1U << 13)
#define __TRANS_JOIN_NOSTART	(1U << 14)

#define TRANS_START		(__TRANS_START | __TRANS_FREEZABLE)
#define TRANS_ATTACH		(__TRANS_ATTACH)
#define TRANS_JOIN		(__TRANS_JOIN | __TRANS_FREEZABLE)
#define TRANS_JOIN_NOLOCK	(__TRANS_JOIN_NOLOCK)
#define TRANS_JOIN_NOSTART	(__TRANS_JOIN_NOSTART)

/* Mask of the START and ATTACH type bits. */
#define TRANS_EXTWRITERS	(__TRANS_START | __TRANS_ATTACH)
Miao Xiea698d0752012-09-20 01:51:59 -0600117
Chris Masone089f052007-03-16 16:20:31 -0400118struct btrfs_trans_handle {
119 u64 transid;
Yan, Zhengf0486c62010-05-16 10:46:25 -0400120 u64 bytes_reserved;
Filipe Manana4fbcdf62015-05-20 14:01:54 +0100121 u64 chunk_bytes_reserved;
Chris Mason56bec292009-03-13 10:10:06 -0400122 unsigned long delayed_ref_updates;
Yan, Zhengf0486c62010-05-16 10:46:25 -0400123 struct btrfs_transaction *transaction;
124 struct btrfs_block_rsv *block_rsv;
Josef Bacik2a1eb462011-04-13 15:15:59 -0400125 struct btrfs_block_rsv *orig_rsv;
David Sterba1ca4bb62017-11-08 01:54:33 +0100126 refcount_t use_count;
127 unsigned int type;
David Sterbabf31f872020-02-05 17:34:34 +0100128 /*
129 * Error code of transaction abort, set outside of locks and must use
130 * the READ_ONCE/WRITE_ONCE access
131 */
Miao Xiea698d0752012-09-20 01:51:59 -0600132 short aborted;
David Sterba7c2871a2017-11-08 01:07:43 +0100133 bool adding_csums;
Josef Bacikc6b305a2012-12-18 09:16:16 -0500134 bool allocating_chunk;
Filipe Manana79bd3712021-06-29 14:43:06 +0100135 bool removing_chunk;
Miao Xie20dd2cb2013-09-25 21:47:45 +0800136 bool reloc_reserved;
Filipe Mananad0c2f4f2021-01-27 10:35:00 +0000137 bool in_fsync;
Jeff Mahoney64b63582016-06-20 17:23:41 -0400138 struct btrfs_fs_info *fs_info;
Josef Bacikea658ba2012-09-11 16:57:25 -0400139 struct list_head new_bgs;
Chris Masone089f052007-03-16 16:20:31 -0400140};
141
/*
 * The abort status can be changed between calls and is not protected by locks.
 * This accepts btrfs_transaction and btrfs_trans_handle as types. Once it's
 * set to a non-zero value it does not change, so the macro should be used in
 * checks but is not necessary for further reads of the value.
 */
#define TRANS_ABORTED(trans)		(unlikely(READ_ONCE((trans)->aborted)))
149
Chris Mason3063d292008-01-08 15:46:30 -0500150struct btrfs_pending_snapshot {
Chris Mason3de45862008-11-17 21:02:50 -0500151 struct dentry *dentry;
Miao Xiee9662f72013-02-28 10:01:15 +0000152 struct inode *dir;
Chris Mason3063d292008-01-08 15:46:30 -0500153 struct btrfs_root *root;
David Sterbab0c0ea62015-11-10 18:54:00 +0100154 struct btrfs_root_item *root_item;
Yan, Zhenga22285a2010-05-16 10:48:46 -0400155 struct btrfs_root *snap;
Arne Jansen6f72c7e2011-09-14 15:58:21 +0200156 struct btrfs_qgroup_inherit *inherit;
David Sterba8546b572015-11-10 18:54:03 +0100157 struct btrfs_path *path;
Yan, Zhenga22285a2010-05-16 10:48:46 -0400158 /* block reservation for the operation */
159 struct btrfs_block_rsv block_rsv;
Nicholas D Steeves01327612016-05-19 21:18:45 -0400160 /* extra metadata reservation for relocation */
Yan, Zhenga22285a2010-05-16 10:48:46 -0400161 int error;
Qu Wenruo2dfb1e42020-06-16 10:17:36 +0800162 /* Preallocated anonymous block device number */
163 dev_t anon_dev;
Li Zefanb83cc962010-12-20 16:04:08 +0800164 bool readonly;
Chris Mason3063d292008-01-08 15:46:30 -0500165 struct list_head list;
166};
167
Josef Bacik15ee9bc2007-08-10 16:22:09 -0400168static inline void btrfs_set_inode_last_trans(struct btrfs_trans_handle *trans,
Nikolay Borisovd9094412020-06-05 10:41:13 +0300169 struct btrfs_inode *inode)
Josef Bacik15ee9bc2007-08-10 16:22:09 -0400170{
Nikolay Borisovd9094412020-06-05 10:41:13 +0300171 spin_lock(&inode->lock);
172 inode->last_trans = trans->transaction->transid;
173 inode->last_sub_trans = inode->root->log_transid;
Filipe Mananabc0939f2021-02-23 12:08:48 +0000174 inode->last_log_commit = inode->last_sub_trans - 1;
Nikolay Borisovd9094412020-06-05 10:41:13 +0300175 spin_unlock(&inode->lock);
Josef Bacik15ee9bc2007-08-10 16:22:09 -0400176}
177
Qu Wenruo9086db82015-04-20 09:53:50 +0800178/*
179 * Make qgroup codes to skip given qgroupid, means the old/new_roots for
180 * qgroup won't contain the qgroupid in it.
181 */
182static inline void btrfs_set_skip_qgroup(struct btrfs_trans_handle *trans,
183 u64 qgroupid)
184{
185 struct btrfs_delayed_ref_root *delayed_refs;
186
187 delayed_refs = &trans->transaction->delayed_refs;
188 WARN_ON(delayed_refs->qgroup_to_skip);
189 delayed_refs->qgroup_to_skip = qgroupid;
190}
191
192static inline void btrfs_clear_skip_qgroup(struct btrfs_trans_handle *trans)
193{
194 struct btrfs_delayed_ref_root *delayed_refs;
195
196 delayed_refs = &trans->transaction->delayed_refs;
197 WARN_ON(!delayed_refs->qgroup_to_skip);
198 delayed_refs->qgroup_to_skip = 0;
199}
200
Jeff Mahoney3a45bb22016-09-09 21:39:03 -0400201int btrfs_end_transaction(struct btrfs_trans_handle *trans);
Chris Mason79154b12007-03-22 15:59:16 -0400202struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root,
Alexandru Moise5aed1dd2015-09-22 20:59:15 +0000203 unsigned int num_items);
Filipe Manana8eab77f2015-11-13 23:57:16 +0000204struct btrfs_trans_handle *btrfs_start_transaction_fallback_global_rsv(
205 struct btrfs_root *root,
Josef Bacik7f9fe612020-03-13 15:58:05 -0400206 unsigned int num_items);
Josef Bacik7a7eaa42011-04-13 12:54:33 -0400207struct btrfs_trans_handle *btrfs_join_transaction(struct btrfs_root *root);
Nikolay Borisov8d510122019-10-08 20:43:06 +0300208struct btrfs_trans_handle *btrfs_join_transaction_spacecache(struct btrfs_root *root);
Filipe Mananaa6d155d2019-07-29 09:37:10 +0100209struct btrfs_trans_handle *btrfs_join_transaction_nostart(struct btrfs_root *root);
Miao Xie354aa0f2012-09-20 01:54:00 -0600210struct btrfs_trans_handle *btrfs_attach_transaction(struct btrfs_root *root);
Miao Xied4edf392013-02-20 09:17:06 +0000211struct btrfs_trans_handle *btrfs_attach_transaction_barrier(
212 struct btrfs_root *root);
Jeff Mahoney2ff7e612016-06-22 18:54:24 -0400213int btrfs_wait_for_commit(struct btrfs_fs_info *fs_info, u64 transid);
Chris Mason08607c12007-06-08 15:33:54 -0400214
Josef Bacikcfad3922013-07-25 15:11:47 -0400215void btrfs_add_dead_root(struct btrfs_root *root);
Eric Sandeende78b512013-01-31 18:21:12 +0000216int btrfs_defrag_root(struct btrfs_root *root);
David Sterba9d1a2a32013-03-12 15:13:28 +0000217int btrfs_clean_one_deleted_snapshot(struct btrfs_root *root);
Jeff Mahoney3a45bb22016-09-09 21:39:03 -0400218int btrfs_commit_transaction(struct btrfs_trans_handle *trans);
Josef Bacikfdfbf022021-11-05 16:45:28 -0400219void btrfs_commit_transaction_async(struct btrfs_trans_handle *trans);
Jeff Mahoney3a45bb22016-09-09 21:39:03 -0400220int btrfs_end_transaction_throttle(struct btrfs_trans_handle *trans);
Nikolay Borisova2633b62020-11-24 16:49:25 +0200221bool btrfs_should_end_transaction(struct btrfs_trans_handle *trans);
Jeff Mahoney2ff7e612016-06-22 18:54:24 -0400222void btrfs_throttle(struct btrfs_fs_info *fs_info);
Yan Zheng5d4f98a2009-06-10 10:45:14 -0400223int btrfs_record_root_in_trans(struct btrfs_trans_handle *trans,
224 struct btrfs_root *root);
Jeff Mahoney2ff7e612016-06-22 18:54:24 -0400225int btrfs_write_marked_extents(struct btrfs_fs_info *fs_info,
Yan, Zheng8cef4e12009-11-12 09:33:26 +0000226 struct extent_io_tree *dirty_pages, int mark);
Jeff Mahoneybf89d382016-09-09 20:42:44 -0400227int btrfs_wait_tree_log_extents(struct btrfs_root *root, int mark);
Yan, Zheng8929ecfa2010-05-16 10:49:58 -0400228int btrfs_transaction_blocked(struct btrfs_fs_info *info);
Chris Masonf36f3042009-07-30 10:04:48 -0400229int btrfs_transaction_in_commit(struct btrfs_fs_info *info);
Josef Bacik724e2312013-09-30 11:36:38 -0400230void btrfs_put_transaction(struct btrfs_transaction *transaction);
David Sterba572d9ab2014-02-05 15:26:17 +0100231void btrfs_apply_pending_changes(struct btrfs_fs_info *fs_info);
Josef Bacik2b9dbef2015-09-15 10:07:04 -0400232void btrfs_add_dropped_root(struct btrfs_trans_handle *trans,
233 struct btrfs_root *root);
Josef Bacikfb6dea22019-06-19 15:11:59 -0400234void btrfs_trans_release_chunk_metadata(struct btrfs_trans_handle *trans);
David Sterba9888c342018-04-03 19:16:55 +0200235
Chris Masone089f052007-03-16 16:20:31 -0400236#endif