]> git.ipfire.org Git - thirdparty/linux.git/blame - fs/btrfs/transaction.h
btrfs: fix use-after-free after failure to create a snapshot
[thirdparty/linux.git] / fs / btrfs / transaction.h
CommitLineData
9888c340 1/* SPDX-License-Identifier: GPL-2.0 */
6cbd5570
CM
2/*
3 * Copyright (C) 2007 Oracle. All rights reserved.
6cbd5570
CM
4 */
5
9888c340
DS
6#ifndef BTRFS_TRANSACTION_H
7#define BTRFS_TRANSACTION_H
9b64f57d
ER
8
9#include <linux/refcount.h>
31f3c99b 10#include "btrfs_inode.h"
56bec294 11#include "delayed-ref.h"
bed92eae 12#include "ctree.h"
e089f05c 13
/*
 * State of a transaction.
 *
 * TRANS_STATE_MAX is the last enumerator, so its value equals the number of
 * real states declared before it.
 *
 * NOTE(review): presumably a transaction advances through the states in
 * declaration order -- confirm against the commit path.
 */
enum btrfs_trans_state {
	TRANS_STATE_RUNNING,
	TRANS_STATE_COMMIT_START,
	TRANS_STATE_COMMIT_DOING,
	TRANS_STATE_UNBLOCKED,
	TRANS_STATE_SUPER_COMMITTED,
	TRANS_STATE_COMPLETED,
	TRANS_STATE_MAX,
};
23
3204d33c
JB
/*
 * NOTE(review): these look like bit numbers (not masks) for
 * btrfs_transaction::flags -- confirm at the users.
 */
#define BTRFS_TRANS_HAVE_FREE_BGS	0
#define BTRFS_TRANS_DIRTY_BG_RUN	1
#define BTRFS_TRANS_CACHE_ENOSPC	2
3204d33c 27
79154b1b
CM
28struct btrfs_transaction {
29 u64 transid;
0860adfd
MX
30 /*
31 * total external writers(USERSPACE/START/ATTACH) in this
32 * transaction, it must be zero before the transaction is
33 * being committed
34 */
35 atomic_t num_extwriters;
b7ec40d7
CM
36 /*
37 * total writers in this transaction, it must be zero before the
38 * transaction can end
39 */
13c5a93e 40 atomic_t num_writers;
9b64f57d 41 refcount_t use_count;
b7ec40d7 42
3204d33c 43 unsigned long flags;
13212b54 44
4a9d8bde
MX
45 /* Be protected by fs_info->trans_lock when we want to change it. */
46 enum btrfs_trans_state state;
5302e089 47 int aborted;
8fd17795 48 struct list_head list;
d1310b2e 49 struct extent_io_tree dirty_pages;
a944442c 50 time64_t start_time;
79154b1b
CM
51 wait_queue_head_t writer_wait;
52 wait_queue_head_t commit_wait;
3063d29f 53 struct list_head pending_snapshots;
bbbf7243 54 struct list_head dev_update_list;
9e351cc8 55 struct list_head switch_commits;
ce93ec54 56 struct list_head dirty_bgs;
45ae2c18
NB
57
58 /*
59 * There is no explicit lock which protects io_bgs, rather its
60 * consistency is implied by the fact that all the sites which modify
61 * it do so under some form of transaction critical section, namely:
62 *
63 * - btrfs_start_dirty_block_groups - This function can only ever be
64 * run by one of the transaction committers. Refer to
65 * BTRFS_TRANS_DIRTY_BG_RUN usage in btrfs_commit_transaction
66 *
67 * - btrfs_write_dirty_blockgroups - this is called by
68 * commit_cowonly_roots from transaction critical section
69 * (TRANS_STATE_COMMIT_DOING)
70 *
71 * - btrfs_cleanup_dirty_bgs - called on transaction abort
72 */
1bbc621e 73 struct list_head io_bgs;
2b9dbef2 74 struct list_head dropped_roots;
fe119a6e 75 struct extent_io_tree pinned_extents;
1bbc621e
CM
76
77 /*
78 * we need to make sure block group deletion doesn't race with
79 * free space cache writeout. This mutex keeps them from stomping
80 * on each other
81 */
82 struct mutex cache_write_mutex;
ce93ec54 83 spinlock_t dirty_bgs_lock;
348a0013 84 /* Protected by spin lock fs_info->unused_bgs_lock. */
e33e17ee 85 struct list_head deleted_bgs;
2b9dbef2 86 spinlock_t dropped_roots_lock;
56bec294 87 struct btrfs_delayed_ref_root delayed_refs;
ab8d0fc4 88 struct btrfs_fs_info *fs_info;
48778179
FM
89
90 /*
91 * Number of ordered extents the transaction must wait for before
92 * committing. These are ordered extents started by a fast fsync.
93 */
94 atomic_t pending_ordered;
95 wait_queue_head_t pending_wait;
d3575156
NA
96
97 spinlock_t releasing_ebs_lock;
98 struct list_head releasing_ebs;
79154b1b
CM
99};
100
0860adfd
MX
/*
 * Single-bit building blocks for the TRANS_* values below.
 *
 * NOTE(review): presumably these end up in btrfs_trans_handle::type --
 * confirm at the users.
 */
#define __TRANS_FREEZABLE	(1U << 0)

#define __TRANS_START		(1U << 9)
#define __TRANS_ATTACH		(1U << 10)
#define __TRANS_JOIN		(1U << 11)
#define __TRANS_JOIN_NOLOCK	(1U << 12)
#define __TRANS_DUMMY		(1U << 13)
#define __TRANS_JOIN_NOSTART	(1U << 14)

/*
 * Composite values. Only TRANS_START and TRANS_JOIN additionally carry
 * __TRANS_FREEZABLE; the others are the bare bit. __TRANS_DUMMY has no
 * composite counterpart.
 */
#define TRANS_START		(__TRANS_START | __TRANS_FREEZABLE)
#define TRANS_ATTACH		(__TRANS_ATTACH)
#define TRANS_JOIN		(__TRANS_JOIN | __TRANS_FREEZABLE)
#define TRANS_JOIN_NOLOCK	(__TRANS_JOIN_NOLOCK)
#define TRANS_JOIN_NOSTART	(__TRANS_JOIN_NOSTART)

/* Mask matching the START and ATTACH bits. */
#define TRANS_EXTWRITERS	(__TRANS_START | __TRANS_ATTACH)
a698d075 117
e089f05c
CM
118struct btrfs_trans_handle {
119 u64 transid;
f0486c68 120 u64 bytes_reserved;
4fbcdf66 121 u64 chunk_bytes_reserved;
56bec294 122 unsigned long delayed_ref_updates;
f0486c68
YZ
123 struct btrfs_transaction *transaction;
124 struct btrfs_block_rsv *block_rsv;
2a1eb461 125 struct btrfs_block_rsv *orig_rsv;
28b21c55
FM
126 /* Set by a task that wants to create a snapshot. */
127 struct btrfs_pending_snapshot *pending_snapshot;
1ca4bb63
DS
128 refcount_t use_count;
129 unsigned int type;
bf31f87f
DS
130 /*
131 * Error code of transaction abort, set outside of locks and must use
132 * the READ_ONCE/WRITE_ONCE access
133 */
a698d075 134 short aborted;
7c2871a2 135 bool adding_csums;
c6b305a8 136 bool allocating_chunk;
79bd3712 137 bool removing_chunk;
20dd2cbf 138 bool reloc_reserved;
d0c2f4fa 139 bool in_fsync;
64b63580 140 struct btrfs_fs_info *fs_info;
ea658bad 141 struct list_head new_bgs;
e089f05c
CM
142};
143
bf31f87f
DS
/*
 * The abort status can be changed between calls and is not protected by locks.
 * This accepts btrfs_transaction and btrfs_trans_handle as types. Once it's
 * set to a non-zero value it does not change, so the macro should be used in
 * checks but is not necessary for further reads of the value.
 *
 * @trans is evaluated exactly once.
 */
#define TRANS_ABORTED(trans)		(unlikely(READ_ONCE((trans)->aborted)))
151
3063d29f 152struct btrfs_pending_snapshot {
3de4586c 153 struct dentry *dentry;
e9662f70 154 struct inode *dir;
3063d29f 155 struct btrfs_root *root;
b0c0ea63 156 struct btrfs_root_item *root_item;
a22285a6 157 struct btrfs_root *snap;
6f72c7e2 158 struct btrfs_qgroup_inherit *inherit;
8546b570 159 struct btrfs_path *path;
a22285a6
YZ
160 /* block reservation for the operation */
161 struct btrfs_block_rsv block_rsv;
01327610 162 /* extra metadata reservation for relocation */
a22285a6 163 int error;
2dfb1e43
QW
164 /* Preallocated anonymous block device number */
165 dev_t anon_dev;
b83cc969 166 bool readonly;
3063d29f
CM
167 struct list_head list;
168};
169
15ee9bc7 170static inline void btrfs_set_inode_last_trans(struct btrfs_trans_handle *trans,
d9094414 171 struct btrfs_inode *inode)
15ee9bc7 172{
d9094414
NB
173 spin_lock(&inode->lock);
174 inode->last_trans = trans->transaction->transid;
175 inode->last_sub_trans = inode->root->log_transid;
bc0939fc 176 inode->last_log_commit = inode->last_sub_trans - 1;
d9094414 177 spin_unlock(&inode->lock);
15ee9bc7
JB
178}
179
9086db86
QW
180/*
181 * Make qgroup codes to skip given qgroupid, means the old/new_roots for
182 * qgroup won't contain the qgroupid in it.
183 */
184static inline void btrfs_set_skip_qgroup(struct btrfs_trans_handle *trans,
185 u64 qgroupid)
186{
187 struct btrfs_delayed_ref_root *delayed_refs;
188
189 delayed_refs = &trans->transaction->delayed_refs;
190 WARN_ON(delayed_refs->qgroup_to_skip);
191 delayed_refs->qgroup_to_skip = qgroupid;
192}
193
194static inline void btrfs_clear_skip_qgroup(struct btrfs_trans_handle *trans)
195{
196 struct btrfs_delayed_ref_root *delayed_refs;
197
198 delayed_refs = &trans->transaction->delayed_refs;
199 WARN_ON(!delayed_refs->qgroup_to_skip);
200 delayed_refs->qgroup_to_skip = 0;
201}
202
3a45bb20 203int btrfs_end_transaction(struct btrfs_trans_handle *trans);
79154b1b 204struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root,
5aed1dd8 205 unsigned int num_items);
8eab77ff
FM
206struct btrfs_trans_handle *btrfs_start_transaction_fallback_global_rsv(
207 struct btrfs_root *root,
7f9fe614 208 unsigned int num_items);
7a7eaa40 209struct btrfs_trans_handle *btrfs_join_transaction(struct btrfs_root *root);
8d510121 210struct btrfs_trans_handle *btrfs_join_transaction_spacecache(struct btrfs_root *root);
a6d155d2 211struct btrfs_trans_handle *btrfs_join_transaction_nostart(struct btrfs_root *root);
354aa0fb 212struct btrfs_trans_handle *btrfs_attach_transaction(struct btrfs_root *root);
d4edf39b
MX
213struct btrfs_trans_handle *btrfs_attach_transaction_barrier(
214 struct btrfs_root *root);
2ff7e61e 215int btrfs_wait_for_commit(struct btrfs_fs_info *fs_info, u64 transid);
08607c1b 216
cfad392b 217void btrfs_add_dead_root(struct btrfs_root *root);
de78b51a 218int btrfs_defrag_root(struct btrfs_root *root);
9d1a2a3a 219int btrfs_clean_one_deleted_snapshot(struct btrfs_root *root);
3a45bb20 220int btrfs_commit_transaction(struct btrfs_trans_handle *trans);
fdfbf020 221void btrfs_commit_transaction_async(struct btrfs_trans_handle *trans);
3a45bb20 222int btrfs_end_transaction_throttle(struct btrfs_trans_handle *trans);
a2633b6a 223bool btrfs_should_end_transaction(struct btrfs_trans_handle *trans);
2ff7e61e 224void btrfs_throttle(struct btrfs_fs_info *fs_info);
5d4f98a2
YZ
225int btrfs_record_root_in_trans(struct btrfs_trans_handle *trans,
226 struct btrfs_root *root);
2ff7e61e 227int btrfs_write_marked_extents(struct btrfs_fs_info *fs_info,
8cef4e16 228 struct extent_io_tree *dirty_pages, int mark);
bf89d38f 229int btrfs_wait_tree_log_extents(struct btrfs_root *root, int mark);
8929ecfa 230int btrfs_transaction_blocked(struct btrfs_fs_info *info);
f36f3042 231int btrfs_transaction_in_commit(struct btrfs_fs_info *info);
724e2315 232void btrfs_put_transaction(struct btrfs_transaction *transaction);
572d9ab7 233void btrfs_apply_pending_changes(struct btrfs_fs_info *fs_info);
2b9dbef2
JB
234void btrfs_add_dropped_root(struct btrfs_trans_handle *trans,
235 struct btrfs_root *root);
fb6dea26 236void btrfs_trans_release_chunk_metadata(struct btrfs_trans_handle *trans);
9888c340 237
e089f05c 238#endif