]>
Commit | Line | Data |
---|---|---|
d8a5ba45 MS |
1 | /* |
2 | FUSE: Filesystem in Userspace | |
1729a16c | 3 | Copyright (C) 2001-2008 Miklos Szeredi <miklos@szeredi.hu> |
d8a5ba45 MS |
4 | |
5 | This program can be distributed under the terms of the GNU GPL. | |
6 | See the file COPYING. | |
7 | */ | |
8 | ||
9 | #include "fuse_i.h" | |
10 | ||
11 | #include <linux/pagemap.h> | |
12 | #include <linux/slab.h> | |
13 | #include <linux/file.h> | |
d8a5ba45 MS |
14 | #include <linux/seq_file.h> |
15 | #include <linux/init.h> | |
16 | #include <linux/module.h> | |
487ea5af | 17 | #include <linux/moduleparam.h> |
c30da2e9 DH |
18 | #include <linux/fs_context.h> |
19 | #include <linux/fs_parser.h> | |
d8a5ba45 | 20 | #include <linux/statfs.h> |
9c8ef561 | 21 | #include <linux/random.h> |
e8edc6e0 | 22 | #include <linux/sched.h> |
dbd561d2 | 23 | #include <linux/exportfs.h> |
60bcc88a | 24 | #include <linux/posix_acl.h> |
0b6e9ea0 | 25 | #include <linux/pid_namespace.h> |
c086df49 | 26 | #include <uapi/linux/magic.h> |
d8a5ba45 MS |
27 | |
28 | MODULE_AUTHOR("Miklos Szeredi <miklos@szeredi.hu>"); | |
29 | MODULE_DESCRIPTION("Filesystem in Userspace"); | |
30 | MODULE_LICENSE("GPL"); | |
31 | ||
e18b890b | 32 | static struct kmem_cache *fuse_inode_cachep; |
bafa9654 MS |
33 | struct list_head fuse_conn_list; |
34 | DEFINE_MUTEX(fuse_mutex); | |
d8a5ba45 | 35 | |
e4dca7b7 | 36 | static int set_global_limit(const char *val, const struct kernel_param *kp); |
487ea5af | 37 | |
79a9d994 | 38 | unsigned max_user_bgreq; |
487ea5af CH |
39 | module_param_call(max_user_bgreq, set_global_limit, param_get_uint, |
40 | &max_user_bgreq, 0644); | |
41 | __MODULE_PARM_TYPE(max_user_bgreq, "uint"); | |
42 | MODULE_PARM_DESC(max_user_bgreq, | |
43 | "Global limit for the maximum number of backgrounded requests an " | |
44 | "unprivileged user can set"); | |
45 | ||
79a9d994 | 46 | unsigned max_user_congthresh; |
487ea5af CH |
47 | module_param_call(max_user_congthresh, set_global_limit, param_get_uint, |
48 | &max_user_congthresh, 0644); | |
49 | __MODULE_PARM_TYPE(max_user_congthresh, "uint"); | |
50 | MODULE_PARM_DESC(max_user_congthresh, | |
51 | "Global limit for the maximum congestion threshold an " | |
52 | "unprivileged user can set"); | |
53 | ||
/*
 * Default block size.  fuse_show_options() only prints "blksize=" when the
 * superblock's block size differs from this value.
 */
#define FUSE_DEFAULT_BLKSIZE 512

/** Maximum number of outstanding background requests */
#define FUSE_DEFAULT_MAX_BACKGROUND 12

/** Congestion starts at 75% of maximum */
#define FUSE_DEFAULT_CONGESTION_THRESHOLD (FUSE_DEFAULT_MAX_BACKGROUND * 3 / 4)

#ifdef CONFIG_BLOCK
/* Forward declaration, only available when CONFIG_BLOCK is set. */
static struct file_system_type fuseblk_fs_type;
#endif
65 | ||
a2daff68 | 66 | struct fuse_forget_link *fuse_alloc_forget(void) |
07e77dca | 67 | { |
dc69e98c | 68 | return kzalloc(sizeof(struct fuse_forget_link), GFP_KERNEL_ACCOUNT); |
07e77dca MS |
69 | } |
70 | ||
c4d361f6 KJ |
71 | static struct fuse_submount_lookup *fuse_alloc_submount_lookup(void) |
72 | { | |
73 | struct fuse_submount_lookup *sl; | |
74 | ||
75 | sl = kzalloc(sizeof(struct fuse_submount_lookup), GFP_KERNEL_ACCOUNT); | |
76 | if (!sl) | |
77 | return NULL; | |
78 | sl->forget = fuse_alloc_forget(); | |
79 | if (!sl->forget) | |
80 | goto out_free; | |
81 | ||
82 | return sl; | |
83 | ||
84 | out_free: | |
85 | kfree(sl); | |
86 | return NULL; | |
87 | } | |
88 | ||
d8a5ba45 MS |
89 | static struct inode *fuse_alloc_inode(struct super_block *sb) |
90 | { | |
d8a5ba45 MS |
91 | struct fuse_inode *fi; |
92 | ||
fd60b288 | 93 | fi = alloc_inode_sb(sb, fuse_inode_cachep, GFP_KERNEL); |
9031a69c | 94 | if (!fi) |
d8a5ba45 MS |
95 | return NULL; |
96 | ||
0a0898cf | 97 | fi->i_time = 0; |
d3045530 | 98 | fi->inval_mask = ~0; |
d8a5ba45 | 99 | fi->nodeid = 0; |
9e6268db | 100 | fi->nlookup = 0; |
fbee36b9 | 101 | fi->attr_version = 0; |
45c72cd7 | 102 | fi->orig_ino = 0; |
4582a4ab | 103 | fi->state = 0; |
c4d361f6 | 104 | fi->submount_lookup = NULL; |
5c672ab3 | 105 | mutex_init(&fi->mutex); |
f15ecfef | 106 | spin_lock_init(&fi->lock); |
07e77dca | 107 | fi->forget = fuse_alloc_forget(); |
c2d0ad00 VG |
108 | if (!fi->forget) |
109 | goto out_free; | |
110 | ||
111 | if (IS_ENABLED(CONFIG_FUSE_DAX) && !fuse_dax_inode_alloc(sb, fi)) | |
112 | goto out_free_forget; | |
d8a5ba45 | 113 | |
7dc4e97a AG |
114 | if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH)) |
115 | fuse_inode_backing_set(fi, NULL); | |
116 | ||
9031a69c | 117 | return &fi->inode; |
c2d0ad00 VG |
118 | |
119 | out_free_forget: | |
120 | kfree(fi->forget); | |
121 | out_free: | |
122 | kmem_cache_free(fuse_inode_cachep, fi); | |
123 | return NULL; | |
d8a5ba45 MS |
124 | } |
125 | ||
9baf28bb | 126 | static void fuse_free_inode(struct inode *inode) |
d8a5ba45 | 127 | { |
e5e5558e | 128 | struct fuse_inode *fi = get_fuse_inode(inode); |
9baf28bb | 129 | |
5c672ab3 | 130 | mutex_destroy(&fi->mutex); |
07e77dca | 131 | kfree(fi->forget); |
c2d0ad00 VG |
132 | #ifdef CONFIG_FUSE_DAX |
133 | kfree(fi->dax); | |
134 | #endif | |
7dc4e97a AG |
135 | if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH)) |
136 | fuse_backing_put(fuse_inode_backing(fi)); | |
137 | ||
9baf28bb | 138 | kmem_cache_free(fuse_inode_cachep, fi); |
d8a5ba45 MS |
139 | } |
140 | ||
c4d361f6 KJ |
141 | static void fuse_cleanup_submount_lookup(struct fuse_conn *fc, |
142 | struct fuse_submount_lookup *sl) | |
143 | { | |
144 | if (!refcount_dec_and_test(&sl->count)) | |
145 | return; | |
146 | ||
147 | fuse_queue_forget(fc, sl->forget, sl->nodeid, 1); | |
148 | sl->forget = NULL; | |
149 | kfree(sl); | |
150 | } | |
151 | ||
b57922d9 | 152 | static void fuse_evict_inode(struct inode *inode) |
d8a5ba45 | 153 | { |
9baf28bb AV |
154 | struct fuse_inode *fi = get_fuse_inode(inode); |
155 | ||
5c791fe1 MS |
156 | /* Will write inode on close/munmap and in all other dirtiers */ |
157 | WARN_ON(inode->i_state & I_DIRTY_INODE); | |
158 | ||
91b0abe3 | 159 | truncate_inode_pages_final(&inode->i_data); |
dbd5768f | 160 | clear_inode(inode); |
1751e8a6 | 161 | if (inode->i_sb->s_flags & SB_ACTIVE) { |
1e9a4ed9 | 162 | struct fuse_conn *fc = get_fuse_conn(inode); |
c2d0ad00 VG |
163 | |
164 | if (FUSE_IS_DAX(inode)) | |
165 | fuse_dax_inode_cleanup(inode); | |
1866d779 MR |
166 | if (fi->nlookup) { |
167 | fuse_queue_forget(fc, fi->forget, fi->nodeid, | |
168 | fi->nlookup); | |
169 | fi->forget = NULL; | |
170 | } | |
c4d361f6 KJ |
171 | |
172 | if (fi->submount_lookup) { | |
173 | fuse_cleanup_submount_lookup(fc, fi->submount_lookup); | |
174 | fi->submount_lookup = NULL; | |
175 | } | |
e5e5558e | 176 | } |
5d069dbe | 177 | if (S_ISREG(inode->i_mode) && !fuse_is_bad(inode)) { |
9baf28bb AV |
178 | WARN_ON(!list_empty(&fi->write_files)); |
179 | WARN_ON(!list_empty(&fi->queued_writes)); | |
180 | } | |
d8a5ba45 MS |
181 | } |
182 | ||
84c21507 | 183 | static int fuse_reconfigure(struct fs_context *fsc) |
71421259 | 184 | { |
84c21507 | 185 | struct super_block *sb = fsc->root->d_sb; |
0189a2d3 | 186 | |
02b9984d | 187 | sync_filesystem(sb); |
84c21507 | 188 | if (fsc->sb_flags & SB_MANDLOCK) |
71421259 MS |
189 | return -EINVAL; |
190 | ||
191 | return 0; | |
192 | } | |
193 | ||
45c72cd7 PS |
194 | /* |
195 | * ino_t is 32-bits on 32-bit arch. We have to squash the 64-bit value down | |
196 | * so that it will fit. | |
197 | */ | |
198 | static ino_t fuse_squash_ino(u64 ino64) | |
199 | { | |
200 | ino_t ino = (ino_t) ino64; | |
201 | if (sizeof(ino_t) < sizeof(u64)) | |
202 | ino ^= ino64 >> (sizeof(u64) - sizeof(ino_t)) * 8; | |
203 | return ino; | |
204 | } | |
205 | ||
3be5a52b | 206 | void fuse_change_attributes_common(struct inode *inode, struct fuse_attr *attr, |
972f4c46 | 207 | struct fuse_statx *sx, |
4b52f059 | 208 | u64 attr_valid, u32 cache_mask) |
d8a5ba45 | 209 | { |
9ffbb916 | 210 | struct fuse_conn *fc = get_fuse_conn(inode); |
ebc14c4d | 211 | struct fuse_inode *fi = get_fuse_inode(inode); |
d8a5ba45 | 212 | |
f15ecfef KT |
213 | lockdep_assert_held(&fi->lock); |
214 | ||
4510d86f | 215 | fi->attr_version = atomic64_inc_return(&fc->attr_version); |
1fb69e78 | 216 | fi->i_time = attr_valid; |
d3045530 MS |
217 | /* Clear basic stats from invalid mask */ |
218 | set_mask_bits(&fi->inval_mask, STATX_BASIC_STATS, 0); | |
1fb69e78 | 219 | |
45c72cd7 | 220 | inode->i_ino = fuse_squash_ino(attr->ino); |
ebc14c4d | 221 | inode->i_mode = (inode->i_mode & S_IFMT) | (attr->mode & 07777); |
bfe86848 | 222 | set_nlink(inode, attr->nlink); |
8cb08329 EB |
223 | inode->i_uid = make_kuid(fc->user_ns, attr->uid); |
224 | inode->i_gid = make_kgid(fc->user_ns, attr->gid); | |
d8a5ba45 | 225 | inode->i_blocks = attr->blocks; |
47912eaa MS |
226 | |
227 | /* Sanitize nsecs */ | |
228 | attr->atimensec = min_t(u32, attr->atimensec, NSEC_PER_SEC - 1); | |
229 | attr->mtimensec = min_t(u32, attr->mtimensec, NSEC_PER_SEC - 1); | |
230 | attr->ctimensec = min_t(u32, attr->ctimensec, NSEC_PER_SEC - 1); | |
231 | ||
3c0d5df2 | 232 | inode_set_atime(inode, attr->atime, attr->atimensec); |
b0aa7606 | 233 | /* mtime from server may be stale due to local buffered write */ |
4b52f059 | 234 | if (!(cache_mask & STATX_MTIME)) { |
3c0d5df2 | 235 | inode_set_mtime(inode, attr->mtime, attr->mtimensec); |
4b52f059 MS |
236 | } |
237 | if (!(cache_mask & STATX_CTIME)) { | |
ceb2d5e9 | 238 | inode_set_ctime(inode, attr->ctime, attr->ctimensec); |
b0aa7606 | 239 | } |
972f4c46 MS |
240 | if (sx) { |
241 | /* Sanitize nsecs */ | |
242 | sx->btime.tv_nsec = | |
243 | min_t(u32, sx->btime.tv_nsec, NSEC_PER_SEC - 1); | |
244 | ||
245 | /* | |
246 | * Btime has been queried, cache is valid (whether or not btime | |
247 | * is available or not) so clear STATX_BTIME from inval_mask. | |
248 | * | |
249 | * Availability of the btime attribute is indicated in | |
250 | * FUSE_I_BTIME | |
251 | */ | |
252 | set_mask_bits(&fi->inval_mask, STATX_BTIME, 0); | |
253 | if (sx->mask & STATX_BTIME) { | |
254 | set_bit(FUSE_I_BTIME, &fi->state); | |
255 | fi->i_btime.tv_sec = sx->btime.tv_sec; | |
256 | fi->i_btime.tv_nsec = sx->btime.tv_nsec; | |
257 | } | |
258 | } | |
e00d2c2d | 259 | |
0e9663ee MS |
260 | if (attr->blksize != 0) |
261 | inode->i_blkbits = ilog2(attr->blksize); | |
262 | else | |
263 | inode->i_blkbits = inode->i_sb->s_blocksize_bits; | |
264 | ||
ebc14c4d MS |
265 | /* |
266 | * Don't set the sticky bit in i_mode, unless we want the VFS | |
267 | * to check permissions. This prevents failures due to the | |
268 | * check in may_delete(). | |
269 | */ | |
270 | fi->orig_i_mode = inode->i_mode; | |
29433a29 | 271 | if (!fc->default_permissions) |
ebc14c4d | 272 | inode->i_mode &= ~S_ISVTX; |
45c72cd7 PS |
273 | |
274 | fi->orig_ino = attr->ino; | |
9d769e6a VG |
275 | |
276 | /* | |
277 | * We are refreshing inode data and it is possible that another | |
278 | * client set suid/sgid or security.capability xattr. So clear | |
279 | * S_NOSEC. Ideally, we could have cleared it only if suid/sgid | |
280 | * was set or if security.capability xattr was set. But we don't | |
281 | * know if security.capability has been set or not. So clear it | |
282 | * anyway. Its less efficient but should be safe. | |
283 | */ | |
284 | inode->i_flags &= ~S_NOSEC; | |
3be5a52b MS |
285 | } |
286 | ||
4b52f059 MS |
287 | u32 fuse_get_cache_mask(struct inode *inode) |
288 | { | |
289 | struct fuse_conn *fc = get_fuse_conn(inode); | |
290 | ||
291 | if (!fc->writeback_cache || !S_ISREG(inode->i_mode)) | |
292 | return 0; | |
293 | ||
294 | return STATX_MTIME | STATX_CTIME | STATX_SIZE; | |
295 | } | |
296 | ||
3be5a52b | 297 | void fuse_change_attributes(struct inode *inode, struct fuse_attr *attr, |
972f4c46 | 298 | struct fuse_statx *sx, |
3be5a52b MS |
299 | u64 attr_valid, u64 attr_version) |
300 | { | |
301 | struct fuse_conn *fc = get_fuse_conn(inode); | |
302 | struct fuse_inode *fi = get_fuse_inode(inode); | |
4b52f059 | 303 | u32 cache_mask; |
3be5a52b | 304 | loff_t oldsize; |
a64ba10f | 305 | struct timespec64 old_mtime; |
3be5a52b | 306 | |
f15ecfef | 307 | spin_lock(&fi->lock); |
04d82db0 MS |
308 | /* |
309 | * In case of writeback_cache enabled, writes update mtime, ctime and | |
310 | * may update i_size. In these cases trust the cached value in the | |
311 | * inode. | |
312 | */ | |
4b52f059 MS |
313 | cache_mask = fuse_get_cache_mask(inode); |
314 | if (cache_mask & STATX_SIZE) | |
04d82db0 | 315 | attr->size = i_size_read(inode); |
4b52f059 MS |
316 | |
317 | if (cache_mask & STATX_MTIME) { | |
3c0d5df2 JL |
318 | attr->mtime = inode_get_mtime_sec(inode); |
319 | attr->mtimensec = inode_get_mtime_nsec(inode); | |
4b52f059 MS |
320 | } |
321 | if (cache_mask & STATX_CTIME) { | |
3c0d5df2 JL |
322 | attr->ctime = inode_get_ctime_sec(inode); |
323 | attr->ctimensec = inode_get_ctime_nsec(inode); | |
04d82db0 MS |
324 | } |
325 | ||
06a7c3c2 MP |
326 | if ((attr_version != 0 && fi->attr_version > attr_version) || |
327 | test_bit(FUSE_I_SIZE_UNSTABLE, &fi->state)) { | |
f15ecfef | 328 | spin_unlock(&fi->lock); |
3be5a52b MS |
329 | return; |
330 | } | |
331 | ||
3c0d5df2 | 332 | old_mtime = inode_get_mtime(inode); |
972f4c46 | 333 | fuse_change_attributes_common(inode, attr, sx, attr_valid, cache_mask); |
ebc14c4d | 334 | |
e00d2c2d | 335 | oldsize = inode->i_size; |
8373200b PE |
336 | /* |
337 | * In case of writeback_cache enabled, the cached writes beyond EOF | |
338 | * extend local i_size without keeping userspace server in sync. So, | |
339 | * attr->size coming from server can be stale. We cannot trust it. | |
340 | */ | |
4b52f059 | 341 | if (!(cache_mask & STATX_SIZE)) |
8373200b | 342 | i_size_write(inode, attr->size); |
f15ecfef | 343 | spin_unlock(&fi->lock); |
e00d2c2d | 344 | |
4b52f059 | 345 | if (!cache_mask && S_ISREG(inode->i_mode)) { |
eed2179e BF |
346 | bool inval = false; |
347 | ||
348 | if (oldsize != attr->size) { | |
7caef267 | 349 | truncate_pagecache(inode, attr->size); |
ad2ba64d KS |
350 | if (!fc->explicit_inval_data) |
351 | inval = true; | |
eed2179e | 352 | } else if (fc->auto_inval_data) { |
a64ba10f | 353 | struct timespec64 new_mtime = { |
eed2179e BF |
354 | .tv_sec = attr->mtime, |
355 | .tv_nsec = attr->mtimensec, | |
356 | }; | |
357 | ||
358 | /* | |
359 | * Auto inval mode also checks and invalidates if mtime | |
360 | * has changed. | |
361 | */ | |
a64ba10f | 362 | if (!timespec64_equal(&old_mtime, &new_mtime)) |
eed2179e BF |
363 | inval = true; |
364 | } | |
365 | ||
366 | if (inval) | |
367 | invalidate_inode_pages2(inode->i_mapping); | |
e00d2c2d | 368 | } |
c3cb6f93 JX |
369 | |
370 | if (IS_ENABLED(CONFIG_FUSE_DAX)) | |
371 | fuse_dax_dontcache(inode, attr->flags); | |
d8a5ba45 MS |
372 | } |
373 | ||
c4d361f6 KJ |
374 | static void fuse_init_submount_lookup(struct fuse_submount_lookup *sl, |
375 | u64 nodeid) | |
376 | { | |
377 | sl->nodeid = nodeid; | |
378 | refcount_set(&sl->count, 1); | |
379 | } | |
380 | ||
facd6105 CB |
381 | static void fuse_init_inode(struct inode *inode, struct fuse_attr *attr, |
382 | struct fuse_conn *fc) | |
d8a5ba45 MS |
383 | { |
384 | inode->i_mode = attr->mode & S_IFMT; | |
9ffbb916 | 385 | inode->i_size = attr->size; |
3c0d5df2 | 386 | inode_set_mtime(inode, attr->mtime, attr->mtimensec); |
ceb2d5e9 | 387 | inode_set_ctime(inode, attr->ctime, attr->ctimensec); |
e5e5558e MS |
388 | if (S_ISREG(inode->i_mode)) { |
389 | fuse_init_common(inode); | |
93a497b9 | 390 | fuse_init_file_inode(inode, attr->flags); |
e5e5558e MS |
391 | } else if (S_ISDIR(inode->i_mode)) |
392 | fuse_init_dir(inode); | |
393 | else if (S_ISLNK(inode->i_mode)) | |
394 | fuse_init_symlink(inode); | |
395 | else if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode) || | |
396 | S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) { | |
397 | fuse_init_common(inode); | |
398 | init_special_inode(inode, inode->i_mode, | |
399 | new_decode_dev(attr->rdev)); | |
39ee059a MS |
400 | } else |
401 | BUG(); | |
facd6105 CB |
402 | /* |
403 | * Ensure that we don't cache acls for daemons without FUSE_POSIX_ACL | |
404 | * so they see the exact same behavior as before. | |
405 | */ | |
406 | if (!fc->posix_acl) | |
407 | inode->i_acl = inode->i_default_acl = ACL_DONT_CACHE; | |
d8a5ba45 MS |
408 | } |
409 | ||
fcee216b | 410 | static int fuse_inode_eq(struct inode *inode, void *_nodeidp) |
d8a5ba45 | 411 | { |
b48badf0 | 412 | u64 nodeid = *(u64 *) _nodeidp; |
d8a5ba45 MS |
413 | if (get_node_id(inode) == nodeid) |
414 | return 1; | |
415 | else | |
416 | return 0; | |
417 | } | |
418 | ||
419 | static int fuse_inode_set(struct inode *inode, void *_nodeidp) | |
420 | { | |
b48badf0 | 421 | u64 nodeid = *(u64 *) _nodeidp; |
d8a5ba45 MS |
422 | get_fuse_inode(inode)->nodeid = nodeid; |
423 | return 0; | |
424 | } | |
425 | ||
b48badf0 | 426 | struct inode *fuse_iget(struct super_block *sb, u64 nodeid, |
1fb69e78 MS |
427 | int generation, struct fuse_attr *attr, |
428 | u64 attr_valid, u64 attr_version) | |
d8a5ba45 MS |
429 | { |
430 | struct inode *inode; | |
9e6268db | 431 | struct fuse_inode *fi; |
d8a5ba45 | 432 | struct fuse_conn *fc = get_fuse_conn_super(sb); |
d8a5ba45 | 433 | |
bf109c64 MR |
434 | /* |
435 | * Auto mount points get their node id from the submount root, which is | |
436 | * not a unique identifier within this filesystem. | |
437 | * | |
438 | * To avoid conflicts, do not place submount points into the inode hash | |
439 | * table. | |
440 | */ | |
441 | if (fc->auto_submounts && (attr->flags & FUSE_ATTR_SUBMOUNT) && | |
442 | S_ISDIR(attr->mode)) { | |
c4d361f6 KJ |
443 | struct fuse_inode *fi; |
444 | ||
bf109c64 MR |
445 | inode = new_inode(sb); |
446 | if (!inode) | |
447 | return NULL; | |
448 | ||
facd6105 | 449 | fuse_init_inode(inode, attr, fc); |
c4d361f6 KJ |
450 | fi = get_fuse_inode(inode); |
451 | fi->nodeid = nodeid; | |
452 | fi->submount_lookup = fuse_alloc_submount_lookup(); | |
453 | if (!fi->submount_lookup) { | |
454 | iput(inode); | |
455 | return NULL; | |
456 | } | |
457 | /* Sets nlookup = 1 on fi->submount_lookup->nlookup */ | |
458 | fuse_init_submount_lookup(fi->submount_lookup, nodeid); | |
bf109c64 MR |
459 | inode->i_flags |= S_AUTOMOUNT; |
460 | goto done; | |
461 | } | |
462 | ||
463 | retry: | |
d8a5ba45 MS |
464 | inode = iget5_locked(sb, nodeid, fuse_inode_eq, fuse_inode_set, &nodeid); |
465 | if (!inode) | |
466 | return NULL; | |
467 | ||
468 | if ((inode->i_state & I_NEW)) { | |
b0aa7606 | 469 | inode->i_flags |= S_NOATIME; |
d31433c8 | 470 | if (!fc->writeback_cache || !S_ISREG(attr->mode)) |
b0aa7606 | 471 | inode->i_flags |= S_NOCMTIME; |
d8a5ba45 | 472 | inode->i_generation = generation; |
facd6105 | 473 | fuse_init_inode(inode, attr, fc); |
d8a5ba45 | 474 | unlock_new_inode(inode); |
15db1683 AG |
475 | } else if (fuse_stale_inode(inode, generation, attr)) { |
476 | /* nodeid was reused, any I/O on the old inode should fail */ | |
5d069dbe | 477 | fuse_make_bad(inode); |
d8a5ba45 | 478 | iput(inode); |
d8a5ba45 MS |
479 | goto retry; |
480 | } | |
9e6268db | 481 | fi = get_fuse_inode(inode); |
c9d8f5f0 | 482 | spin_lock(&fi->lock); |
1729a16c | 483 | fi->nlookup++; |
c9d8f5f0 | 484 | spin_unlock(&fi->lock); |
c4d361f6 | 485 | done: |
972f4c46 | 486 | fuse_change_attributes(inode, attr, NULL, attr_valid, attr_version); |
1fb69e78 | 487 | |
d8a5ba45 MS |
488 | return inode; |
489 | } | |
490 | ||
fcee216b MR |
491 | struct inode *fuse_ilookup(struct fuse_conn *fc, u64 nodeid, |
492 | struct fuse_mount **fm) | |
493 | { | |
494 | struct fuse_mount *fm_iter; | |
495 | struct inode *inode; | |
496 | ||
497 | WARN_ON(!rwsem_is_locked(&fc->killsb)); | |
498 | list_for_each_entry(fm_iter, &fc->mounts, fc_entry) { | |
499 | if (!fm_iter->sb) | |
500 | continue; | |
501 | ||
502 | inode = ilookup5(fm_iter->sb, nodeid, fuse_inode_eq, &nodeid); | |
503 | if (inode) { | |
504 | if (fm) | |
505 | *fm = fm_iter; | |
506 | return inode; | |
507 | } | |
508 | } | |
509 | ||
510 | return NULL; | |
511 | } | |
512 | ||
513 | int fuse_reverse_inval_inode(struct fuse_conn *fc, u64 nodeid, | |
3b463ae0 JM |
514 | loff_t offset, loff_t len) |
515 | { | |
5ddd9ced | 516 | struct fuse_inode *fi; |
3b463ae0 JM |
517 | struct inode *inode; |
518 | pgoff_t pg_start; | |
519 | pgoff_t pg_end; | |
520 | ||
fcee216b | 521 | inode = fuse_ilookup(fc, nodeid, NULL); |
3b463ae0 JM |
522 | if (!inode) |
523 | return -ENOENT; | |
524 | ||
5ddd9ced MS |
525 | fi = get_fuse_inode(inode); |
526 | spin_lock(&fi->lock); | |
527 | fi->attr_version = atomic64_inc_return(&fc->attr_version); | |
528 | spin_unlock(&fi->lock); | |
529 | ||
3b463ae0 | 530 | fuse_invalidate_attr(inode); |
60bcc88a | 531 | forget_all_cached_acls(inode); |
3b463ae0 | 532 | if (offset >= 0) { |
09cbfeaf | 533 | pg_start = offset >> PAGE_SHIFT; |
3b463ae0 JM |
534 | if (len <= 0) |
535 | pg_end = -1; | |
536 | else | |
09cbfeaf | 537 | pg_end = (offset + len - 1) >> PAGE_SHIFT; |
3b463ae0 JM |
538 | invalidate_inode_pages2_range(inode->i_mapping, |
539 | pg_start, pg_end); | |
540 | } | |
541 | iput(inode); | |
542 | return 0; | |
543 | } | |
544 | ||
63576c13 | 545 | bool fuse_lock_inode(struct inode *inode) |
5c672ab3 | 546 | { |
63576c13 MS |
547 | bool locked = false; |
548 | ||
549 | if (!get_fuse_conn(inode)->parallel_dirops) { | |
5c672ab3 | 550 | mutex_lock(&get_fuse_inode(inode)->mutex); |
63576c13 MS |
551 | locked = true; |
552 | } | |
553 | ||
554 | return locked; | |
5c672ab3 MS |
555 | } |
556 | ||
63576c13 | 557 | void fuse_unlock_inode(struct inode *inode, bool locked) |
5c672ab3 | 558 | { |
63576c13 | 559 | if (locked) |
5c672ab3 MS |
560 | mutex_unlock(&get_fuse_inode(inode)->mutex); |
561 | } | |
562 | ||
42faad99 | 563 | static void fuse_umount_begin(struct super_block *sb) |
69a53bf2 | 564 | { |
15c8e72e VG |
565 | struct fuse_conn *fc = get_fuse_conn_super(sb); |
566 | ||
247861c3 DL |
567 | if (fc->no_force_umount) |
568 | return; | |
569 | ||
570 | fuse_abort_conn(fc); | |
571 | ||
572 | // Only retire block-device-based superblocks. | |
573 | if (sb->s_bdev != NULL) | |
574 | retire_super(sb); | |
69a53bf2 MS |
575 | } |
576 | ||
fcee216b | 577 | static void fuse_send_destroy(struct fuse_mount *fm) |
0ec7ca41 | 578 | { |
fcee216b | 579 | if (fm->fc->conn_init) { |
1ccd1ea2 MS |
580 | FUSE_ARGS(args); |
581 | ||
582 | args.opcode = FUSE_DESTROY; | |
583 | args.force = true; | |
584 | args.nocreds = true; | |
fcee216b | 585 | fuse_simple_request(fm, &args); |
0ec7ca41 MS |
586 | } |
587 | } | |
588 | ||
e5e5558e MS |
589 | static void convert_fuse_statfs(struct kstatfs *stbuf, struct fuse_kstatfs *attr) |
590 | { | |
591 | stbuf->f_type = FUSE_SUPER_MAGIC; | |
592 | stbuf->f_bsize = attr->bsize; | |
de5f1202 | 593 | stbuf->f_frsize = attr->frsize; |
e5e5558e MS |
594 | stbuf->f_blocks = attr->blocks; |
595 | stbuf->f_bfree = attr->bfree; | |
596 | stbuf->f_bavail = attr->bavail; | |
597 | stbuf->f_files = attr->files; | |
598 | stbuf->f_ffree = attr->ffree; | |
599 | stbuf->f_namelen = attr->namelen; | |
600 | /* fsid is left zero */ | |
601 | } | |
602 | ||
726c3342 | 603 | static int fuse_statfs(struct dentry *dentry, struct kstatfs *buf) |
e5e5558e | 604 | { |
726c3342 | 605 | struct super_block *sb = dentry->d_sb; |
fcee216b | 606 | struct fuse_mount *fm = get_fuse_mount_super(sb); |
7078187a | 607 | FUSE_ARGS(args); |
e5e5558e MS |
608 | struct fuse_statfs_out outarg; |
609 | int err; | |
610 | ||
fcee216b | 611 | if (!fuse_allow_current_process(fm->fc)) { |
e57ac683 MS |
612 | buf->f_type = FUSE_SUPER_MAGIC; |
613 | return 0; | |
614 | } | |
615 | ||
de5f1202 | 616 | memset(&outarg, 0, sizeof(outarg)); |
d5b48543 MS |
617 | args.in_numargs = 0; |
618 | args.opcode = FUSE_STATFS; | |
619 | args.nodeid = get_node_id(d_inode(dentry)); | |
620 | args.out_numargs = 1; | |
621 | args.out_args[0].size = sizeof(outarg); | |
622 | args.out_args[0].value = &outarg; | |
fcee216b | 623 | err = fuse_simple_request(fm, &args); |
e5e5558e MS |
624 | if (!err) |
625 | convert_fuse_statfs(buf, &outarg.st); | |
e5e5558e MS |
626 | return err; |
627 | } | |
628 | ||
660585b5 MS |
629 | static struct fuse_sync_bucket *fuse_sync_bucket_alloc(void) |
630 | { | |
631 | struct fuse_sync_bucket *bucket; | |
632 | ||
633 | bucket = kzalloc(sizeof(*bucket), GFP_KERNEL | __GFP_NOFAIL); | |
634 | if (bucket) { | |
635 | init_waitqueue_head(&bucket->waitq); | |
636 | /* Initial active count */ | |
637 | atomic_set(&bucket->count, 1); | |
638 | } | |
639 | return bucket; | |
640 | } | |
641 | ||
642 | static void fuse_sync_fs_writes(struct fuse_conn *fc) | |
643 | { | |
644 | struct fuse_sync_bucket *bucket, *new_bucket; | |
645 | int count; | |
646 | ||
647 | new_bucket = fuse_sync_bucket_alloc(); | |
648 | spin_lock(&fc->lock); | |
649 | bucket = rcu_dereference_protected(fc->curr_bucket, 1); | |
650 | count = atomic_read(&bucket->count); | |
651 | WARN_ON(count < 1); | |
652 | /* No outstanding writes? */ | |
653 | if (count == 1) { | |
654 | spin_unlock(&fc->lock); | |
655 | kfree(new_bucket); | |
656 | return; | |
657 | } | |
658 | ||
659 | /* | |
660 | * Completion of new bucket depends on completion of this bucket, so add | |
661 | * one more count. | |
662 | */ | |
663 | atomic_inc(&new_bucket->count); | |
664 | rcu_assign_pointer(fc->curr_bucket, new_bucket); | |
665 | spin_unlock(&fc->lock); | |
666 | /* | |
667 | * Drop initial active count. At this point if all writes in this and | |
668 | * ancestor buckets complete, the count will go to zero and this task | |
669 | * will be woken up. | |
670 | */ | |
671 | atomic_dec(&bucket->count); | |
672 | ||
673 | wait_event(bucket->waitq, atomic_read(&bucket->count) == 0); | |
674 | ||
675 | /* Drop temp count on descendant bucket */ | |
676 | fuse_sync_bucket_dec(new_bucket); | |
677 | kfree_rcu(bucket, rcu); | |
678 | } | |
679 | ||
2d82ab25 GK |
680 | static int fuse_sync_fs(struct super_block *sb, int wait) |
681 | { | |
682 | struct fuse_mount *fm = get_fuse_mount_super(sb); | |
683 | struct fuse_conn *fc = fm->fc; | |
684 | struct fuse_syncfs_in inarg; | |
685 | FUSE_ARGS(args); | |
686 | int err; | |
687 | ||
688 | /* | |
689 | * Userspace cannot handle the wait == 0 case. Avoid a | |
690 | * gratuitous roundtrip. | |
691 | */ | |
692 | if (!wait) | |
693 | return 0; | |
694 | ||
695 | /* The filesystem is being unmounted. Nothing to do. */ | |
696 | if (!sb->s_root) | |
697 | return 0; | |
698 | ||
699 | if (!fc->sync_fs) | |
700 | return 0; | |
701 | ||
660585b5 MS |
702 | fuse_sync_fs_writes(fc); |
703 | ||
2d82ab25 GK |
704 | memset(&inarg, 0, sizeof(inarg)); |
705 | args.in_numargs = 1; | |
706 | args.in_args[0].size = sizeof(inarg); | |
707 | args.in_args[0].value = &inarg; | |
708 | args.opcode = FUSE_SYNCFS; | |
709 | args.nodeid = get_node_id(sb->s_root->d_inode); | |
710 | args.out_numargs = 0; | |
711 | ||
712 | err = fuse_simple_request(fm, &args); | |
713 | if (err == -ENOSYS) { | |
714 | fc->sync_fs = 0; | |
715 | err = 0; | |
716 | } | |
717 | ||
718 | return err; | |
719 | } | |
720 | ||
/* Mount option identifiers returned by fs_parse() in fuse_parse_param(). */
enum {
	OPT_SOURCE,			/* "source" */
	OPT_SUBTYPE,			/* "subtype" */
	OPT_FD,				/* "fd" */
	OPT_ROOTMODE,			/* "rootmode" */
	OPT_USER_ID,			/* "user_id" */
	OPT_GROUP_ID,			/* "group_id" */
	OPT_DEFAULT_PERMISSIONS,	/* "default_permissions" */
	OPT_ALLOW_OTHER,		/* "allow_other" */
	OPT_MAX_READ,			/* "max_read" */
	OPT_BLKSIZE,			/* "blksize" */
	OPT_ERR
};
734 | ||
d7167b14 | 735 | static const struct fs_parameter_spec fuse_fs_parameters[] = { |
c30da2e9 DH |
736 | fsparam_string ("source", OPT_SOURCE), |
737 | fsparam_u32 ("fd", OPT_FD), | |
738 | fsparam_u32oct ("rootmode", OPT_ROOTMODE), | |
739 | fsparam_u32 ("user_id", OPT_USER_ID), | |
740 | fsparam_u32 ("group_id", OPT_GROUP_ID), | |
741 | fsparam_flag ("default_permissions", OPT_DEFAULT_PERMISSIONS), | |
742 | fsparam_flag ("allow_other", OPT_ALLOW_OTHER), | |
743 | fsparam_u32 ("max_read", OPT_MAX_READ), | |
744 | fsparam_u32 ("blksize", OPT_BLKSIZE), | |
c7eb6869 | 745 | fsparam_string ("subtype", OPT_SUBTYPE), |
c30da2e9 DH |
746 | {} |
747 | }; | |
748 | ||
84c21507 | 749 | static int fuse_parse_param(struct fs_context *fsc, struct fs_parameter *param) |
233a01fa | 750 | { |
c30da2e9 | 751 | struct fs_parse_result result; |
84c21507 | 752 | struct fuse_fs_context *ctx = fsc->fs_private; |
c30da2e9 DH |
753 | int opt; |
754 | ||
84c21507 | 755 | if (fsc->purpose == FS_CONTEXT_FOR_RECONFIGURE) { |
b330966f MS |
756 | /* |
757 | * Ignore options coming from mount(MS_REMOUNT) for backward | |
758 | * compatibility. | |
759 | */ | |
84c21507 | 760 | if (fsc->oldapi) |
b330966f MS |
761 | return 0; |
762 | ||
84c21507 | 763 | return invalfc(fsc, "No changes allowed in reconfigure"); |
b330966f | 764 | } |
e8b20a47 | 765 | |
84c21507 | 766 | opt = fs_parse(fsc, fuse_fs_parameters, param, &result); |
c30da2e9 DH |
767 | if (opt < 0) |
768 | return opt; | |
769 | ||
770 | switch (opt) { | |
771 | case OPT_SOURCE: | |
84c21507 MS |
772 | if (fsc->source) |
773 | return invalfc(fsc, "Multiple sources specified"); | |
774 | fsc->source = param->string; | |
c30da2e9 DH |
775 | param->string = NULL; |
776 | break; | |
777 | ||
778 | case OPT_SUBTYPE: | |
779 | if (ctx->subtype) | |
84c21507 | 780 | return invalfc(fsc, "Multiple subtypes specified"); |
c30da2e9 DH |
781 | ctx->subtype = param->string; |
782 | param->string = NULL; | |
783 | return 0; | |
784 | ||
785 | case OPT_FD: | |
786 | ctx->fd = result.uint_32; | |
cabdb4fa | 787 | ctx->fd_present = true; |
c30da2e9 DH |
788 | break; |
789 | ||
790 | case OPT_ROOTMODE: | |
791 | if (!fuse_valid_type(result.uint_32)) | |
84c21507 | 792 | return invalfc(fsc, "Invalid rootmode"); |
c30da2e9 | 793 | ctx->rootmode = result.uint_32; |
cabdb4fa | 794 | ctx->rootmode_present = true; |
c30da2e9 DH |
795 | break; |
796 | ||
797 | case OPT_USER_ID: | |
84c21507 | 798 | ctx->user_id = make_kuid(fsc->user_ns, result.uint_32); |
c30da2e9 | 799 | if (!uid_valid(ctx->user_id)) |
84c21507 | 800 | return invalfc(fsc, "Invalid user_id"); |
cabdb4fa | 801 | ctx->user_id_present = true; |
c30da2e9 DH |
802 | break; |
803 | ||
804 | case OPT_GROUP_ID: | |
84c21507 | 805 | ctx->group_id = make_kgid(fsc->user_ns, result.uint_32); |
c30da2e9 | 806 | if (!gid_valid(ctx->group_id)) |
84c21507 | 807 | return invalfc(fsc, "Invalid group_id"); |
cabdb4fa | 808 | ctx->group_id_present = true; |
c30da2e9 DH |
809 | break; |
810 | ||
811 | case OPT_DEFAULT_PERMISSIONS: | |
cabdb4fa | 812 | ctx->default_permissions = true; |
c30da2e9 DH |
813 | break; |
814 | ||
815 | case OPT_ALLOW_OTHER: | |
cabdb4fa | 816 | ctx->allow_other = true; |
c30da2e9 DH |
817 | break; |
818 | ||
819 | case OPT_MAX_READ: | |
820 | ctx->max_read = result.uint_32; | |
821 | break; | |
822 | ||
823 | case OPT_BLKSIZE: | |
824 | if (!ctx->is_bdev) | |
84c21507 | 825 | return invalfc(fsc, "blksize only supported for fuseblk"); |
c30da2e9 DH |
826 | ctx->blksize = result.uint_32; |
827 | break; | |
828 | ||
829 | default: | |
830 | return -EINVAL; | |
233a01fa | 831 | } |
c30da2e9 DH |
832 | |
833 | return 0; | |
233a01fa MS |
834 | } |
835 | ||
84c21507 | 836 | static void fuse_free_fsc(struct fs_context *fsc) |
d8a5ba45 | 837 | { |
84c21507 | 838 | struct fuse_fs_context *ctx = fsc->fs_private; |
5a533682 | 839 | |
c30da2e9 DH |
840 | if (ctx) { |
841 | kfree(ctx->subtype); | |
842 | kfree(ctx); | |
843 | } | |
d8a5ba45 MS |
844 | } |
845 | ||
34c80b1d | 846 | static int fuse_show_options(struct seq_file *m, struct dentry *root) |
d8a5ba45 | 847 | { |
34c80b1d AV |
848 | struct super_block *sb = root->d_sb; |
849 | struct fuse_conn *fc = get_fuse_conn_super(sb); | |
d8a5ba45 | 850 | |
f4fd4ae3 VG |
851 | if (fc->legacy_opts_show) { |
852 | seq_printf(m, ",user_id=%u", | |
853 | from_kuid_munged(fc->user_ns, fc->user_id)); | |
854 | seq_printf(m, ",group_id=%u", | |
855 | from_kgid_munged(fc->user_ns, fc->group_id)); | |
856 | if (fc->default_permissions) | |
857 | seq_puts(m, ",default_permissions"); | |
858 | if (fc->allow_other) | |
859 | seq_puts(m, ",allow_other"); | |
860 | if (fc->max_read != ~0) | |
861 | seq_printf(m, ",max_read=%u", fc->max_read); | |
862 | if (sb->s_bdev && sb->s_blocksize != FUSE_DEFAULT_BLKSIZE) | |
863 | seq_printf(m, ",blksize=%lu", sb->s_blocksize); | |
864 | } | |
1dd53957 | 865 | #ifdef CONFIG_FUSE_DAX |
780b1b95 JX |
866 | if (fc->dax_mode == FUSE_DAX_ALWAYS) |
867 | seq_puts(m, ",dax=always"); | |
868 | else if (fc->dax_mode == FUSE_DAX_NEVER) | |
869 | seq_puts(m, ",dax=never"); | |
870 | else if (fc->dax_mode == FUSE_DAX_INODE_USER) | |
871 | seq_puts(m, ",dax=inode"); | |
1dd53957 | 872 | #endif |
3f22c746 | 873 | |
d8a5ba45 MS |
874 | return 0; |
875 | } | |
876 | ||
ae3aad77 SH |
877 | static void fuse_iqueue_init(struct fuse_iqueue *fiq, |
878 | const struct fuse_iqueue_ops *ops, | |
879 | void *priv) | |
f88996a9 MS |
880 | { |
881 | memset(fiq, 0, sizeof(struct fuse_iqueue)); | |
76e43c8c | 882 | spin_lock_init(&fiq->lock); |
f88996a9 MS |
883 | init_waitqueue_head(&fiq->waitq); |
884 | INIT_LIST_HEAD(&fiq->pending); | |
885 | INIT_LIST_HEAD(&fiq->interrupts); | |
886 | fiq->forget_list_tail = &fiq->forget_list_head; | |
e16714d8 | 887 | fiq->connected = 1; |
ae3aad77 SH |
888 | fiq->ops = ops; |
889 | fiq->priv = priv; | |
f88996a9 MS |
890 | } |
891 | ||
3a2b5b9c MS |
892 | static void fuse_pqueue_init(struct fuse_pqueue *fpq) |
893 | { | |
be2ff42c KT |
894 | unsigned int i; |
895 | ||
45a91cb1 | 896 | spin_lock_init(&fpq->lock); |
be2ff42c KT |
897 | for (i = 0; i < FUSE_PQ_HASH_SIZE; i++) |
898 | INIT_LIST_HEAD(&fpq->processing[i]); | |
3a2b5b9c | 899 | INIT_LIST_HEAD(&fpq->io); |
e96edd94 | 900 | fpq->connected = 1; |
3a2b5b9c MS |
901 | } |
902 | ||
fcee216b MR |
903 | void fuse_conn_init(struct fuse_conn *fc, struct fuse_mount *fm, |
904 | struct user_namespace *user_ns, | |
ae3aad77 | 905 | const struct fuse_iqueue_ops *fiq_ops, void *fiq_priv) |
d8a5ba45 | 906 | { |
0d179aa5 TH |
907 | memset(fc, 0, sizeof(*fc)); |
908 | spin_lock_init(&fc->lock); | |
ae2dffa3 | 909 | spin_lock_init(&fc->bg_lock); |
3b463ae0 | 910 | init_rwsem(&fc->killsb); |
095fc40a | 911 | refcount_set(&fc->count, 1); |
c3696046 | 912 | atomic_set(&fc->dev_count, 1); |
0d179aa5 | 913 | init_waitqueue_head(&fc->blocked_waitq); |
ae3aad77 | 914 | fuse_iqueue_init(&fc->iq, fiq_ops, fiq_priv); |
0d179aa5 TH |
915 | INIT_LIST_HEAD(&fc->bg_queue); |
916 | INIT_LIST_HEAD(&fc->entry); | |
cc080e9e | 917 | INIT_LIST_HEAD(&fc->devices); |
0d179aa5 | 918 | atomic_set(&fc->num_waiting, 0); |
7a6d3c8b CH |
919 | fc->max_background = FUSE_DEFAULT_MAX_BACKGROUND; |
920 | fc->congestion_threshold = FUSE_DEFAULT_CONGESTION_THRESHOLD; | |
75126f55 | 921 | atomic64_set(&fc->khctr, 0); |
0d179aa5 | 922 | fc->polled_files = RB_ROOT; |
0aada884 | 923 | fc->blocked = 0; |
796523fb | 924 | fc->initialized = 0; |
e16714d8 | 925 | fc->connected = 1; |
4510d86f | 926 | atomic64_set(&fc->attr_version, 1); |
0d179aa5 | 927 | get_random_bytes(&fc->scramble_key, sizeof(fc->scramble_key)); |
0b6e9ea0 | 928 | fc->pid_ns = get_pid_ns(task_active_pid_ns(current)); |
8cb08329 | 929 | fc->user_ns = get_user_ns(user_ns); |
8a3177db | 930 | fc->max_pages = FUSE_DEFAULT_MAX_PAGES_PER_REQ; |
a7f0d7aa | 931 | fc->max_pages_limit = FUSE_MAX_MAX_PAGES; |
fcee216b | 932 | |
44350256 AG |
933 | if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH)) |
934 | fuse_backing_files_init(fc); | |
935 | ||
fcee216b MR |
936 | INIT_LIST_HEAD(&fc->mounts); |
937 | list_add(&fm->fc_entry, &fc->mounts); | |
938 | fm->fc = fc; | |
d8a5ba45 | 939 | } |
0d179aa5 | 940 | EXPORT_SYMBOL_GPL(fuse_conn_init); |
d8a5ba45 | 941 | |
bafa9654 MS |
942 | void fuse_conn_put(struct fuse_conn *fc) |
943 | { | |
095fc40a | 944 | if (refcount_dec_and_test(&fc->count)) { |
a62a8ef9 | 945 | struct fuse_iqueue *fiq = &fc->iq; |
660585b5 | 946 | struct fuse_sync_bucket *bucket; |
a62a8ef9 | 947 | |
1dd53957 VG |
948 | if (IS_ENABLED(CONFIG_FUSE_DAX)) |
949 | fuse_dax_conn_free(fc); | |
a62a8ef9 SH |
950 | if (fiq->ops->release) |
951 | fiq->ops->release(fiq); | |
0b6e9ea0 | 952 | put_pid_ns(fc->pid_ns); |
8cb08329 | 953 | put_user_ns(fc->user_ns); |
660585b5 MS |
954 | bucket = rcu_dereference_protected(fc->curr_bucket, 1); |
955 | if (bucket) { | |
956 | WARN_ON(atomic_read(&bucket->count) != 1); | |
957 | kfree(bucket); | |
958 | } | |
44350256 AG |
959 | if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH)) |
960 | fuse_backing_files_free(fc); | |
43901aab | 961 | fc->release(fc); |
d2a85164 | 962 | } |
bafa9654 | 963 | } |
08cbf542 | 964 | EXPORT_SYMBOL_GPL(fuse_conn_put); |
bafa9654 MS |
965 | |
966 | struct fuse_conn *fuse_conn_get(struct fuse_conn *fc) | |
967 | { | |
095fc40a | 968 | refcount_inc(&fc->count); |
bafa9654 MS |
969 | return fc; |
970 | } | |
08cbf542 | 971 | EXPORT_SYMBOL_GPL(fuse_conn_get); |
bafa9654 | 972 | |
b93f858a | 973 | static struct inode *fuse_get_root_inode(struct super_block *sb, unsigned mode) |
d8a5ba45 MS |
974 | { |
975 | struct fuse_attr attr; | |
976 | memset(&attr, 0, sizeof(attr)); | |
977 | ||
978 | attr.mode = mode; | |
979 | attr.ino = FUSE_ROOT_ID; | |
074406fa | 980 | attr.nlink = 1; |
1fb69e78 | 981 | return fuse_iget(sb, 1, 0, &attr, 0, 0); |
d8a5ba45 MS |
982 | } |
983 | ||
1729a16c | 984 | struct fuse_inode_handle { |
dbd561d2 MS |
985 | u64 nodeid; |
986 | u32 generation; | |
987 | }; | |
988 | ||
989 | static struct dentry *fuse_get_dentry(struct super_block *sb, | |
990 | struct fuse_inode_handle *handle) | |
991 | { | |
33670fa2 | 992 | struct fuse_conn *fc = get_fuse_conn_super(sb); |
dbd561d2 MS |
993 | struct inode *inode; |
994 | struct dentry *entry; | |
995 | int err = -ESTALE; | |
996 | ||
997 | if (handle->nodeid == 0) | |
998 | goto out_err; | |
999 | ||
1000 | inode = ilookup5(sb, handle->nodeid, fuse_inode_eq, &handle->nodeid); | |
33670fa2 MS |
1001 | if (!inode) { |
1002 | struct fuse_entry_out outarg; | |
13983d06 | 1003 | const struct qstr name = QSTR_INIT(".", 1); |
33670fa2 MS |
1004 | |
1005 | if (!fc->export_support) | |
1006 | goto out_err; | |
1007 | ||
33670fa2 MS |
1008 | err = fuse_lookup_name(sb, handle->nodeid, &name, &outarg, |
1009 | &inode); | |
1010 | if (err && err != -ENOENT) | |
1011 | goto out_err; | |
1012 | if (err || !inode) { | |
1013 | err = -ESTALE; | |
1014 | goto out_err; | |
1015 | } | |
1016 | err = -EIO; | |
1017 | if (get_node_id(inode) != handle->nodeid) | |
1018 | goto out_iput; | |
1019 | } | |
dbd561d2 MS |
1020 | err = -ESTALE; |
1021 | if (inode->i_generation != handle->generation) | |
1022 | goto out_iput; | |
1023 | ||
44003728 | 1024 | entry = d_obtain_alias(inode); |
c35eebe9 | 1025 | if (!IS_ERR(entry) && get_node_id(inode) != FUSE_ROOT_ID) |
dbd561d2 | 1026 | fuse_invalidate_entry_cache(entry); |
dbd561d2 MS |
1027 | |
1028 | return entry; | |
1029 | ||
1030 | out_iput: | |
1031 | iput(inode); | |
1032 | out_err: | |
1033 | return ERR_PTR(err); | |
1034 | } | |
1035 | ||
b0b0382b AV |
1036 | static int fuse_encode_fh(struct inode *inode, u32 *fh, int *max_len, |
1037 | struct inode *parent) | |
dbd561d2 | 1038 | { |
b0b0382b | 1039 | int len = parent ? 6 : 3; |
dbd561d2 MS |
1040 | u64 nodeid; |
1041 | u32 generation; | |
1042 | ||
5fe0c237 AK |
1043 | if (*max_len < len) { |
1044 | *max_len = len; | |
94e07a75 | 1045 | return FILEID_INVALID; |
5fe0c237 | 1046 | } |
dbd561d2 MS |
1047 | |
1048 | nodeid = get_fuse_inode(inode)->nodeid; | |
1049 | generation = inode->i_generation; | |
1050 | ||
1051 | fh[0] = (u32)(nodeid >> 32); | |
1052 | fh[1] = (u32)(nodeid & 0xffffffff); | |
1053 | fh[2] = generation; | |
1054 | ||
b0b0382b | 1055 | if (parent) { |
dbd561d2 MS |
1056 | nodeid = get_fuse_inode(parent)->nodeid; |
1057 | generation = parent->i_generation; | |
dbd561d2 MS |
1058 | |
1059 | fh[3] = (u32)(nodeid >> 32); | |
1060 | fh[4] = (u32)(nodeid & 0xffffffff); | |
1061 | fh[5] = generation; | |
1062 | } | |
1063 | ||
1064 | *max_len = len; | |
41d1ddd2 | 1065 | return parent ? FILEID_INO64_GEN_PARENT : FILEID_INO64_GEN; |
dbd561d2 MS |
1066 | } |
1067 | ||
1068 | static struct dentry *fuse_fh_to_dentry(struct super_block *sb, | |
1069 | struct fid *fid, int fh_len, int fh_type) | |
1070 | { | |
1071 | struct fuse_inode_handle handle; | |
1072 | ||
41d1ddd2 AG |
1073 | if ((fh_type != FILEID_INO64_GEN && |
1074 | fh_type != FILEID_INO64_GEN_PARENT) || fh_len < 3) | |
dbd561d2 MS |
1075 | return NULL; |
1076 | ||
1077 | handle.nodeid = (u64) fid->raw[0] << 32; | |
1078 | handle.nodeid |= (u64) fid->raw[1]; | |
1079 | handle.generation = fid->raw[2]; | |
1080 | return fuse_get_dentry(sb, &handle); | |
1081 | } | |
1082 | ||
1083 | static struct dentry *fuse_fh_to_parent(struct super_block *sb, | |
1084 | struct fid *fid, int fh_len, int fh_type) | |
1085 | { | |
1086 | struct fuse_inode_handle parent; | |
1087 | ||
41d1ddd2 | 1088 | if (fh_type != FILEID_INO64_GEN_PARENT || fh_len < 6) |
dbd561d2 MS |
1089 | return NULL; |
1090 | ||
1091 | parent.nodeid = (u64) fid->raw[3] << 32; | |
1092 | parent.nodeid |= (u64) fid->raw[4]; | |
1093 | parent.generation = fid->raw[5]; | |
1094 | return fuse_get_dentry(sb, &parent); | |
1095 | } | |
1096 | ||
33670fa2 MS |
1097 | static struct dentry *fuse_get_parent(struct dentry *child) |
1098 | { | |
2b0143b5 | 1099 | struct inode *child_inode = d_inode(child); |
33670fa2 MS |
1100 | struct fuse_conn *fc = get_fuse_conn(child_inode); |
1101 | struct inode *inode; | |
1102 | struct dentry *parent; | |
1103 | struct fuse_entry_out outarg; | |
33670fa2 MS |
1104 | int err; |
1105 | ||
1106 | if (!fc->export_support) | |
1107 | return ERR_PTR(-ESTALE); | |
1108 | ||
33670fa2 | 1109 | err = fuse_lookup_name(child_inode->i_sb, get_node_id(child_inode), |
80e5d1ff | 1110 | &dotdot_name, &outarg, &inode); |
44003728 CH |
1111 | if (err) { |
1112 | if (err == -ENOENT) | |
1113 | return ERR_PTR(-ESTALE); | |
33670fa2 | 1114 | return ERR_PTR(err); |
33670fa2 | 1115 | } |
44003728 CH |
1116 | |
1117 | parent = d_obtain_alias(inode); | |
c35eebe9 | 1118 | if (!IS_ERR(parent) && get_node_id(inode) != FUSE_ROOT_ID) |
33670fa2 | 1119 | fuse_invalidate_entry_cache(parent); |
33670fa2 MS |
1120 | |
1121 | return parent; | |
1122 | } | |
dbd561d2 MS |
1123 | |
1124 | static const struct export_operations fuse_export_operations = { | |
1125 | .fh_to_dentry = fuse_fh_to_dentry, | |
1126 | .fh_to_parent = fuse_fh_to_parent, | |
1127 | .encode_fh = fuse_encode_fh, | |
33670fa2 | 1128 | .get_parent = fuse_get_parent, |
dbd561d2 MS |
1129 | }; |
1130 | ||
ee9b6d61 | 1131 | static const struct super_operations fuse_super_operations = { |
d8a5ba45 | 1132 | .alloc_inode = fuse_alloc_inode, |
9baf28bb | 1133 | .free_inode = fuse_free_inode, |
b57922d9 | 1134 | .evict_inode = fuse_evict_inode, |
1e18bda8 | 1135 | .write_inode = fuse_write_inode, |
ead5f0b5 | 1136 | .drop_inode = generic_delete_inode, |
69a53bf2 | 1137 | .umount_begin = fuse_umount_begin, |
e5e5558e | 1138 | .statfs = fuse_statfs, |
2d82ab25 | 1139 | .sync_fs = fuse_sync_fs, |
d8a5ba45 MS |
1140 | .show_options = fuse_show_options, |
1141 | }; | |
1142 | ||
487ea5af CH |
1143 | static void sanitize_global_limit(unsigned *limit) |
1144 | { | |
f22f812d MS |
1145 | /* |
1146 | * The default maximum number of async requests is calculated to consume | |
1147 | * 1/2^13 of the total memory, assuming 392 bytes per request. | |
1148 | */ | |
487ea5af | 1149 | if (*limit == 0) |
f22f812d | 1150 | *limit = ((totalram_pages() << PAGE_SHIFT) >> 13) / 392; |
487ea5af CH |
1151 | |
1152 | if (*limit >= 1 << 16) | |
1153 | *limit = (1 << 16) - 1; | |
1154 | } | |
1155 | ||
e4dca7b7 | 1156 | static int set_global_limit(const char *val, const struct kernel_param *kp) |
487ea5af CH |
1157 | { |
1158 | int rv; | |
1159 | ||
1160 | rv = param_set_uint(val, kp); | |
1161 | if (rv) | |
1162 | return rv; | |
1163 | ||
1164 | sanitize_global_limit((unsigned *)kp->arg); | |
1165 | ||
1166 | return 0; | |
1167 | } | |
1168 | ||
1169 | static void process_init_limits(struct fuse_conn *fc, struct fuse_init_out *arg) | |
1170 | { | |
1171 | int cap_sys_admin = capable(CAP_SYS_ADMIN); | |
1172 | ||
1173 | if (arg->minor < 13) | |
1174 | return; | |
1175 | ||
1176 | sanitize_global_limit(&max_user_bgreq); | |
1177 | sanitize_global_limit(&max_user_congthresh); | |
1178 | ||
ae2dffa3 | 1179 | spin_lock(&fc->bg_lock); |
487ea5af CH |
1180 | if (arg->max_background) { |
1181 | fc->max_background = arg->max_background; | |
1182 | ||
1183 | if (!cap_sys_admin && fc->max_background > max_user_bgreq) | |
1184 | fc->max_background = max_user_bgreq; | |
1185 | } | |
1186 | if (arg->congestion_threshold) { | |
1187 | fc->congestion_threshold = arg->congestion_threshold; | |
1188 | ||
1189 | if (!cap_sys_admin && | |
1190 | fc->congestion_threshold > max_user_congthresh) | |
1191 | fc->congestion_threshold = max_user_congthresh; | |
1192 | } | |
ae2dffa3 | 1193 | spin_unlock(&fc->bg_lock); |
487ea5af CH |
1194 | } |
1195 | ||
615047ef MS |
1196 | struct fuse_init_args { |
1197 | struct fuse_args args; | |
1198 | struct fuse_init_in in; | |
1199 | struct fuse_init_out out; | |
1200 | }; | |
1201 | ||
fcee216b | 1202 | static void process_init_reply(struct fuse_mount *fm, struct fuse_args *args, |
615047ef | 1203 | int error) |
9b9a0469 | 1204 | { |
fcee216b | 1205 | struct fuse_conn *fc = fm->fc; |
615047ef MS |
1206 | struct fuse_init_args *ia = container_of(args, typeof(*ia), args); |
1207 | struct fuse_init_out *arg = &ia->out; | |
fd1a1dc6 | 1208 | bool ok = true; |
9b9a0469 | 1209 | |
615047ef | 1210 | if (error || arg->major != FUSE_KERNEL_VERSION) |
fd1a1dc6 | 1211 | ok = false; |
9b9a0469 | 1212 | else { |
9cd68455 MS |
1213 | unsigned long ra_pages; |
1214 | ||
487ea5af CH |
1215 | process_init_limits(fc, arg); |
1216 | ||
9cd68455 | 1217 | if (arg->minor >= 6) { |
3066ff93 BS |
1218 | u64 flags = arg->flags; |
1219 | ||
1220 | if (flags & FUSE_INIT_EXT) | |
1221 | flags |= (u64) arg->flags2 << 32; | |
53db2893 | 1222 | |
09cbfeaf | 1223 | ra_pages = arg->max_readahead / PAGE_SIZE; |
53db2893 | 1224 | if (flags & FUSE_ASYNC_READ) |
9cd68455 | 1225 | fc->async_read = 1; |
53db2893 | 1226 | if (!(flags & FUSE_POSIX_LOCKS)) |
71421259 | 1227 | fc->no_lock = 1; |
37fb3a30 | 1228 | if (arg->minor >= 17) { |
53db2893 | 1229 | if (!(flags & FUSE_FLOCK_LOCKS)) |
37fb3a30 | 1230 | fc->no_flock = 1; |
24114504 | 1231 | } else { |
53db2893 | 1232 | if (!(flags & FUSE_POSIX_LOCKS)) |
24114504 | 1233 | fc->no_flock = 1; |
37fb3a30 | 1234 | } |
53db2893 | 1235 | if (flags & FUSE_ATOMIC_O_TRUNC) |
6ff958ed | 1236 | fc->atomic_o_trunc = 1; |
33670fa2 MS |
1237 | if (arg->minor >= 9) { |
1238 | /* LOOKUP has dependency on proto version */ | |
53db2893 | 1239 | if (flags & FUSE_EXPORT_SUPPORT) |
33670fa2 MS |
1240 | fc->export_support = 1; |
1241 | } | |
53db2893 | 1242 | if (flags & FUSE_BIG_WRITES) |
78bb6cb9 | 1243 | fc->big_writes = 1; |
53db2893 | 1244 | if (flags & FUSE_DONT_MASK) |
e0a43ddc | 1245 | fc->dont_mask = 1; |
53db2893 | 1246 | if (flags & FUSE_AUTO_INVAL_DATA) |
72d0d248 | 1247 | fc->auto_inval_data = 1; |
53db2893 | 1248 | else if (flags & FUSE_EXPLICIT_INVAL_DATA) |
ad2ba64d | 1249 | fc->explicit_inval_data = 1; |
53db2893 | 1250 | if (flags & FUSE_DO_READDIRPLUS) { |
0b05b183 | 1251 | fc->do_readdirplus = 1; |
53db2893 | 1252 | if (flags & FUSE_READDIRPLUS_AUTO) |
28420dad MS |
1253 | fc->readdirplus_auto = 1; |
1254 | } | |
53db2893 | 1255 | if (flags & FUSE_ASYNC_DIO) |
60b9df7a | 1256 | fc->async_dio = 1; |
53db2893 | 1257 | if (flags & FUSE_WRITEBACK_CACHE) |
4d99ff8f | 1258 | fc->writeback_cache = 1; |
53db2893 | 1259 | if (flags & FUSE_PARALLEL_DIROPS) |
5c672ab3 | 1260 | fc->parallel_dirops = 1; |
53db2893 | 1261 | if (flags & FUSE_HANDLE_KILLPRIV) |
5e940c1d | 1262 | fc->handle_killpriv = 1; |
e27c9d38 | 1263 | if (arg->time_gran && arg->time_gran <= 1000000000) |
fcee216b | 1264 | fm->sb->s_time_gran = arg->time_gran; |
53db2893 | 1265 | if ((flags & FUSE_POSIX_ACL)) { |
29433a29 | 1266 | fc->default_permissions = 1; |
60bcc88a | 1267 | fc->posix_acl = 1; |
60bcc88a | 1268 | } |
53db2893 | 1269 | if (flags & FUSE_CACHE_SYMLINKS) |
5571f1e6 | 1270 | fc->cache_symlinks = 1; |
53db2893 | 1271 | if (flags & FUSE_ABORT_ERROR) |
3b7008b2 | 1272 | fc->abort_err = 1; |
53db2893 | 1273 | if (flags & FUSE_MAX_PAGES) { |
5da784cc | 1274 | fc->max_pages = |
a7f0d7aa | 1275 | min_t(unsigned int, fc->max_pages_limit, |
5da784cc CS |
1276 | max_t(unsigned int, arg->max_pages, 1)); |
1277 | } | |
2ee019fa JX |
1278 | if (IS_ENABLED(CONFIG_FUSE_DAX)) { |
1279 | if (flags & FUSE_MAP_ALIGNMENT && | |
1280 | !fuse_dax_check_alignment(fc, arg->map_alignment)) { | |
1281 | ok = false; | |
1282 | } | |
1283 | if (flags & FUSE_HAS_INODE_DAX) | |
1284 | fc->inode_dax = 1; | |
fd1a1dc6 | 1285 | } |
53db2893 | 1286 | if (flags & FUSE_HANDLE_KILLPRIV_V2) { |
63f9909f | 1287 | fc->handle_killpriv_v2 = 1; |
9d769e6a VG |
1288 | fm->sb->s_flags |= SB_NOSEC; |
1289 | } | |
53db2893 | 1290 | if (flags & FUSE_SETXATTR_EXT) |
52a4c95f | 1291 | fc->setxattr_ext = 1; |
3e2b6fdb VG |
1292 | if (flags & FUSE_SECURITY_CTX) |
1293 | fc->init_security = 1; | |
8ed7cb3f MS |
1294 | if (flags & FUSE_CREATE_SUPP_GROUP) |
1295 | fc->create_supp_group = 1; | |
c55e0a55 TF |
1296 | if (flags & FUSE_DIRECT_IO_ALLOW_MMAP) |
1297 | fc->direct_io_allow_mmap = 1; | |
7dc4e97a AG |
1298 | /* |
1299 | * max_stack_depth is the max stack depth of FUSE fs, | |
1300 | * so it has to be at least 1 to support passthrough | |
1301 | * to backing files. | |
1302 | * | |
1303 | * with max_stack_depth > 1, the backing files can be | |
1304 | * on a stacked fs (e.g. overlayfs) themselves and with | |
1305 | * max_stack_depth == 1, FUSE fs can be stacked as the | |
1306 | * underlying fs of a stacked fs (e.g. overlayfs). | |
1307 | */ | |
1308 | if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH) && | |
1309 | (flags & FUSE_PASSTHROUGH) && | |
1310 | arg->max_stack_depth > 0 && | |
1311 | arg->max_stack_depth <= FILESYSTEM_MAX_STACK_DEPTH) { | |
1312 | fc->passthrough = 1; | |
1313 | fc->max_stack_depth = arg->max_stack_depth; | |
1314 | fm->sb->s_stack_depth = arg->max_stack_depth; | |
1315 | } | |
71421259 | 1316 | } else { |
09cbfeaf | 1317 | ra_pages = fc->max_read / PAGE_SIZE; |
71421259 | 1318 | fc->no_lock = 1; |
37fb3a30 | 1319 | fc->no_flock = 1; |
71421259 | 1320 | } |
9cd68455 | 1321 | |
fcee216b MR |
1322 | fm->sb->s_bdi->ra_pages = |
1323 | min(fm->sb->s_bdi->ra_pages, ra_pages); | |
9b9a0469 MS |
1324 | fc->minor = arg->minor; |
1325 | fc->max_write = arg->minor < 5 ? 4096 : arg->max_write; | |
f948d564 | 1326 | fc->max_write = max_t(unsigned, 4096, fc->max_write); |
0ec7ca41 | 1327 | fc->conn_init = 1; |
9b9a0469 | 1328 | } |
615047ef MS |
1329 | kfree(ia); |
1330 | ||
fd1a1dc6 SH |
1331 | if (!ok) { |
1332 | fc->conn_init = 0; | |
1333 | fc->conn_error = 1; | |
1334 | } | |
1335 | ||
9759bd51 | 1336 | fuse_set_initialized(fc); |
08a53cdc | 1337 | wake_up_all(&fc->blocked_waitq); |
9b9a0469 MS |
1338 | } |
1339 | ||
fcee216b | 1340 | void fuse_send_init(struct fuse_mount *fm) |
9b9a0469 | 1341 | { |
615047ef | 1342 | struct fuse_init_args *ia; |
53db2893 | 1343 | u64 flags; |
095da6cb | 1344 | |
615047ef MS |
1345 | ia = kzalloc(sizeof(*ia), GFP_KERNEL | __GFP_NOFAIL); |
1346 | ||
1347 | ia->in.major = FUSE_KERNEL_VERSION; | |
1348 | ia->in.minor = FUSE_KERNEL_MINOR_VERSION; | |
fcee216b | 1349 | ia->in.max_readahead = fm->sb->s_bdi->ra_pages * PAGE_SIZE; |
53db2893 | 1350 | flags = |
615047ef | 1351 | FUSE_ASYNC_READ | FUSE_POSIX_LOCKS | FUSE_ATOMIC_O_TRUNC | |
37fb3a30 | 1352 | FUSE_EXPORT_SUPPORT | FUSE_BIG_WRITES | FUSE_DONT_MASK | |
69fe05c9 | 1353 | FUSE_SPLICE_WRITE | FUSE_SPLICE_MOVE | FUSE_SPLICE_READ | |
9446385f | 1354 | FUSE_FLOCK_LOCKS | FUSE_HAS_IOCTL_DIR | FUSE_AUTO_INVAL_DATA | |
4d99ff8f | 1355 | FUSE_DO_READDIRPLUS | FUSE_READDIRPLUS_AUTO | FUSE_ASYNC_DIO | |
5c672ab3 | 1356 | FUSE_WRITEBACK_CACHE | FUSE_NO_OPEN_SUPPORT | |
3b7008b2 | 1357 | FUSE_PARALLEL_DIROPS | FUSE_HANDLE_KILLPRIV | FUSE_POSIX_ACL | |
d9a9ea94 | 1358 | FUSE_ABORT_ERROR | FUSE_MAX_PAGES | FUSE_CACHE_SYMLINKS | |
63f9909f | 1359 | FUSE_NO_OPENDIR_SUPPORT | FUSE_EXPLICIT_INVAL_DATA | |
3e2b6fdb | 1360 | FUSE_HANDLE_KILLPRIV_V2 | FUSE_SETXATTR_EXT | FUSE_INIT_EXT | |
5cadfbd5 | 1361 | FUSE_SECURITY_CTX | FUSE_CREATE_SUPP_GROUP | |
c55e0a55 | 1362 | FUSE_HAS_EXPIRE_ONLY | FUSE_DIRECT_IO_ALLOW_MMAP; |
fd1a1dc6 | 1363 | #ifdef CONFIG_FUSE_DAX |
fcee216b | 1364 | if (fm->fc->dax) |
53db2893 | 1365 | flags |= FUSE_MAP_ALIGNMENT; |
2ee019fa JX |
1366 | if (fuse_is_inode_dax_mode(fm->fc->dax_mode)) |
1367 | flags |= FUSE_HAS_INODE_DAX; | |
fd1a1dc6 | 1368 | #endif |
bf109c64 | 1369 | if (fm->fc->auto_submounts) |
53db2893 | 1370 | flags |= FUSE_SUBMOUNTS; |
7dc4e97a AG |
1371 | if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH)) |
1372 | flags |= FUSE_PASSTHROUGH; | |
53db2893 MS |
1373 | |
1374 | ia->in.flags = flags; | |
1375 | ia->in.flags2 = flags >> 32; | |
bf109c64 | 1376 | |
615047ef MS |
1377 | ia->args.opcode = FUSE_INIT; |
1378 | ia->args.in_numargs = 1; | |
1379 | ia->args.in_args[0].size = sizeof(ia->in); | |
1380 | ia->args.in_args[0].value = &ia->in; | |
1381 | ia->args.out_numargs = 1; | |
3ad2f3fb | 1382 | /* Variable length argument used for backward compatibility |
9b9a0469 MS |
1383 | with interface version < 7.5. Rest of init_out is zeroed |
1384 | by do_get_request(), so a short reply is not a problem */ | |
cabdb4fa | 1385 | ia->args.out_argvar = true; |
615047ef MS |
1386 | ia->args.out_args[0].size = sizeof(ia->out); |
1387 | ia->args.out_args[0].value = &ia->out; | |
1388 | ia->args.force = true; | |
1389 | ia->args.nocreds = true; | |
1390 | ia->args.end = process_init_reply; | |
1391 | ||
fcee216b MR |
1392 | if (fuse_simple_background(fm, &ia->args, GFP_KERNEL) != 0) |
1393 | process_init_reply(fm, &ia->args, -ENOTCONN); | |
9b9a0469 | 1394 | } |
95a84cdb | 1395 | EXPORT_SYMBOL_GPL(fuse_send_init); |
9b9a0469 | 1396 | |
783863d6 | 1397 | void fuse_free_conn(struct fuse_conn *fc) |
43901aab | 1398 | { |
cc080e9e | 1399 | WARN_ON(!list_empty(&fc->devices)); |
dd3e2c55 | 1400 | kfree_rcu(fc, rcu); |
43901aab | 1401 | } |
783863d6 | 1402 | EXPORT_SYMBOL_GPL(fuse_free_conn); |
43901aab | 1403 | |
a325f9b9 TH |
1404 | static int fuse_bdi_init(struct fuse_conn *fc, struct super_block *sb) |
1405 | { | |
1406 | int err; | |
5f7f7543 | 1407 | char *suffix = ""; |
a325f9b9 | 1408 | |
69c8ebf8 | 1409 | if (sb->s_bdev) { |
5f7f7543 | 1410 | suffix = "-fuseblk"; |
69c8ebf8 JK |
1411 | /* |
1412 | * sb->s_bdi points to blkdev's bdi however we want to redirect | |
1413 | * it to our private bdi... | |
1414 | */ | |
1415 | bdi_put(sb->s_bdi); | |
1416 | sb->s_bdi = &noop_backing_dev_info; | |
1417 | } | |
5f7f7543 JK |
1418 | err = super_setup_bdi_name(sb, "%u:%u%s", MAJOR(fc->dev), |
1419 | MINOR(fc->dev), suffix); | |
a325f9b9 TH |
1420 | if (err) |
1421 | return err; | |
1422 | ||
5f7f7543 | 1423 | /* fuse does it's own writeback accounting */ |
823423ef CH |
1424 | sb->s_bdi->capabilities &= ~BDI_CAP_WRITEBACK_ACCT; |
1425 | sb->s_bdi->capabilities |= BDI_CAP_STRICTLIMIT; | |
a325f9b9 | 1426 | |
a325f9b9 TH |
1427 | /* |
1428 | * For a single fuse filesystem use max 1% of dirty + | |
1429 | * writeback threshold. | |
1430 | * | |
1431 | * This gives about 1M of write buffer for memory maps on a | |
1432 | * machine with 1G and 10% dirty_ratio, which should be more | |
1433 | * than enough. | |
1434 | * | |
1435 | * Privileged users can raise it by writing to | |
1436 | * | |
1437 | * /sys/class/bdi/<bdi>/max_ratio | |
1438 | */ | |
5f7f7543 | 1439 | bdi_set_max_ratio(sb->s_bdi, 1); |
a325f9b9 TH |
1440 | |
1441 | return 0; | |
1442 | } | |
1443 | ||
0cd1eb9a | 1444 | struct fuse_dev *fuse_dev_alloc(void) |
cc080e9e MS |
1445 | { |
1446 | struct fuse_dev *fud; | |
be2ff42c | 1447 | struct list_head *pq; |
cc080e9e MS |
1448 | |
1449 | fud = kzalloc(sizeof(struct fuse_dev), GFP_KERNEL); | |
be2ff42c KT |
1450 | if (!fud) |
1451 | return NULL; | |
cc080e9e | 1452 | |
be2ff42c KT |
1453 | pq = kcalloc(FUSE_PQ_HASH_SIZE, sizeof(struct list_head), GFP_KERNEL); |
1454 | if (!pq) { | |
1455 | kfree(fud); | |
1456 | return NULL; | |
cc080e9e MS |
1457 | } |
1458 | ||
be2ff42c | 1459 | fud->pq.processing = pq; |
be2ff42c KT |
1460 | fuse_pqueue_init(&fud->pq); |
1461 | ||
0cd1eb9a VG |
1462 | return fud; |
1463 | } | |
1464 | EXPORT_SYMBOL_GPL(fuse_dev_alloc); | |
1465 | ||
1466 | void fuse_dev_install(struct fuse_dev *fud, struct fuse_conn *fc) | |
1467 | { | |
1468 | fud->fc = fuse_conn_get(fc); | |
be2ff42c KT |
1469 | spin_lock(&fc->lock); |
1470 | list_add_tail(&fud->entry, &fc->devices); | |
1471 | spin_unlock(&fc->lock); | |
0cd1eb9a VG |
1472 | } |
1473 | EXPORT_SYMBOL_GPL(fuse_dev_install); | |
be2ff42c | 1474 | |
/*
 * Allocate a new fuse_dev and attach it to @fc in one step.
 *
 * Returns the installed device, or NULL if the allocation failed (in
 * which case @fc is left untouched).
 */
struct fuse_dev *fuse_dev_alloc_install(struct fuse_conn *fc)
{
	struct fuse_dev *fud = fuse_dev_alloc();

	if (fud)
		fuse_dev_install(fud, fc);

	return fud;
}
EXPORT_SYMBOL_GPL(fuse_dev_alloc_install);
cc080e9e MS |
1487 | |
1488 | void fuse_dev_free(struct fuse_dev *fud) | |
1489 | { | |
1490 | struct fuse_conn *fc = fud->fc; | |
1491 | ||
1492 | if (fc) { | |
1493 | spin_lock(&fc->lock); | |
1494 | list_del(&fud->entry); | |
1495 | spin_unlock(&fc->lock); | |
1496 | ||
1497 | fuse_conn_put(fc); | |
1498 | } | |
d72f70da | 1499 | kfree(fud->pq.processing); |
cc080e9e MS |
1500 | kfree(fud); |
1501 | } | |
1502 | EXPORT_SYMBOL_GPL(fuse_dev_free); | |
1503 | ||
1866d779 MR |
1504 | static void fuse_fill_attr_from_inode(struct fuse_attr *attr, |
1505 | const struct fuse_inode *fi) | |
1506 | { | |
3c0d5df2 JL |
1507 | struct timespec64 atime = inode_get_atime(&fi->inode); |
1508 | struct timespec64 mtime = inode_get_mtime(&fi->inode); | |
ceb2d5e9 JL |
1509 | struct timespec64 ctime = inode_get_ctime(&fi->inode); |
1510 | ||
1866d779 MR |
1511 | *attr = (struct fuse_attr){ |
1512 | .ino = fi->inode.i_ino, | |
1513 | .size = fi->inode.i_size, | |
1514 | .blocks = fi->inode.i_blocks, | |
3c0d5df2 JL |
1515 | .atime = atime.tv_sec, |
1516 | .mtime = mtime.tv_sec, | |
ceb2d5e9 | 1517 | .ctime = ctime.tv_sec, |
3c0d5df2 JL |
1518 | .atimensec = atime.tv_nsec, |
1519 | .mtimensec = mtime.tv_nsec, | |
ceb2d5e9 | 1520 | .ctimensec = ctime.tv_nsec, |
1866d779 MR |
1521 | .mode = fi->inode.i_mode, |
1522 | .nlink = fi->inode.i_nlink, | |
1523 | .uid = fi->inode.i_uid.val, | |
1524 | .gid = fi->inode.i_gid.val, | |
1525 | .rdev = fi->inode.i_rdev, | |
1526 | .blksize = 1u << fi->inode.i_blkbits, | |
1527 | }; | |
1528 | } | |
1529 | ||
1530 | static void fuse_sb_defaults(struct super_block *sb) | |
1531 | { | |
1532 | sb->s_magic = FUSE_SUPER_MAGIC; | |
1533 | sb->s_op = &fuse_super_operations; | |
1534 | sb->s_xattr = fuse_xattr_handlers; | |
1535 | sb->s_maxbytes = MAX_LFS_FILESIZE; | |
1536 | sb->s_time_gran = 1; | |
1537 | sb->s_export_op = &fuse_export_operations; | |
1538 | sb->s_iflags |= SB_I_IMA_UNVERIFIABLE_SIGNATURE; | |
1539 | if (sb->s_user_ns != &init_user_ns) | |
1540 | sb->s_iflags |= SB_I_UNTRUSTED_MOUNTER; | |
1541 | sb->s_flags &= ~(SB_NOSEC | SB_I_VERSION); | |
1866d779 MR |
1542 | } |
1543 | ||
1b539917 GK |
1544 | static int fuse_fill_super_submount(struct super_block *sb, |
1545 | struct fuse_inode *parent_fi) | |
1866d779 MR |
1546 | { |
1547 | struct fuse_mount *fm = get_fuse_mount_super(sb); | |
1548 | struct super_block *parent_sb = parent_fi->inode.i_sb; | |
1549 | struct fuse_attr root_attr; | |
1550 | struct inode *root; | |
c4d361f6 KJ |
1551 | struct fuse_submount_lookup *sl; |
1552 | struct fuse_inode *fi; | |
1866d779 MR |
1553 | |
1554 | fuse_sb_defaults(sb); | |
1555 | fm->sb = sb; | |
1556 | ||
1557 | WARN_ON(sb->s_bdi != &noop_backing_dev_info); | |
1558 | sb->s_bdi = bdi_get(parent_sb->s_bdi); | |
1559 | ||
1560 | sb->s_xattr = parent_sb->s_xattr; | |
1561 | sb->s_time_gran = parent_sb->s_time_gran; | |
1562 | sb->s_blocksize = parent_sb->s_blocksize; | |
1563 | sb->s_blocksize_bits = parent_sb->s_blocksize_bits; | |
1564 | sb->s_subtype = kstrdup(parent_sb->s_subtype, GFP_KERNEL); | |
1565 | if (parent_sb->s_subtype && !sb->s_subtype) | |
1566 | return -ENOMEM; | |
1567 | ||
1568 | fuse_fill_attr_from_inode(&root_attr, parent_fi); | |
1569 | root = fuse_iget(sb, parent_fi->nodeid, 0, &root_attr, 0, 0); | |
1570 | /* | |
1571 | * This inode is just a duplicate, so it is not looked up and | |
1572 | * its nlookup should not be incremented. fuse_iget() does | |
1573 | * that, though, so undo it here. | |
1574 | */ | |
c4d361f6 KJ |
1575 | fi = get_fuse_inode(root); |
1576 | fi->nlookup--; | |
1577 | ||
1866d779 MR |
1578 | sb->s_d_op = &fuse_dentry_operations; |
1579 | sb->s_root = d_make_root(root); | |
1580 | if (!sb->s_root) | |
1581 | return -ENOMEM; | |
1582 | ||
c4d361f6 KJ |
1583 | /* |
1584 | * Grab the parent's submount_lookup pointer and take a | |
1585 | * reference on the shared nlookup from the parent. This is to | |
1586 | * prevent the last forget for this nodeid from getting | |
1587 | * triggered until all users have finished with it. | |
1588 | */ | |
1589 | sl = parent_fi->submount_lookup; | |
1590 | WARN_ON(!sl); | |
1591 | if (sl) { | |
1592 | refcount_inc(&sl->count); | |
1593 | fi->submount_lookup = sl; | |
1594 | } | |
1595 | ||
1866d779 MR |
1596 | return 0; |
1597 | } | |
1598 | ||
266eb3f2 | 1599 | /* Filesystem context private data holds the FUSE inode of the mount point */ |
fe0a7bd8 GK |
1600 | static int fuse_get_tree_submount(struct fs_context *fsc) |
1601 | { | |
266eb3f2 GK |
1602 | struct fuse_mount *fm; |
1603 | struct fuse_inode *mp_fi = fsc->fs_private; | |
1604 | struct fuse_conn *fc = get_fuse_conn(&mp_fi->inode); | |
1605 | struct super_block *sb; | |
1606 | int err; | |
1607 | ||
1608 | fm = kzalloc(sizeof(struct fuse_mount), GFP_KERNEL); | |
1609 | if (!fm) | |
1610 | return -ENOMEM; | |
1611 | ||
c191cd07 | 1612 | fm->fc = fuse_conn_get(fc); |
266eb3f2 GK |
1613 | fsc->s_fs_info = fm; |
1614 | sb = sget_fc(fsc, NULL, set_anon_super_fc); | |
c191cd07 MS |
1615 | if (fsc->s_fs_info) |
1616 | fuse_mount_destroy(fm); | |
1617 | if (IS_ERR(sb)) | |
266eb3f2 | 1618 | return PTR_ERR(sb); |
266eb3f2 GK |
1619 | |
1620 | /* Initialize superblock, making @mp_fi its root */ | |
1621 | err = fuse_fill_super_submount(sb, mp_fi); | |
1622 | if (err) { | |
266eb3f2 GK |
1623 | deactivate_locked_super(sb); |
1624 | return err; | |
1625 | } | |
1626 | ||
1627 | down_write(&fc->killsb); | |
1628 | list_add_tail(&fm->fc_entry, &fc->mounts); | |
1629 | up_write(&fc->killsb); | |
1630 | ||
1631 | sb->s_flags |= SB_ACTIVE; | |
1632 | fsc->root = dget(sb->s_root); | |
1633 | ||
fe0a7bd8 GK |
1634 | return 0; |
1635 | } | |
1636 | ||
1637 | static const struct fs_context_operations fuse_context_submount_ops = { | |
1638 | .get_tree = fuse_get_tree_submount, | |
1639 | }; | |
1640 | ||
1641 | int fuse_init_fs_context_submount(struct fs_context *fsc) | |
1642 | { | |
1643 | fsc->ops = &fuse_context_submount_ops; | |
1644 | return 0; | |
1645 | } | |
1646 | EXPORT_SYMBOL_GPL(fuse_init_fs_context_submount); | |
1647 | ||
0cc2656c | 1648 | int fuse_fill_super_common(struct super_block *sb, struct fuse_fs_context *ctx) |
d8a5ba45 | 1649 | { |
7fd3abfa | 1650 | struct fuse_dev *fud = NULL; |
fcee216b MR |
1651 | struct fuse_mount *fm = get_fuse_mount_super(sb); |
1652 | struct fuse_conn *fc = fm->fc; | |
d8a5ba45 | 1653 | struct inode *root; |
f543f253 | 1654 | struct dentry *root_dentry; |
d8a5ba45 MS |
1655 | int err; |
1656 | ||
c2b8f006 | 1657 | err = -EINVAL; |
1751e8a6 | 1658 | if (sb->s_flags & SB_MANDLOCK) |
c2b8f006 | 1659 | goto err; |
71421259 | 1660 | |
660585b5 | 1661 | rcu_assign_pointer(fc->curr_bucket, fuse_sync_bucket_alloc()); |
1866d779 | 1662 | fuse_sb_defaults(sb); |
9e1f1de0 | 1663 | |
0cc2656c | 1664 | if (ctx->is_bdev) { |
875d95ec | 1665 | #ifdef CONFIG_BLOCK |
c2b8f006 | 1666 | err = -EINVAL; |
c30da2e9 | 1667 | if (!sb_set_blocksize(sb, ctx->blksize)) |
c2b8f006 | 1668 | goto err; |
875d95ec | 1669 | #endif |
d8091614 | 1670 | } else { |
09cbfeaf KS |
1671 | sb->s_blocksize = PAGE_SIZE; |
1672 | sb->s_blocksize_bits = PAGE_SHIFT; | |
d8091614 | 1673 | } |
c30da2e9 DH |
1674 | |
1675 | sb->s_subtype = ctx->subtype; | |
1676 | ctx->subtype = NULL; | |
1dd53957 | 1677 | if (IS_ENABLED(CONFIG_FUSE_DAX)) { |
780b1b95 | 1678 | err = fuse_dax_conn_alloc(fc, ctx->dax_mode, ctx->dax_dev); |
1dd53957 VG |
1679 | if (err) |
1680 | goto err; | |
1681 | } | |
e45b2546 | 1682 | |
7fd3abfa VG |
1683 | if (ctx->fudptr) { |
1684 | err = -ENOMEM; | |
1685 | fud = fuse_dev_alloc_install(fc); | |
1686 | if (!fud) | |
1dd53957 | 1687 | goto err_free_dax; |
7fd3abfa | 1688 | } |
cc080e9e | 1689 | |
a325f9b9 | 1690 | fc->dev = sb->s_dev; |
fcee216b | 1691 | fm->sb = sb; |
a325f9b9 TH |
1692 | err = fuse_bdi_init(fc, sb); |
1693 | if (err) | |
cc080e9e | 1694 | goto err_dev_free; |
0d179aa5 | 1695 | |
e0a43ddc | 1696 | /* Handle umasking inside the fuse code */ |
1751e8a6 | 1697 | if (sb->s_flags & SB_POSIXACL) |
e0a43ddc | 1698 | fc->dont_mask = 1; |
1751e8a6 | 1699 | sb->s_flags |= SB_POSIXACL; |
e0a43ddc | 1700 | |
c30da2e9 DH |
1701 | fc->default_permissions = ctx->default_permissions; |
1702 | fc->allow_other = ctx->allow_other; | |
1703 | fc->user_id = ctx->user_id; | |
1704 | fc->group_id = ctx->group_id; | |
f4fd4ae3 | 1705 | fc->legacy_opts_show = ctx->legacy_opts_show; |
1866d779 | 1706 | fc->max_read = max_t(unsigned int, 4096, ctx->max_read); |
783863d6 | 1707 | fc->destroy = ctx->destroy; |
15c8e72e VG |
1708 | fc->no_control = ctx->no_control; |
1709 | fc->no_force_umount = ctx->no_force_umount; | |
f543f253 | 1710 | |
d8a5ba45 | 1711 | err = -ENOMEM; |
c30da2e9 | 1712 | root = fuse_get_root_inode(sb, ctx->rootmode); |
0ce267ff | 1713 | sb->s_d_op = &fuse_root_dentry_operations; |
48fde701 AV |
1714 | root_dentry = d_make_root(root); |
1715 | if (!root_dentry) | |
cc080e9e | 1716 | goto err_dev_free; |
0ce267ff | 1717 | /* Root dentry doesn't have .d_revalidate */ |
c35eebe9 | 1718 | sb->s_d_op = &fuse_dentry_operations; |
f543f253 | 1719 | |
bafa9654 | 1720 | mutex_lock(&fuse_mutex); |
8aa09a50 | 1721 | err = -EINVAL; |
7fd3abfa | 1722 | if (ctx->fudptr && *ctx->fudptr) |
bafa9654 | 1723 | goto err_unlock; |
8aa09a50 | 1724 | |
bafa9654 MS |
1725 | err = fuse_ctl_add_conn(fc); |
1726 | if (err) | |
1727 | goto err_unlock; | |
1728 | ||
1729 | list_add_tail(&fc->entry, &fuse_conn_list); | |
f543f253 | 1730 | sb->s_root = root_dentry; |
7fd3abfa VG |
1731 | if (ctx->fudptr) |
1732 | *ctx->fudptr = fud; | |
bafa9654 | 1733 | mutex_unlock(&fuse_mutex); |
0cc2656c SH |
1734 | return 0; |
1735 | ||
1736 | err_unlock: | |
1737 | mutex_unlock(&fuse_mutex); | |
1738 | dput(root_dentry); | |
1739 | err_dev_free: | |
7fd3abfa VG |
1740 | if (fud) |
1741 | fuse_dev_free(fud); | |
1dd53957 VG |
1742 | err_free_dax: |
1743 | if (IS_ENABLED(CONFIG_FUSE_DAX)) | |
1744 | fuse_dax_conn_free(fc); | |
0cc2656c SH |
1745 | err: |
1746 | return err; | |
1747 | } | |
1748 | EXPORT_SYMBOL_GPL(fuse_fill_super_common); | |
1749 | ||
1750 | static int fuse_fill_super(struct super_block *sb, struct fs_context *fsc) | |
1751 | { | |
1752 | struct fuse_fs_context *ctx = fsc->fs_private; | |
0cc2656c | 1753 | int err; |
0cc2656c | 1754 | |
62dd1fc8 | 1755 | if (!ctx->file || !ctx->rootmode_present || |
badc7414 MS |
1756 | !ctx->user_id_present || !ctx->group_id_present) |
1757 | return -EINVAL; | |
0cc2656c SH |
1758 | |
1759 | /* | |
1760 | * Require mount to happen from the same user namespace which | |
1761 | * opened /dev/fuse to prevent potential attacks. | |
1762 | */ | |
62dd1fc8 MS |
1763 | if ((ctx->file->f_op != &fuse_dev_operations) || |
1764 | (ctx->file->f_cred->user_ns != sb->s_user_ns)) | |
964d32e5 | 1765 | return -EINVAL; |
62dd1fc8 | 1766 | ctx->fudptr = &ctx->file->private_data; |
0cc2656c | 1767 | |
0cc2656c SH |
1768 | err = fuse_fill_super_common(sb, ctx); |
1769 | if (err) | |
964d32e5 | 1770 | return err; |
62dd1fc8 MS |
1771 | /* file->private_data shall be visible on all CPUs after this */ |
1772 | smp_mb(); | |
fcee216b | 1773 | fuse_send_init(get_fuse_mount_super(sb)); |
d8a5ba45 | 1774 | return 0; |
d8a5ba45 MS |
1775 | } |
1776 | ||
5d5b74aa MS |
1777 | /* |
1778 | * This is the path where user supplied an already initialized fuse dev. In | |
1779 | * this case never create a new super if the old one is gone. | |
1780 | */ | |
1781 | static int fuse_set_no_super(struct super_block *sb, struct fs_context *fsc) | |
d8a5ba45 | 1782 | { |
5d5b74aa MS |
1783 | return -ENOTCONN; |
1784 | } | |
c30da2e9 | 1785 | |
5d5b74aa MS |
1786 | static int fuse_test_super(struct super_block *sb, struct fs_context *fsc) |
1787 | { | |
c30da2e9 | 1788 | |
5d5b74aa MS |
1789 | return fsc->sget_key == get_fuse_conn_super(sb); |
1790 | } | |
1791 | ||
84c21507 | 1792 | static int fuse_get_tree(struct fs_context *fsc) |
d8a5ba45 | 1793 | { |
84c21507 | 1794 | struct fuse_fs_context *ctx = fsc->fs_private; |
5d5b74aa | 1795 | struct fuse_dev *fud; |
80019f11 MS |
1796 | struct fuse_conn *fc; |
1797 | struct fuse_mount *fm; | |
5d5b74aa | 1798 | struct super_block *sb; |
62dd1fc8 | 1799 | int err; |
c30da2e9 | 1800 | |
80019f11 MS |
1801 | fc = kmalloc(sizeof(*fc), GFP_KERNEL); |
1802 | if (!fc) | |
1803 | return -ENOMEM; | |
1804 | ||
1805 | fm = kzalloc(sizeof(*fm), GFP_KERNEL); | |
1806 | if (!fm) { | |
1807 | kfree(fc); | |
1808 | return -ENOMEM; | |
1809 | } | |
1810 | ||
1811 | fuse_conn_init(fc, fm, fsc->user_ns, &fuse_dev_fiq_ops, NULL); | |
1812 | fc->release = fuse_free_conn; | |
1813 | ||
1814 | fsc->s_fs_info = fm; | |
1815 | ||
62dd1fc8 MS |
1816 | if (ctx->fd_present) |
1817 | ctx->file = fget(ctx->fd); | |
c30da2e9 | 1818 | |
badc7414 | 1819 | if (IS_ENABLED(CONFIG_BLOCK) && ctx->is_bdev) { |
62dd1fc8 | 1820 | err = get_tree_bdev(fsc, fuse_fill_super); |
80019f11 | 1821 | goto out; |
badc7414 | 1822 | } |
5d5b74aa MS |
1823 | /* |
1824 | * While block dev mount can be initialized with a dummy device fd | |
1825 | * (found by device name), normal fuse mounts can't | |
1826 | */ | |
80019f11 | 1827 | err = -EINVAL; |
5d5b74aa | 1828 | if (!ctx->file) |
80019f11 | 1829 | goto out; |
c30da2e9 | 1830 | |
5d5b74aa MS |
1831 | /* |
1832 | * Allow creating a fuse mount with an already initialized fuse | |
1833 | * connection | |
1834 | */ | |
1835 | fud = READ_ONCE(ctx->file->private_data); | |
1836 | if (ctx->file->f_op == &fuse_dev_operations && fud) { | |
1837 | fsc->sget_key = fud->fc; | |
1838 | sb = sget_fc(fsc, fuse_test_super, fuse_set_no_super); | |
1839 | err = PTR_ERR_OR_ZERO(sb); | |
1840 | if (!IS_ERR(sb)) | |
1841 | fsc->root = dget(sb->s_root); | |
1842 | } else { | |
1843 | err = get_tree_nodev(fsc, fuse_fill_super); | |
1844 | } | |
80019f11 MS |
1845 | out: |
1846 | if (fsc->s_fs_info) | |
1847 | fuse_mount_destroy(fm); | |
62dd1fc8 MS |
1848 | if (ctx->file) |
1849 | fput(ctx->file); | |
1850 | return err; | |
c30da2e9 DH |
1851 | } |
1852 | ||
1853 | static const struct fs_context_operations fuse_context_ops = { | |
84c21507 | 1854 | .free = fuse_free_fsc, |
c30da2e9 | 1855 | .parse_param = fuse_parse_param, |
0189a2d3 | 1856 | .reconfigure = fuse_reconfigure, |
c30da2e9 DH |
1857 | .get_tree = fuse_get_tree, |
1858 | }; | |
1859 | ||
1860 | /* | |
1861 | * Set up the filesystem mount context. | |
1862 | */ | |
84c21507 | 1863 | static int fuse_init_fs_context(struct fs_context *fsc) |
c30da2e9 DH |
1864 | { |
1865 | struct fuse_fs_context *ctx; | |
1866 | ||
1867 | ctx = kzalloc(sizeof(struct fuse_fs_context), GFP_KERNEL); | |
1868 | if (!ctx) | |
1869 | return -ENOMEM; | |
1870 | ||
1871 | ctx->max_read = ~0; | |
1872 | ctx->blksize = FUSE_DEFAULT_BLKSIZE; | |
f4fd4ae3 | 1873 | ctx->legacy_opts_show = true; |
c30da2e9 DH |
1874 | |
1875 | #ifdef CONFIG_BLOCK | |
84c21507 | 1876 | if (fsc->fs_type == &fuseblk_fs_type) { |
c30da2e9 | 1877 | ctx->is_bdev = true; |
783863d6 MS |
1878 | ctx->destroy = true; |
1879 | } | |
c30da2e9 DH |
1880 | #endif |
1881 | ||
84c21507 MS |
1882 | fsc->fs_private = ctx; |
1883 | fsc->ops = &fuse_context_ops; | |
c30da2e9 | 1884 | return 0; |
d8a5ba45 MS |
1885 | } |
1886 | ||
fcee216b | 1887 | bool fuse_mount_remove(struct fuse_mount *fm) |
3b463ae0 | 1888 | { |
fcee216b MR |
1889 | struct fuse_conn *fc = fm->fc; |
1890 | bool last = false; | |
3b463ae0 | 1891 | |
fcee216b MR |
1892 | down_write(&fc->killsb); |
1893 | list_del_init(&fm->fc_entry); | |
1894 | if (list_empty(&fc->mounts)) | |
1895 | last = true; | |
1896 | up_write(&fc->killsb); | |
e8f3bd77 | 1897 | |
fcee216b MR |
1898 | return last; |
1899 | } | |
1900 | EXPORT_SYMBOL_GPL(fuse_mount_remove); | |
e8f3bd77 | 1901 | |
fcee216b MR |
1902 | void fuse_conn_destroy(struct fuse_mount *fm) |
1903 | { | |
1904 | struct fuse_conn *fc = fm->fc; | |
1905 | ||
1906 | if (fc->destroy) | |
1907 | fuse_send_destroy(fm); | |
1908 | ||
1909 | fuse_abort_conn(fc); | |
1910 | fuse_wait_aborted(fc); | |
413daa1a MS |
1911 | |
1912 | if (!list_empty(&fc->entry)) { | |
1913 | mutex_lock(&fuse_mutex); | |
1914 | list_del(&fc->entry); | |
1915 | fuse_ctl_remove_conn(fc); | |
1916 | mutex_unlock(&fuse_mutex); | |
3b463ae0 | 1917 | } |
e8f3bd77 | 1918 | } |
fcee216b | 1919 | EXPORT_SYMBOL_GPL(fuse_conn_destroy); |
3b463ae0 | 1920 | |
6a68d1e1 | 1921 | static void fuse_sb_destroy(struct super_block *sb) |
e8f3bd77 | 1922 | { |
fcee216b MR |
1923 | struct fuse_mount *fm = get_fuse_mount_super(sb); |
1924 | bool last; | |
1925 | ||
d534d31d | 1926 | if (sb->s_root) { |
fcee216b MR |
1927 | last = fuse_mount_remove(fm); |
1928 | if (last) | |
1929 | fuse_conn_destroy(fm); | |
1930 | } | |
6a68d1e1 MS |
1931 | } |
1932 | ||
a27c061a MS |
1933 | void fuse_mount_destroy(struct fuse_mount *fm) |
1934 | { | |
80019f11 MS |
1935 | fuse_conn_put(fm->fc); |
1936 | kfree(fm); | |
a27c061a MS |
1937 | } |
1938 | EXPORT_SYMBOL(fuse_mount_destroy); | |
1939 | ||
6a68d1e1 MS |
/*
 * ->kill_sb for "fuse": tear down the fuse side, kill the anonymous super
 * and finally release the fuse mount.
 */
static void fuse_kill_sb_anon(struct super_block *sb)
{
	struct fuse_mount *fm;

	fuse_sb_destroy(sb);
	kill_anon_super(sb);

	fm = get_fuse_mount_super(sb);
	fuse_mount_destroy(fm);
}
1946 | ||
875d95ec MS |
1947 | static struct file_system_type fuse_fs_type = { |
1948 | .owner = THIS_MODULE, | |
1949 | .name = "fuse", | |
4ad769f3 | 1950 | .fs_flags = FS_HAS_SUBTYPE | FS_USERNS_MOUNT, |
c30da2e9 | 1951 | .init_fs_context = fuse_init_fs_context, |
d7167b14 | 1952 | .parameters = fuse_fs_parameters, |
3b463ae0 | 1953 | .kill_sb = fuse_kill_sb_anon, |
875d95ec | 1954 | }; |
7f78e035 | 1955 | MODULE_ALIAS_FS("fuse"); |
875d95ec MS |
1956 | |
1957 | #ifdef CONFIG_BLOCK | |
3b463ae0 JM |
/*
 * ->kill_sb for "fuseblk": tear down the fuse side, kill the block super
 * and finally release the fuse mount.
 */
static void fuse_kill_sb_blk(struct super_block *sb)
{
	struct fuse_mount *fm;

	fuse_sb_destroy(sb);
	kill_block_super(sb);

	fm = get_fuse_mount_super(sb);
	fuse_mount_destroy(fm);
}
1964 | ||
d6392f87 MS |
1965 | static struct file_system_type fuseblk_fs_type = { |
1966 | .owner = THIS_MODULE, | |
1967 | .name = "fuseblk", | |
c30da2e9 | 1968 | .init_fs_context = fuse_init_fs_context, |
d7167b14 | 1969 | .parameters = fuse_fs_parameters, |
3b463ae0 | 1970 | .kill_sb = fuse_kill_sb_blk, |
edad01e2 | 1971 | .fs_flags = FS_REQUIRES_DEV | FS_HAS_SUBTYPE, |
d6392f87 | 1972 | }; |
7f78e035 | 1973 | MODULE_ALIAS_FS("fuseblk"); |
d6392f87 | 1974 | |
875d95ec MS |
1975 | static inline int register_fuseblk(void) |
1976 | { | |
1977 | return register_filesystem(&fuseblk_fs_type); | |
1978 | } | |
1979 | ||
1980 | static inline void unregister_fuseblk(void) | |
1981 | { | |
1982 | unregister_filesystem(&fuseblk_fs_type); | |
1983 | } | |
1984 | #else | |
/* Without CONFIG_BLOCK there is no "fuseblk" type: registering is a no-op. */
static inline int register_fuseblk(void)
{
	return 0;
}

/* Without CONFIG_BLOCK there is nothing to unregister. */
static inline void unregister_fuseblk(void)
{
}
1993 | #endif | |
1994 | ||
/* Slab constructor for fuse_inode_cachep: @foo is passed on as the inode. */
static void fuse_inode_init_once(void *foo)
{
	inode_init_once(foo);
}
2001 | ||
2002 | static int __init fuse_fs_init(void) | |
2003 | { | |
2004 | int err; | |
2005 | ||
d6392f87 | 2006 | fuse_inode_cachep = kmem_cache_create("fuse_inode", |
df206988 JW |
2007 | sizeof(struct fuse_inode), 0, |
2008 | SLAB_HWCACHE_ALIGN|SLAB_ACCOUNT|SLAB_RECLAIM_ACCOUNT, | |
2009 | fuse_inode_init_once); | |
d6392f87 MS |
2010 | err = -ENOMEM; |
2011 | if (!fuse_inode_cachep) | |
988f0325 AV |
2012 | goto out; |
2013 | ||
2014 | err = register_fuseblk(); | |
2015 | if (err) | |
2016 | goto out2; | |
2017 | ||
2018 | err = register_filesystem(&fuse_fs_type); | |
2019 | if (err) | |
2020 | goto out3; | |
d6392f87 MS |
2021 | |
2022 | return 0; | |
d8a5ba45 | 2023 | |
988f0325 | 2024 | out3: |
875d95ec | 2025 | unregister_fuseblk(); |
988f0325 AV |
2026 | out2: |
2027 | kmem_cache_destroy(fuse_inode_cachep); | |
d6392f87 | 2028 | out: |
d8a5ba45 MS |
2029 | return err; |
2030 | } | |
2031 | ||
2032 | static void fuse_fs_cleanup(void) | |
2033 | { | |
2034 | unregister_filesystem(&fuse_fs_type); | |
875d95ec | 2035 | unregister_fuseblk(); |
8c0a8537 KS |
2036 | |
2037 | /* | |
2038 | * Make sure all delayed rcu free inodes are flushed before we | |
2039 | * destroy cache. | |
2040 | */ | |
2041 | rcu_barrier(); | |
d8a5ba45 MS |
2042 | kmem_cache_destroy(fuse_inode_cachep); |
2043 | } | |
2044 | ||
5c89e17e | 2045 | static struct kobject *fuse_kobj; |
5c89e17e | 2046 | |
f543f253 MS |
2047 | static int fuse_sysfs_init(void) |
2048 | { | |
2049 | int err; | |
2050 | ||
00d26666 | 2051 | fuse_kobj = kobject_create_and_add("fuse", fs_kobj); |
5c89e17e GKH |
2052 | if (!fuse_kobj) { |
2053 | err = -ENOMEM; | |
f543f253 | 2054 | goto out_err; |
5c89e17e | 2055 | } |
f543f253 | 2056 | |
f9bb4882 EB |
2057 | err = sysfs_create_mount_point(fuse_kobj, "connections"); |
2058 | if (err) | |
f543f253 MS |
2059 | goto out_fuse_unregister; |
2060 | ||
2061 | return 0; | |
2062 | ||
2063 | out_fuse_unregister: | |
197b12d6 | 2064 | kobject_put(fuse_kobj); |
f543f253 MS |
2065 | out_err: |
2066 | return err; | |
2067 | } | |
2068 | ||
2069 | static void fuse_sysfs_cleanup(void) | |
2070 | { | |
f9bb4882 | 2071 | sysfs_remove_mount_point(fuse_kobj, "connections"); |
197b12d6 | 2072 | kobject_put(fuse_kobj); |
f543f253 MS |
2073 | } |
2074 | ||
d8a5ba45 MS |
2075 | static int __init fuse_init(void) |
2076 | { | |
2077 | int res; | |
2078 | ||
f2294482 KS |
2079 | pr_info("init (API version %i.%i)\n", |
2080 | FUSE_KERNEL_VERSION, FUSE_KERNEL_MINOR_VERSION); | |
d8a5ba45 | 2081 | |
bafa9654 | 2082 | INIT_LIST_HEAD(&fuse_conn_list); |
d8a5ba45 MS |
2083 | res = fuse_fs_init(); |
2084 | if (res) | |
2085 | goto err; | |
2086 | ||
334f485d MS |
2087 | res = fuse_dev_init(); |
2088 | if (res) | |
2089 | goto err_fs_cleanup; | |
2090 | ||
f543f253 MS |
2091 | res = fuse_sysfs_init(); |
2092 | if (res) | |
2093 | goto err_dev_cleanup; | |
2094 | ||
bafa9654 MS |
2095 | res = fuse_ctl_init(); |
2096 | if (res) | |
2097 | goto err_sysfs_cleanup; | |
2098 | ||
487ea5af CH |
2099 | sanitize_global_limit(&max_user_bgreq); |
2100 | sanitize_global_limit(&max_user_congthresh); | |
2101 | ||
d8a5ba45 MS |
2102 | return 0; |
2103 | ||
bafa9654 MS |
2104 | err_sysfs_cleanup: |
2105 | fuse_sysfs_cleanup(); | |
f543f253 MS |
2106 | err_dev_cleanup: |
2107 | fuse_dev_cleanup(); | |
334f485d MS |
2108 | err_fs_cleanup: |
2109 | fuse_fs_cleanup(); | |
d8a5ba45 MS |
2110 | err: |
2111 | return res; | |
2112 | } | |
2113 | ||
2114 | static void __exit fuse_exit(void) | |
2115 | { | |
f2294482 | 2116 | pr_debug("exit\n"); |
d8a5ba45 | 2117 | |
bafa9654 | 2118 | fuse_ctl_cleanup(); |
f543f253 | 2119 | fuse_sysfs_cleanup(); |
d8a5ba45 | 2120 | fuse_fs_cleanup(); |
334f485d | 2121 | fuse_dev_cleanup(); |
d8a5ba45 MS |
2122 | } |
2123 | ||
2124 | module_init(fuse_init); | |
2125 | module_exit(fuse_exit); |