mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-18 22:14:16 +00:00 
			
		
		
		
	vfs-6.16-rc1.super
-----BEGIN PGP SIGNATURE-----
 
 iHUEABYKAB0WIQRAhzRXHqcMeLMyaSiRxhvAZXjcogUCaDBPTwAKCRCRxhvAZXjc
 oi3BAQD/IBxTbAZIe7vEAsuLlBoKbWrzPGvxzd4UeMGo6OY18wEAvvyJM+arQy51
 jS0ZErDOJnPNe7jps+Gh+WDx6d3NMAY=
 =lqAG
 -----END PGP SIGNATURE-----
Merge tag 'vfs-6.16-rc1.super' of git://git.kernel.org/pub/scm/linux/kernel/git/vfs/vfs
Pull vfs freezing updates from Christian Brauner:
 "This contains various filesystem freezing related work for this cycle:
   - Allow the power subsystem to support filesystem freeze for suspend
     and hibernate.
     Now all the pieces are in place to actually allow the power
     subsystem to freeze/thaw filesystems during suspend/resume.
     Filesystems are only frozen and thawed if the power subsystem does
     actually own the freeze.
     If the filesystem is already frozen by the time we've frozen all
     userspace processes we don't care to freeze it again. That's
     userspace's job once the process resumes. We only actually freeze
     filesystems if we absolutely have to and we ignore other failures
     to freeze.
     We could bubble up errors and fail suspend/resume if the error
     isn't EBUSY (aka it's already frozen) but I don't think that this
     is worth it. Filesystem freezing during suspend/resume is
     best-effort. If the user has 500 ext4 filesystems mounted and 4
     fail to freeze for whatever reason then we simply skip them.
     What we have now is already a big improvement and let's see how we
     fare with it before making our lives even harder (and uglier) than
     we have to.
   - Allow efivarfs to support freeze and thaw
     Allow efivarfs to take part in resyncing variable state during
     system hibernation and suspend. Add freeze/thaw support.
     This is a pretty straightforward implementation. We simply add
     regular freeze/thaw support for both userspace and the kernel.
     efivarfs is the first pseudofilesystem that adds support for
     filesystem freezing and thawing.
     The simplicity comes from the fact that we simply always resync
     variable state after efivarfs has been frozen. It doesn't matter
     whether that's because of suspend, userspace initiated freeze or
     hibernation. Efivarfs is simple enough that it doesn't matter that
     we walk all dentries. There are no directories and there aren't
     insane amounts of entries and both freeze/thaw are already
     heavy-handed operations. If userspace initiated a freeze/thaw cycle
     they would need CAP_SYS_ADMIN in the initial user namespace (as
     that's where efivarfs is mounted) so it can't be triggered by
     random userspace. IOW, we really really don't care"
* tag 'vfs-6.16-rc1.super' of git://git.kernel.org/pub/scm/linux/kernel/git/vfs/vfs:
  f2fs: fix freezing filesystem during resize
  kernfs: add warning about implementing freeze/thaw
  efivarfs: support freeze/thaw
  power: freeze filesystems during suspend/resume
  libfs: export find_next_child()
  super: add filesystem freezing helpers for suspend and hibernate
  gfs2: pass through holder from the VFS for freeze/thaw
  super: use common iterator (Part 2)
  super: use a common iterator (Part 1)
  super: skip dying superblocks early
  super: simplify user_get_super()
  super: remove pointless s_root checks
  fs: allow all writers to be frozen
  locking/percpu-rwsem: add freezable alternative to down_read
			
			
This commit is contained in:
		
						commit
						8dd53535f1
					
				
					 19 changed files with 417 additions and 276 deletions
				
			
		|  | @ -17,7 +17,6 @@ struct efivarfs_fs_info { | ||||||
| 	struct efivarfs_mount_opts mount_opts; | 	struct efivarfs_mount_opts mount_opts; | ||||||
| 	struct super_block *sb; | 	struct super_block *sb; | ||||||
| 	struct notifier_block nb; | 	struct notifier_block nb; | ||||||
| 	struct notifier_block pm_nb; |  | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| struct efi_variable { | struct efi_variable { | ||||||
|  |  | ||||||
|  | @ -21,6 +21,7 @@ | ||||||
| #include <linux/namei.h> | #include <linux/namei.h> | ||||||
| 
 | 
 | ||||||
| #include "internal.h" | #include "internal.h" | ||||||
|  | #include "../internal.h" | ||||||
| 
 | 
 | ||||||
| static int efivarfs_ops_notifier(struct notifier_block *nb, unsigned long event, | static int efivarfs_ops_notifier(struct notifier_block *nb, unsigned long event, | ||||||
| 				 void *data) | 				 void *data) | ||||||
|  | @ -120,12 +121,18 @@ static int efivarfs_statfs(struct dentry *dentry, struct kstatfs *buf) | ||||||
| 
 | 
 | ||||||
| 	return 0; | 	return 0; | ||||||
| } | } | ||||||
|  | 
 | ||||||
|  | static int efivarfs_freeze_fs(struct super_block *sb); | ||||||
|  | static int efivarfs_unfreeze_fs(struct super_block *sb); | ||||||
|  | 
 | ||||||
| static const struct super_operations efivarfs_ops = { | static const struct super_operations efivarfs_ops = { | ||||||
| 	.statfs = efivarfs_statfs, | 	.statfs = efivarfs_statfs, | ||||||
| 	.drop_inode = generic_delete_inode, | 	.drop_inode = generic_delete_inode, | ||||||
| 	.alloc_inode = efivarfs_alloc_inode, | 	.alloc_inode = efivarfs_alloc_inode, | ||||||
| 	.free_inode = efivarfs_free_inode, | 	.free_inode = efivarfs_free_inode, | ||||||
| 	.show_options = efivarfs_show_options, | 	.show_options = efivarfs_show_options, | ||||||
|  | 	.freeze_fs = efivarfs_freeze_fs, | ||||||
|  | 	.unfreeze_fs = efivarfs_unfreeze_fs, | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| /*
 | /*
 | ||||||
|  | @ -365,8 +372,6 @@ static int efivarfs_fill_super(struct super_block *sb, struct fs_context *fc) | ||||||
| 	if (err) | 	if (err) | ||||||
| 		return err; | 		return err; | ||||||
| 
 | 
 | ||||||
| 	register_pm_notifier(&sfi->pm_nb); |  | ||||||
| 
 |  | ||||||
| 	return efivar_init(efivarfs_callback, sb, true); | 	return efivar_init(efivarfs_callback, sb, true); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | @ -391,48 +396,6 @@ static const struct fs_context_operations efivarfs_context_ops = { | ||||||
| 	.reconfigure	= efivarfs_reconfigure, | 	.reconfigure	= efivarfs_reconfigure, | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| struct efivarfs_ctx { |  | ||||||
| 	struct dir_context ctx; |  | ||||||
| 	struct super_block *sb; |  | ||||||
| 	struct dentry *dentry; |  | ||||||
| }; |  | ||||||
| 
 |  | ||||||
| static bool efivarfs_actor(struct dir_context *ctx, const char *name, int len, |  | ||||||
| 			   loff_t offset, u64 ino, unsigned mode) |  | ||||||
| { |  | ||||||
| 	unsigned long size; |  | ||||||
| 	struct efivarfs_ctx *ectx = container_of(ctx, struct efivarfs_ctx, ctx); |  | ||||||
| 	struct dentry *dentry = try_lookup_noperm(&QSTR_LEN(name, len), |  | ||||||
| 						  ectx->sb->s_root); |  | ||||||
| 	struct inode *inode; |  | ||||||
| 	struct efivar_entry *entry; |  | ||||||
| 	int err; |  | ||||||
| 
 |  | ||||||
| 	if (IS_ERR_OR_NULL(dentry)) |  | ||||||
| 		return true; |  | ||||||
| 
 |  | ||||||
| 	inode = d_inode(dentry); |  | ||||||
| 	entry = efivar_entry(inode); |  | ||||||
| 
 |  | ||||||
| 	err = efivar_entry_size(entry, &size); |  | ||||||
| 	size += sizeof(__u32);	/* attributes */ |  | ||||||
| 	if (err) |  | ||||||
| 		size = 0; |  | ||||||
| 
 |  | ||||||
| 	inode_lock_nested(inode, I_MUTEX_CHILD); |  | ||||||
| 	i_size_write(inode, size); |  | ||||||
| 	inode_unlock(inode); |  | ||||||
| 
 |  | ||||||
| 	if (!size) { |  | ||||||
| 		ectx->dentry = dentry; |  | ||||||
| 		return false; |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	dput(dentry); |  | ||||||
| 
 |  | ||||||
| 	return true; |  | ||||||
| } |  | ||||||
| 
 |  | ||||||
| static int efivarfs_check_missing(efi_char16_t *name16, efi_guid_t vendor, | static int efivarfs_check_missing(efi_char16_t *name16, efi_guid_t vendor, | ||||||
| 				  unsigned long name_size, void *data) | 				  unsigned long name_size, void *data) | ||||||
| { | { | ||||||
|  | @ -469,111 +432,59 @@ static int efivarfs_check_missing(efi_char16_t *name16, efi_guid_t vendor, | ||||||
| 	return err; | 	return err; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static void efivarfs_deactivate_super_work(struct work_struct *work) |  | ||||||
| { |  | ||||||
| 	struct super_block *s = container_of(work, struct super_block, |  | ||||||
| 					     destroy_work); |  | ||||||
| 	/*
 |  | ||||||
| 	 * note: here s->destroy_work is free for reuse (which |  | ||||||
| 	 * will happen in deactivate_super) |  | ||||||
| 	 */ |  | ||||||
| 	deactivate_super(s); |  | ||||||
| } |  | ||||||
| 
 |  | ||||||
| static struct file_system_type efivarfs_type; | static struct file_system_type efivarfs_type; | ||||||
| 
 | 
 | ||||||
| static int efivarfs_pm_notify(struct notifier_block *nb, unsigned long action, | static int efivarfs_freeze_fs(struct super_block *sb) | ||||||
| 			      void *ptr) |  | ||||||
| { | { | ||||||
| 	struct efivarfs_fs_info *sfi = container_of(nb, struct efivarfs_fs_info, | 	/* Nothing for us to do. */ | ||||||
| 						    pm_nb); | 	return 0; | ||||||
| 	struct path path; | } | ||||||
| 	struct efivarfs_ctx ectx = { |  | ||||||
| 		.ctx = { |  | ||||||
| 			.actor	= efivarfs_actor, |  | ||||||
| 		}, |  | ||||||
| 		.sb = sfi->sb, |  | ||||||
| 	}; |  | ||||||
| 	struct file *file; |  | ||||||
| 	struct super_block *s = sfi->sb; |  | ||||||
| 	static bool rescan_done = true; |  | ||||||
| 
 | 
 | ||||||
| 	if (action == PM_HIBERNATION_PREPARE) { | static int efivarfs_unfreeze_fs(struct super_block *sb) | ||||||
| 		rescan_done = false; | { | ||||||
| 		return NOTIFY_OK; | 	struct dentry *child = NULL; | ||||||
| 	} else if (action != PM_POST_HIBERNATION) { |  | ||||||
| 		return NOTIFY_DONE; |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	if (rescan_done) |  | ||||||
| 		return NOTIFY_DONE; |  | ||||||
| 
 |  | ||||||
| 	/* ensure single superblock is alive and pin it */ |  | ||||||
| 	if (!atomic_inc_not_zero(&s->s_active)) |  | ||||||
| 		return NOTIFY_DONE; |  | ||||||
| 
 | 
 | ||||||
|  | 	/*
 | ||||||
|  | 	 * Unconditionally resync the variable state on a thaw request. | ||||||
|  | 	 * Given the size of efivarfs it really doesn't matter to simply | ||||||
|  | 	 * iterate through all of the entries and resync. Freeze/thaw | ||||||
|  | 	 * requests are rare enough for that to not matter and the | ||||||
|  | 	 * number of entries is pretty low too. So we really don't care. | ||||||
|  | 	 */ | ||||||
| 	pr_info("efivarfs: resyncing variable state\n"); | 	pr_info("efivarfs: resyncing variable state\n"); | ||||||
|  | 	for (;;) { | ||||||
|  | 		int err; | ||||||
|  | 		unsigned long size = 0; | ||||||
|  | 		struct inode *inode; | ||||||
|  | 		struct efivar_entry *entry; | ||||||
| 
 | 
 | ||||||
| 	path.dentry = sfi->sb->s_root; | 		child = find_next_child(sb->s_root, child); | ||||||
|  | 		if (!child) | ||||||
|  | 			break; | ||||||
| 
 | 
 | ||||||
| 	/*
 | 		inode = d_inode(child); | ||||||
| 	 * do not add SB_KERNMOUNT which a single superblock could | 		entry = efivar_entry(inode); | ||||||
| 	 * expose to userspace and which also causes MNT_INTERNAL, see | 
 | ||||||
| 	 * below | 		err = efivar_entry_size(entry, &size); | ||||||
| 	 */ | 		if (err) | ||||||
| 	path.mnt = vfs_kern_mount(&efivarfs_type, 0, | 			size = 0; | ||||||
| 				  efivarfs_type.name, NULL); | 		else | ||||||
| 	if (IS_ERR(path.mnt)) { | 			size += sizeof(__u32); | ||||||
| 		pr_err("efivarfs: internal mount failed\n"); | 
 | ||||||
| 		/*
 | 		inode_lock(inode); | ||||||
| 		 * We may be the last pinner of the superblock but | 		i_size_write(inode, size); | ||||||
| 		 * calling efivarfs_kill_sb from within the notifier | 		inode_unlock(inode); | ||||||
| 		 * here would deadlock trying to unregister it | 
 | ||||||
| 		 */ | 		/* The variable doesn't exist anymore, delete it. */ | ||||||
| 		INIT_WORK(&s->destroy_work, efivarfs_deactivate_super_work); | 		if (!size) { | ||||||
| 		schedule_work(&s->destroy_work); | 			pr_info("efivarfs: removing variable %pd\n", child); | ||||||
| 		return PTR_ERR(path.mnt); | 			simple_recursive_removal(child, NULL); | ||||||
|  | 		} | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	/* path.mnt now has pin on superblock, so this must be above one */ | 	efivar_init(efivarfs_check_missing, sb, false); | ||||||
| 	atomic_dec(&s->s_active); | 	pr_info("efivarfs: finished resyncing variable state\n"); | ||||||
| 
 | 	return 0; | ||||||
| 	file = kernel_file_open(&path, O_RDONLY | O_DIRECTORY | O_NOATIME, |  | ||||||
| 				current_cred()); |  | ||||||
| 	/*
 |  | ||||||
| 	 * safe even if last put because no MNT_INTERNAL means this |  | ||||||
| 	 * will do delayed deactivate_super and not deadlock |  | ||||||
| 	 */ |  | ||||||
| 	mntput(path.mnt); |  | ||||||
| 	if (IS_ERR(file)) |  | ||||||
| 		return NOTIFY_DONE; |  | ||||||
| 
 |  | ||||||
| 	rescan_done = true; |  | ||||||
| 
 |  | ||||||
| 	/*
 |  | ||||||
| 	 * First loop over the directory and verify each entry exists, |  | ||||||
| 	 * removing it if it doesn't |  | ||||||
| 	 */ |  | ||||||
| 	file->f_pos = 2;	/* skip . and .. */ |  | ||||||
| 	do { |  | ||||||
| 		ectx.dentry = NULL; |  | ||||||
| 		iterate_dir(file, &ectx.ctx); |  | ||||||
| 		if (ectx.dentry) { |  | ||||||
| 			pr_info("efivarfs: removing variable %pd\n", |  | ||||||
| 				ectx.dentry); |  | ||||||
| 			simple_recursive_removal(ectx.dentry, NULL); |  | ||||||
| 			dput(ectx.dentry); |  | ||||||
| 		} |  | ||||||
| 	} while (ectx.dentry); |  | ||||||
| 	fput(file); |  | ||||||
| 
 |  | ||||||
| 	/*
 |  | ||||||
| 	 * then loop over variables, creating them if there's no matching |  | ||||||
| 	 * dentry |  | ||||||
| 	 */ |  | ||||||
| 	efivar_init(efivarfs_check_missing, sfi->sb, false); |  | ||||||
| 
 |  | ||||||
| 	return NOTIFY_OK; |  | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static int efivarfs_init_fs_context(struct fs_context *fc) | static int efivarfs_init_fs_context(struct fs_context *fc) | ||||||
|  | @ -593,9 +504,6 @@ static int efivarfs_init_fs_context(struct fs_context *fc) | ||||||
| 	fc->s_fs_info = sfi; | 	fc->s_fs_info = sfi; | ||||||
| 	fc->ops = &efivarfs_context_ops; | 	fc->ops = &efivarfs_context_ops; | ||||||
| 
 | 
 | ||||||
| 	sfi->pm_nb.notifier_call = efivarfs_pm_notify; |  | ||||||
| 	sfi->pm_nb.priority = 0; |  | ||||||
| 
 |  | ||||||
| 	return 0; | 	return 0; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | @ -605,7 +513,6 @@ static void efivarfs_kill_sb(struct super_block *sb) | ||||||
| 
 | 
 | ||||||
| 	blocking_notifier_chain_unregister(&efivar_ops_nh, &sfi->nb); | 	blocking_notifier_chain_unregister(&efivar_ops_nh, &sfi->nb); | ||||||
| 	kill_litter_super(sb); | 	kill_litter_super(sb); | ||||||
| 	unregister_pm_notifier(&sfi->pm_nb); |  | ||||||
| 
 | 
 | ||||||
| 	kfree(sfi); | 	kfree(sfi); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | @ -2271,12 +2271,12 @@ out_drop_write: | ||||||
| 	if (err) | 	if (err) | ||||||
| 		return err; | 		return err; | ||||||
| 
 | 
 | ||||||
| 	err = freeze_super(sbi->sb, FREEZE_HOLDER_USERSPACE); | 	err = freeze_super(sbi->sb, FREEZE_HOLDER_KERNEL, NULL); | ||||||
| 	if (err) | 	if (err) | ||||||
| 		return err; | 		return err; | ||||||
| 
 | 
 | ||||||
| 	if (f2fs_readonly(sbi->sb)) { | 	if (f2fs_readonly(sbi->sb)) { | ||||||
| 		err = thaw_super(sbi->sb, FREEZE_HOLDER_USERSPACE); | 		err = thaw_super(sbi->sb, FREEZE_HOLDER_KERNEL, NULL); | ||||||
| 		if (err) | 		if (err) | ||||||
| 			return err; | 			return err; | ||||||
| 		return -EROFS; | 		return -EROFS; | ||||||
|  | @ -2333,6 +2333,6 @@ recover_out: | ||||||
| out_err: | out_err: | ||||||
| 	f2fs_up_write(&sbi->cp_global_sem); | 	f2fs_up_write(&sbi->cp_global_sem); | ||||||
| 	f2fs_up_write(&sbi->gc_lock); | 	f2fs_up_write(&sbi->gc_lock); | ||||||
| 	thaw_super(sbi->sb, FREEZE_HOLDER_USERSPACE); | 	thaw_super(sbi->sb, FREEZE_HOLDER_KERNEL, NULL); | ||||||
| 	return err; | 	return err; | ||||||
| } | } | ||||||
|  |  | ||||||
|  | @ -674,7 +674,7 @@ static int gfs2_sync_fs(struct super_block *sb, int wait) | ||||||
| 	return sdp->sd_log_error; | 	return sdp->sd_log_error; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static int gfs2_do_thaw(struct gfs2_sbd *sdp) | static int gfs2_do_thaw(struct gfs2_sbd *sdp, enum freeze_holder who, const void *freeze_owner) | ||||||
| { | { | ||||||
| 	struct super_block *sb = sdp->sd_vfs; | 	struct super_block *sb = sdp->sd_vfs; | ||||||
| 	int error; | 	int error; | ||||||
|  | @ -682,7 +682,7 @@ static int gfs2_do_thaw(struct gfs2_sbd *sdp) | ||||||
| 	error = gfs2_freeze_lock_shared(sdp); | 	error = gfs2_freeze_lock_shared(sdp); | ||||||
| 	if (error) | 	if (error) | ||||||
| 		goto fail; | 		goto fail; | ||||||
| 	error = thaw_super(sb, FREEZE_HOLDER_USERSPACE); | 	error = thaw_super(sb, who, freeze_owner); | ||||||
| 	if (!error) | 	if (!error) | ||||||
| 		return 0; | 		return 0; | ||||||
| 
 | 
 | ||||||
|  | @ -703,14 +703,14 @@ void gfs2_freeze_func(struct work_struct *work) | ||||||
| 	if (test_bit(SDF_FROZEN, &sdp->sd_flags)) | 	if (test_bit(SDF_FROZEN, &sdp->sd_flags)) | ||||||
| 		goto freeze_failed; | 		goto freeze_failed; | ||||||
| 
 | 
 | ||||||
| 	error = freeze_super(sb, FREEZE_HOLDER_USERSPACE); | 	error = freeze_super(sb, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	if (error) | 	if (error) | ||||||
| 		goto freeze_failed; | 		goto freeze_failed; | ||||||
| 
 | 
 | ||||||
| 	gfs2_freeze_unlock(sdp); | 	gfs2_freeze_unlock(sdp); | ||||||
| 	set_bit(SDF_FROZEN, &sdp->sd_flags); | 	set_bit(SDF_FROZEN, &sdp->sd_flags); | ||||||
| 
 | 
 | ||||||
| 	error = gfs2_do_thaw(sdp); | 	error = gfs2_do_thaw(sdp, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	if (error) | 	if (error) | ||||||
| 		goto out; | 		goto out; | ||||||
| 
 | 
 | ||||||
|  | @ -728,10 +728,13 @@ out: | ||||||
| /**
 | /**
 | ||||||
|  * gfs2_freeze_super - prevent further writes to the filesystem |  * gfs2_freeze_super - prevent further writes to the filesystem | ||||||
|  * @sb: the VFS structure for the filesystem |  * @sb: the VFS structure for the filesystem | ||||||
|  |  * @who: freeze flags | ||||||
|  |  * @freeze_owner: owner of the freeze | ||||||
|  * |  * | ||||||
|  */ |  */ | ||||||
| 
 | 
 | ||||||
| static int gfs2_freeze_super(struct super_block *sb, enum freeze_holder who) | static int gfs2_freeze_super(struct super_block *sb, enum freeze_holder who, | ||||||
|  | 			     const void *freeze_owner) | ||||||
| { | { | ||||||
| 	struct gfs2_sbd *sdp = sb->s_fs_info; | 	struct gfs2_sbd *sdp = sb->s_fs_info; | ||||||
| 	int error; | 	int error; | ||||||
|  | @ -744,7 +747,7 @@ static int gfs2_freeze_super(struct super_block *sb, enum freeze_holder who) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	for (;;) { | 	for (;;) { | ||||||
| 		error = freeze_super(sb, FREEZE_HOLDER_USERSPACE); | 		error = freeze_super(sb, who, freeze_owner); | ||||||
| 		if (error) { | 		if (error) { | ||||||
| 			fs_info(sdp, "GFS2: couldn't freeze filesystem: %d\n", | 			fs_info(sdp, "GFS2: couldn't freeze filesystem: %d\n", | ||||||
| 				error); | 				error); | ||||||
|  | @ -758,7 +761,7 @@ static int gfs2_freeze_super(struct super_block *sb, enum freeze_holder who) | ||||||
| 			break; | 			break; | ||||||
| 		} | 		} | ||||||
| 
 | 
 | ||||||
| 		error = gfs2_do_thaw(sdp); | 		error = gfs2_do_thaw(sdp, who, freeze_owner); | ||||||
| 		if (error) | 		if (error) | ||||||
| 			goto out; | 			goto out; | ||||||
| 
 | 
 | ||||||
|  | @ -796,10 +799,13 @@ static int gfs2_freeze_fs(struct super_block *sb) | ||||||
| /**
 | /**
 | ||||||
|  * gfs2_thaw_super - reallow writes to the filesystem |  * gfs2_thaw_super - reallow writes to the filesystem | ||||||
|  * @sb: the VFS structure for the filesystem |  * @sb: the VFS structure for the filesystem | ||||||
|  |  * @who: freeze flags | ||||||
|  |  * @freeze_owner: owner of the freeze | ||||||
|  * |  * | ||||||
|  */ |  */ | ||||||
| 
 | 
 | ||||||
| static int gfs2_thaw_super(struct super_block *sb, enum freeze_holder who) | static int gfs2_thaw_super(struct super_block *sb, enum freeze_holder who, | ||||||
|  | 			   const void *freeze_owner) | ||||||
| { | { | ||||||
| 	struct gfs2_sbd *sdp = sb->s_fs_info; | 	struct gfs2_sbd *sdp = sb->s_fs_info; | ||||||
| 	int error; | 	int error; | ||||||
|  | @ -814,7 +820,7 @@ static int gfs2_thaw_super(struct super_block *sb, enum freeze_holder who) | ||||||
| 	atomic_inc(&sb->s_active); | 	atomic_inc(&sb->s_active); | ||||||
| 	gfs2_freeze_unlock(sdp); | 	gfs2_freeze_unlock(sdp); | ||||||
| 
 | 
 | ||||||
| 	error = gfs2_do_thaw(sdp); | 	error = gfs2_do_thaw(sdp, who, freeze_owner); | ||||||
| 
 | 
 | ||||||
| 	if (!error) { | 	if (!error) { | ||||||
| 		clear_bit(SDF_FREEZE_INITIATOR, &sdp->sd_flags); | 		clear_bit(SDF_FREEZE_INITIATOR, &sdp->sd_flags); | ||||||
|  |  | ||||||
|  | @ -174,10 +174,10 @@ static ssize_t freeze_store(struct gfs2_sbd *sdp, const char *buf, size_t len) | ||||||
| 
 | 
 | ||||||
| 	switch (n) { | 	switch (n) { | ||||||
| 	case 0: | 	case 0: | ||||||
| 		error = thaw_super(sdp->sd_vfs, FREEZE_HOLDER_USERSPACE); | 		error = thaw_super(sdp->sd_vfs, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 		break; | 		break; | ||||||
| 	case 1: | 	case 1: | ||||||
| 		error = freeze_super(sdp->sd_vfs, FREEZE_HOLDER_USERSPACE); | 		error = freeze_super(sdp->sd_vfs, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 		break; | 		break; | ||||||
| 	default: | 	default: | ||||||
| 		return -EINVAL; | 		return -EINVAL; | ||||||
|  |  | ||||||
|  | @ -344,6 +344,7 @@ static inline bool path_mounted(const struct path *path) | ||||||
| void file_f_owner_release(struct file *file); | void file_f_owner_release(struct file *file); | ||||||
| bool file_seek_cur_needs_f_lock(struct file *file); | bool file_seek_cur_needs_f_lock(struct file *file); | ||||||
| int statmount_mnt_idmap(struct mnt_idmap *idmap, struct seq_file *seq, bool uid_map); | int statmount_mnt_idmap(struct mnt_idmap *idmap, struct seq_file *seq, bool uid_map); | ||||||
|  | struct dentry *find_next_child(struct dentry *parent, struct dentry *prev); | ||||||
| int anon_inode_getattr(struct mnt_idmap *idmap, const struct path *path, | int anon_inode_getattr(struct mnt_idmap *idmap, const struct path *path, | ||||||
| 		       struct kstat *stat, u32 request_mask, | 		       struct kstat *stat, u32 request_mask, | ||||||
| 		       unsigned int query_flags); | 		       unsigned int query_flags); | ||||||
|  |  | ||||||
|  | @ -396,8 +396,8 @@ static int ioctl_fsfreeze(struct file *filp) | ||||||
| 
 | 
 | ||||||
| 	/* Freeze */ | 	/* Freeze */ | ||||||
| 	if (sb->s_op->freeze_super) | 	if (sb->s_op->freeze_super) | ||||||
| 		return sb->s_op->freeze_super(sb, FREEZE_HOLDER_USERSPACE); | 		return sb->s_op->freeze_super(sb, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	return freeze_super(sb, FREEZE_HOLDER_USERSPACE); | 	return freeze_super(sb, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static int ioctl_fsthaw(struct file *filp) | static int ioctl_fsthaw(struct file *filp) | ||||||
|  | @ -409,8 +409,8 @@ static int ioctl_fsthaw(struct file *filp) | ||||||
| 
 | 
 | ||||||
| 	/* Thaw */ | 	/* Thaw */ | ||||||
| 	if (sb->s_op->thaw_super) | 	if (sb->s_op->thaw_super) | ||||||
| 		return sb->s_op->thaw_super(sb, FREEZE_HOLDER_USERSPACE); | 		return sb->s_op->thaw_super(sb, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	return thaw_super(sb, FREEZE_HOLDER_USERSPACE); | 	return thaw_super(sb, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static int ioctl_file_dedupe_range(struct file *file, | static int ioctl_file_dedupe_range(struct file *file, | ||||||
|  |  | ||||||
|  | @ -62,6 +62,21 @@ const struct super_operations kernfs_sops = { | ||||||
| 
 | 
 | ||||||
| 	.show_options	= kernfs_sop_show_options, | 	.show_options	= kernfs_sop_show_options, | ||||||
| 	.show_path	= kernfs_sop_show_path, | 	.show_path	= kernfs_sop_show_path, | ||||||
|  | 
 | ||||||
|  | 	/*
 | ||||||
|  | 	 * sysfs is built on top of kernfs and sysfs provides the power | ||||||
|  | 	 * management infrastructure to support suspend/hibernate by | ||||||
|  | 	 * writing to various files in /sys/power/. As filesystems may | ||||||
|  | 	 * be automatically frozen during suspend/hibernate implementing | ||||||
|  | 	 * freeze/thaw support for kernfs generically will cause | ||||||
|  | 	 * deadlocks as the suspending/hibernation initiating task will | ||||||
|  | 	 * hold a VFS lock that it will then wait upon to be released. | ||||||
|  | 	 * If freeze/thaw for kernfs is needed talk to the VFS. | ||||||
|  | 	 */ | ||||||
|  | 	.freeze_fs	= NULL, | ||||||
|  | 	.unfreeze_fs	= NULL, | ||||||
|  | 	.freeze_super	= NULL, | ||||||
|  | 	.thaw_super	= NULL, | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| static int kernfs_encode_fh(struct inode *inode, __u32 *fh, int *max_len, | static int kernfs_encode_fh(struct inode *inode, __u32 *fh, int *max_len, | ||||||
|  |  | ||||||
|  | @ -583,7 +583,7 @@ const struct file_operations simple_offset_dir_operations = { | ||||||
| 	.fsync		= noop_fsync, | 	.fsync		= noop_fsync, | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| static struct dentry *find_next_child(struct dentry *parent, struct dentry *prev) | struct dentry *find_next_child(struct dentry *parent, struct dentry *prev) | ||||||
| { | { | ||||||
| 	struct dentry *child = NULL, *d; | 	struct dentry *child = NULL, *d; | ||||||
| 
 | 
 | ||||||
|  | @ -603,6 +603,7 @@ static struct dentry *find_next_child(struct dentry *parent, struct dentry *prev | ||||||
| 	dput(prev); | 	dput(prev); | ||||||
| 	return child; | 	return child; | ||||||
| } | } | ||||||
|  | EXPORT_SYMBOL(find_next_child); | ||||||
| 
 | 
 | ||||||
| void simple_recursive_removal(struct dentry *dentry, | void simple_recursive_removal(struct dentry *dentry, | ||||||
|                               void (*callback)(struct dentry *)) |                               void (*callback)(struct dentry *)) | ||||||
|  |  | ||||||
							
								
								
									
										318
									
								
								fs/super.c
									
										
									
									
									
								
							
							
						
						
									
										318
									
								
								fs/super.c
									
										
									
									
									
								
							|  | @ -39,7 +39,8 @@ | ||||||
| #include <uapi/linux/mount.h> | #include <uapi/linux/mount.h> | ||||||
| #include "internal.h" | #include "internal.h" | ||||||
| 
 | 
 | ||||||
| static int thaw_super_locked(struct super_block *sb, enum freeze_holder who); | static int thaw_super_locked(struct super_block *sb, enum freeze_holder who, | ||||||
|  | 			     const void *freeze_owner); | ||||||
| 
 | 
 | ||||||
| static LIST_HEAD(super_blocks); | static LIST_HEAD(super_blocks); | ||||||
| static DEFINE_SPINLOCK(sb_lock); | static DEFINE_SPINLOCK(sb_lock); | ||||||
|  | @ -887,52 +888,48 @@ void drop_super_exclusive(struct super_block *sb) | ||||||
| } | } | ||||||
| EXPORT_SYMBOL(drop_super_exclusive); | EXPORT_SYMBOL(drop_super_exclusive); | ||||||
| 
 | 
 | ||||||
| static void __iterate_supers(void (*f)(struct super_block *)) | enum super_iter_flags_t { | ||||||
|  | 	SUPER_ITER_EXCL		= (1U << 0), | ||||||
|  | 	SUPER_ITER_UNLOCKED	= (1U << 1), | ||||||
|  | 	SUPER_ITER_REVERSE	= (1U << 2), | ||||||
|  | }; | ||||||
|  | 
 | ||||||
|  | static inline struct super_block *first_super(enum super_iter_flags_t flags) | ||||||
|  | { | ||||||
|  | 	if (flags & SUPER_ITER_REVERSE) | ||||||
|  | 		return list_last_entry(&super_blocks, struct super_block, s_list); | ||||||
|  | 	return list_first_entry(&super_blocks, struct super_block, s_list); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | static inline struct super_block *next_super(struct super_block *sb, | ||||||
|  | 					     enum super_iter_flags_t flags) | ||||||
|  | { | ||||||
|  | 	if (flags & SUPER_ITER_REVERSE) | ||||||
|  | 		return list_prev_entry(sb, s_list); | ||||||
|  | 	return list_next_entry(sb, s_list); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | static void __iterate_supers(void (*f)(struct super_block *, void *), void *arg, | ||||||
|  | 			     enum super_iter_flags_t flags) | ||||||
| { | { | ||||||
| 	struct super_block *sb, *p = NULL; | 	struct super_block *sb, *p = NULL; | ||||||
|  | 	bool excl = flags & SUPER_ITER_EXCL; | ||||||
| 
 | 
 | ||||||
| 	spin_lock(&sb_lock); | 	guard(spinlock)(&sb_lock); | ||||||
| 	list_for_each_entry(sb, &super_blocks, s_list) { | 
 | ||||||
|  | 	for (sb = first_super(flags); | ||||||
|  | 	     !list_entry_is_head(sb, &super_blocks, s_list); | ||||||
|  | 	     sb = next_super(sb, flags)) { | ||||||
| 		if (super_flags(sb, SB_DYING)) | 		if (super_flags(sb, SB_DYING)) | ||||||
| 			continue; | 			continue; | ||||||
| 		sb->s_count++; | 		sb->s_count++; | ||||||
| 		spin_unlock(&sb_lock); | 		spin_unlock(&sb_lock); | ||||||
| 
 | 
 | ||||||
| 		f(sb); | 		if (flags & SUPER_ITER_UNLOCKED) { | ||||||
| 
 | 			f(sb, arg); | ||||||
| 		spin_lock(&sb_lock); | 		} else if (super_lock(sb, excl)) { | ||||||
| 		if (p) | 			f(sb, arg); | ||||||
| 			__put_super(p); | 			super_unlock(sb, excl); | ||||||
| 		p = sb; |  | ||||||
| 	} |  | ||||||
| 	if (p) |  | ||||||
| 		__put_super(p); |  | ||||||
| 	spin_unlock(&sb_lock); |  | ||||||
| } |  | ||||||
| /**
 |  | ||||||
|  *	iterate_supers - call function for all active superblocks |  | ||||||
|  *	@f: function to call |  | ||||||
|  *	@arg: argument to pass to it |  | ||||||
|  * |  | ||||||
|  *	Scans the superblock list and calls given function, passing it |  | ||||||
|  *	locked superblock and given argument. |  | ||||||
|  */ |  | ||||||
| void iterate_supers(void (*f)(struct super_block *, void *), void *arg) |  | ||||||
| { |  | ||||||
| 	struct super_block *sb, *p = NULL; |  | ||||||
| 
 |  | ||||||
| 	spin_lock(&sb_lock); |  | ||||||
| 	list_for_each_entry(sb, &super_blocks, s_list) { |  | ||||||
| 		bool locked; |  | ||||||
| 
 |  | ||||||
| 		sb->s_count++; |  | ||||||
| 		spin_unlock(&sb_lock); |  | ||||||
| 
 |  | ||||||
| 		locked = super_lock_shared(sb); |  | ||||||
| 		if (locked) { |  | ||||||
| 			if (sb->s_root) |  | ||||||
| 				f(sb, arg); |  | ||||||
| 			super_unlock_shared(sb); |  | ||||||
| 		} | 		} | ||||||
| 
 | 
 | ||||||
| 		spin_lock(&sb_lock); | 		spin_lock(&sb_lock); | ||||||
|  | @ -942,7 +939,11 @@ void iterate_supers(void (*f)(struct super_block *, void *), void *arg) | ||||||
| 	} | 	} | ||||||
| 	if (p) | 	if (p) | ||||||
| 		__put_super(p); | 		__put_super(p); | ||||||
| 	spin_unlock(&sb_lock); | } | ||||||
|  | 
 | ||||||
|  | void iterate_supers(void (*f)(struct super_block *, void *), void *arg) | ||||||
|  | { | ||||||
|  | 	__iterate_supers(f, arg, 0); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| /**
 | /**
 | ||||||
|  | @ -963,15 +964,15 @@ void iterate_supers_type(struct file_system_type *type, | ||||||
| 	hlist_for_each_entry(sb, &type->fs_supers, s_instances) { | 	hlist_for_each_entry(sb, &type->fs_supers, s_instances) { | ||||||
| 		bool locked; | 		bool locked; | ||||||
| 
 | 
 | ||||||
|  | 		if (super_flags(sb, SB_DYING)) | ||||||
|  | 			continue; | ||||||
|  | 
 | ||||||
| 		sb->s_count++; | 		sb->s_count++; | ||||||
| 		spin_unlock(&sb_lock); | 		spin_unlock(&sb_lock); | ||||||
| 
 | 
 | ||||||
| 		locked = super_lock_shared(sb); | 		locked = super_lock_shared(sb); | ||||||
| 		if (locked) { | 		if (locked) | ||||||
| 			if (sb->s_root) | 			f(sb, arg); | ||||||
| 				f(sb, arg); |  | ||||||
| 			super_unlock_shared(sb); |  | ||||||
| 		} |  | ||||||
| 
 | 
 | ||||||
| 		spin_lock(&sb_lock); | 		spin_lock(&sb_lock); | ||||||
| 		if (p) | 		if (p) | ||||||
|  | @ -991,23 +992,21 @@ struct super_block *user_get_super(dev_t dev, bool excl) | ||||||
| 
 | 
 | ||||||
| 	spin_lock(&sb_lock); | 	spin_lock(&sb_lock); | ||||||
| 	list_for_each_entry(sb, &super_blocks, s_list) { | 	list_for_each_entry(sb, &super_blocks, s_list) { | ||||||
| 		if (sb->s_dev ==  dev) { | 		bool locked; | ||||||
| 			bool locked; |  | ||||||
| 
 | 
 | ||||||
| 			sb->s_count++; | 		if (sb->s_dev != dev) | ||||||
| 			spin_unlock(&sb_lock); | 			continue; | ||||||
| 			/* still alive? */ | 
 | ||||||
| 			locked = super_lock(sb, excl); | 		sb->s_count++; | ||||||
| 			if (locked) { | 		spin_unlock(&sb_lock); | ||||||
| 				if (sb->s_root) | 
 | ||||||
| 					return sb; | 		locked = super_lock(sb, excl); | ||||||
| 				super_unlock(sb, excl); | 		if (locked) | ||||||
| 			} | 			return sb; | ||||||
| 			/* nope, got unmounted */ | 
 | ||||||
| 			spin_lock(&sb_lock); | 		spin_lock(&sb_lock); | ||||||
| 			__put_super(sb); | 		__put_super(sb); | ||||||
| 			break; | 		break; | ||||||
| 		} |  | ||||||
| 	} | 	} | ||||||
| 	spin_unlock(&sb_lock); | 	spin_unlock(&sb_lock); | ||||||
| 	return NULL; | 	return NULL; | ||||||
|  | @ -1111,11 +1110,9 @@ cancel_readonly: | ||||||
| 	return retval; | 	return retval; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static void do_emergency_remount_callback(struct super_block *sb) | static void do_emergency_remount_callback(struct super_block *sb, void *unused) | ||||||
| { | { | ||||||
| 	bool locked = super_lock_excl(sb); | 	if (sb->s_bdev && !sb_rdonly(sb)) { | ||||||
| 
 |  | ||||||
| 	if (locked && sb->s_root && sb->s_bdev && !sb_rdonly(sb)) { |  | ||||||
| 		struct fs_context *fc; | 		struct fs_context *fc; | ||||||
| 
 | 
 | ||||||
| 		fc = fs_context_for_reconfigure(sb->s_root, | 		fc = fs_context_for_reconfigure(sb->s_root, | ||||||
|  | @ -1126,13 +1123,12 @@ static void do_emergency_remount_callback(struct super_block *sb) | ||||||
| 			put_fs_context(fc); | 			put_fs_context(fc); | ||||||
| 		} | 		} | ||||||
| 	} | 	} | ||||||
| 	if (locked) |  | ||||||
| 		super_unlock_excl(sb); |  | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static void do_emergency_remount(struct work_struct *work) | static void do_emergency_remount(struct work_struct *work) | ||||||
| { | { | ||||||
| 	__iterate_supers(do_emergency_remount_callback); | 	__iterate_supers(do_emergency_remount_callback, NULL, | ||||||
|  | 			 SUPER_ITER_EXCL | SUPER_ITER_REVERSE); | ||||||
| 	kfree(work); | 	kfree(work); | ||||||
| 	printk("Emergency Remount complete\n"); | 	printk("Emergency Remount complete\n"); | ||||||
| } | } | ||||||
|  | @ -1148,24 +1144,18 @@ void emergency_remount(void) | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static void do_thaw_all_callback(struct super_block *sb) | static void do_thaw_all_callback(struct super_block *sb, void *unused) | ||||||
| { | { | ||||||
| 	bool locked = super_lock_excl(sb); | 	if (IS_ENABLED(CONFIG_BLOCK)) | ||||||
| 
 | 		while (sb->s_bdev && !bdev_thaw(sb->s_bdev)) | ||||||
| 	if (locked && sb->s_root) { | 			pr_warn("Emergency Thaw on %pg\n", sb->s_bdev); | ||||||
| 		if (IS_ENABLED(CONFIG_BLOCK)) | 	thaw_super_locked(sb, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 			while (sb->s_bdev && !bdev_thaw(sb->s_bdev)) | 	return; | ||||||
| 				pr_warn("Emergency Thaw on %pg\n", sb->s_bdev); |  | ||||||
| 		thaw_super_locked(sb, FREEZE_HOLDER_USERSPACE); |  | ||||||
| 		return; |  | ||||||
| 	} |  | ||||||
| 	if (locked) |  | ||||||
| 		super_unlock_excl(sb); |  | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static void do_thaw_all(struct work_struct *work) | static void do_thaw_all(struct work_struct *work) | ||||||
| { | { | ||||||
| 	__iterate_supers(do_thaw_all_callback); | 	__iterate_supers(do_thaw_all_callback, NULL, SUPER_ITER_EXCL); | ||||||
| 	kfree(work); | 	kfree(work); | ||||||
| 	printk(KERN_WARNING "Emergency Thaw complete\n"); | 	printk(KERN_WARNING "Emergency Thaw complete\n"); | ||||||
| } | } | ||||||
|  | @ -1186,6 +1176,66 @@ void emergency_thaw_all(void) | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | static inline bool get_active_super(struct super_block *sb) | ||||||
|  | { | ||||||
|  | 	bool active = false; | ||||||
|  | 
 | ||||||
|  | 	if (super_lock_excl(sb)) { | ||||||
|  | 		active = atomic_inc_not_zero(&sb->s_active); | ||||||
|  | 		super_unlock_excl(sb); | ||||||
|  | 	} | ||||||
|  | 	return active; | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | static const char *filesystems_freeze_ptr = "filesystems_freeze"; | ||||||
|  | 
 | ||||||
|  | static void filesystems_freeze_callback(struct super_block *sb, void *unused) | ||||||
|  | { | ||||||
|  | 	if (!sb->s_op->freeze_fs && !sb->s_op->freeze_super) | ||||||
|  | 		return; | ||||||
|  | 
 | ||||||
|  | 	if (!get_active_super(sb)) | ||||||
|  | 		return; | ||||||
|  | 
 | ||||||
|  | 	if (sb->s_op->freeze_super) | ||||||
|  | 		sb->s_op->freeze_super(sb, FREEZE_EXCL | FREEZE_HOLDER_KERNEL, | ||||||
|  | 				       filesystems_freeze_ptr); | ||||||
|  | 	else | ||||||
|  | 		freeze_super(sb, FREEZE_EXCL | FREEZE_HOLDER_KERNEL, | ||||||
|  | 			     filesystems_freeze_ptr); | ||||||
|  | 
 | ||||||
|  | 	deactivate_super(sb); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | void filesystems_freeze(void) | ||||||
|  | { | ||||||
|  | 	__iterate_supers(filesystems_freeze_callback, NULL, | ||||||
|  | 			 SUPER_ITER_UNLOCKED | SUPER_ITER_REVERSE); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | static void filesystems_thaw_callback(struct super_block *sb, void *unused) | ||||||
|  | { | ||||||
|  | 	if (!sb->s_op->freeze_fs && !sb->s_op->freeze_super) | ||||||
|  | 		return; | ||||||
|  | 
 | ||||||
|  | 	if (!get_active_super(sb)) | ||||||
|  | 		return; | ||||||
|  | 
 | ||||||
|  | 	if (sb->s_op->thaw_super) | ||||||
|  | 		sb->s_op->thaw_super(sb, FREEZE_EXCL | FREEZE_HOLDER_KERNEL, | ||||||
|  | 				     filesystems_freeze_ptr); | ||||||
|  | 	else | ||||||
|  | 		thaw_super(sb, FREEZE_EXCL | FREEZE_HOLDER_KERNEL, | ||||||
|  | 			   filesystems_freeze_ptr); | ||||||
|  | 
 | ||||||
|  | 	deactivate_super(sb); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | void filesystems_thaw(void) | ||||||
|  | { | ||||||
|  | 	__iterate_supers(filesystems_thaw_callback, NULL, SUPER_ITER_UNLOCKED); | ||||||
|  | } | ||||||
|  | 
 | ||||||
| static DEFINE_IDA(unnamed_dev_ida); | static DEFINE_IDA(unnamed_dev_ida); | ||||||
| 
 | 
 | ||||||
| /**
 | /**
 | ||||||
|  | @ -1479,10 +1529,10 @@ static int fs_bdev_freeze(struct block_device *bdev) | ||||||
| 
 | 
 | ||||||
| 	if (sb->s_op->freeze_super) | 	if (sb->s_op->freeze_super) | ||||||
| 		error = sb->s_op->freeze_super(sb, | 		error = sb->s_op->freeze_super(sb, | ||||||
| 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE); | 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	else | 	else | ||||||
| 		error = freeze_super(sb, | 		error = freeze_super(sb, | ||||||
| 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE); | 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	if (!error) | 	if (!error) | ||||||
| 		error = sync_blockdev(bdev); | 		error = sync_blockdev(bdev); | ||||||
| 	deactivate_super(sb); | 	deactivate_super(sb); | ||||||
|  | @ -1528,10 +1578,10 @@ static int fs_bdev_thaw(struct block_device *bdev) | ||||||
| 
 | 
 | ||||||
| 	if (sb->s_op->thaw_super) | 	if (sb->s_op->thaw_super) | ||||||
| 		error = sb->s_op->thaw_super(sb, | 		error = sb->s_op->thaw_super(sb, | ||||||
| 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE); | 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	else | 	else | ||||||
| 		error = thaw_super(sb, | 		error = thaw_super(sb, | ||||||
| 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE); | 				FREEZE_MAY_NEST | FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| 	deactivate_super(sb); | 	deactivate_super(sb); | ||||||
| 	return error; | 	return error; | ||||||
| } | } | ||||||
|  | @ -1903,7 +1953,7 @@ static int wait_for_partially_frozen(struct super_block *sb) | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| #define FREEZE_HOLDERS (FREEZE_HOLDER_KERNEL | FREEZE_HOLDER_USERSPACE) | #define FREEZE_HOLDERS (FREEZE_HOLDER_KERNEL | FREEZE_HOLDER_USERSPACE) | ||||||
| #define FREEZE_FLAGS (FREEZE_HOLDERS | FREEZE_MAY_NEST) | #define FREEZE_FLAGS (FREEZE_HOLDERS | FREEZE_MAY_NEST | FREEZE_EXCL) | ||||||
| 
 | 
 | ||||||
| static inline int freeze_inc(struct super_block *sb, enum freeze_holder who) | static inline int freeze_inc(struct super_block *sb, enum freeze_holder who) | ||||||
| { | { | ||||||
|  | @ -1929,11 +1979,34 @@ static inline int freeze_dec(struct super_block *sb, enum freeze_holder who) | ||||||
| 	return sb->s_writers.freeze_kcount + sb->s_writers.freeze_ucount; | 	return sb->s_writers.freeze_kcount + sb->s_writers.freeze_ucount; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static inline bool may_freeze(struct super_block *sb, enum freeze_holder who) | static inline bool may_freeze(struct super_block *sb, enum freeze_holder who, | ||||||
|  | 			      const void *freeze_owner) | ||||||
| { | { | ||||||
|  | 	lockdep_assert_held(&sb->s_umount); | ||||||
|  | 
 | ||||||
| 	WARN_ON_ONCE((who & ~FREEZE_FLAGS)); | 	WARN_ON_ONCE((who & ~FREEZE_FLAGS)); | ||||||
| 	WARN_ON_ONCE(hweight32(who & FREEZE_HOLDERS) > 1); | 	WARN_ON_ONCE(hweight32(who & FREEZE_HOLDERS) > 1); | ||||||
| 
 | 
 | ||||||
|  | 	if (who & FREEZE_EXCL) { | ||||||
|  | 		if (WARN_ON_ONCE(!(who & FREEZE_HOLDER_KERNEL))) | ||||||
|  | 			return false; | ||||||
|  | 		if (WARN_ON_ONCE(who & ~(FREEZE_EXCL | FREEZE_HOLDER_KERNEL))) | ||||||
|  | 			return false; | ||||||
|  | 		if (WARN_ON_ONCE(!freeze_owner)) | ||||||
|  | 			return false; | ||||||
|  | 		/* This freeze already has a specific owner. */ | ||||||
|  | 		if (sb->s_writers.freeze_owner) | ||||||
|  | 			return false; | ||||||
|  | 		/*
 | ||||||
|  | 		 * This is already frozen multiple times so we're just | ||||||
|  | 		 * going to take a reference count and mark the freeze as | ||||||
|  | 		 * being owned by the caller. | ||||||
|  | 		 */ | ||||||
|  | 		if (sb->s_writers.freeze_kcount + sb->s_writers.freeze_ucount) | ||||||
|  | 			sb->s_writers.freeze_owner = freeze_owner; | ||||||
|  | 		return true; | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
| 	if (who & FREEZE_HOLDER_KERNEL) | 	if (who & FREEZE_HOLDER_KERNEL) | ||||||
| 		return (who & FREEZE_MAY_NEST) || | 		return (who & FREEZE_MAY_NEST) || | ||||||
| 		       sb->s_writers.freeze_kcount == 0; | 		       sb->s_writers.freeze_kcount == 0; | ||||||
|  | @ -1943,10 +2016,61 @@ static inline bool may_freeze(struct super_block *sb, enum freeze_holder who) | ||||||
| 	return false; | 	return false; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | static inline bool may_unfreeze(struct super_block *sb, enum freeze_holder who, | ||||||
|  | 				const void *freeze_owner) | ||||||
|  | { | ||||||
|  | 	lockdep_assert_held(&sb->s_umount); | ||||||
|  | 
 | ||||||
|  | 	WARN_ON_ONCE((who & ~FREEZE_FLAGS)); | ||||||
|  | 	WARN_ON_ONCE(hweight32(who & FREEZE_HOLDERS) > 1); | ||||||
|  | 
 | ||||||
|  | 	if (who & FREEZE_EXCL) { | ||||||
|  | 		if (WARN_ON_ONCE(!(who & FREEZE_HOLDER_KERNEL))) | ||||||
|  | 			return false; | ||||||
|  | 		if (WARN_ON_ONCE(who & ~(FREEZE_EXCL | FREEZE_HOLDER_KERNEL))) | ||||||
|  | 			return false; | ||||||
|  | 		if (WARN_ON_ONCE(!freeze_owner)) | ||||||
|  | 			return false; | ||||||
|  | 		if (WARN_ON_ONCE(sb->s_writers.freeze_kcount == 0)) | ||||||
|  | 			return false; | ||||||
|  | 		/* This isn't exclusively frozen. */ | ||||||
|  | 		if (!sb->s_writers.freeze_owner) | ||||||
|  | 			return false; | ||||||
|  | 		/* This isn't exclusively frozen by us. */ | ||||||
|  | 		if (sb->s_writers.freeze_owner != freeze_owner) | ||||||
|  | 			return false; | ||||||
|  | 		/*
 | ||||||
|  | 		 * This is still frozen multiple times so we're just | ||||||
|  | 		 * going to drop our reference count and undo our | ||||||
|  | 		 * exclusive freeze. | ||||||
|  | 		 */ | ||||||
|  | 		if ((sb->s_writers.freeze_kcount + sb->s_writers.freeze_ucount) > 1) | ||||||
|  | 			sb->s_writers.freeze_owner = NULL; | ||||||
|  | 		return true; | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	if (who & FREEZE_HOLDER_KERNEL) { | ||||||
|  | 		/*
 | ||||||
|  | 		 * Someone's trying to steal the reference belonging to | ||||||
|  | 		 * @sb->s_writers.freeze_owner. | ||||||
|  | 		 */ | ||||||
|  | 		if (sb->s_writers.freeze_kcount == 1 && | ||||||
|  | 		    sb->s_writers.freeze_owner) | ||||||
|  | 			return false; | ||||||
|  | 		return sb->s_writers.freeze_kcount > 0; | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	if (who & FREEZE_HOLDER_USERSPACE) | ||||||
|  | 		return sb->s_writers.freeze_ucount > 0; | ||||||
|  | 
 | ||||||
|  | 	return false; | ||||||
|  | } | ||||||
|  | 
 | ||||||
| /**
 | /**
 | ||||||
|  * freeze_super - lock the filesystem and force it into a consistent state |  * freeze_super - lock the filesystem and force it into a consistent state | ||||||
|  * @sb: the super to lock |  * @sb: the super to lock | ||||||
|  * @who: context that wants to freeze |  * @who: context that wants to freeze | ||||||
|  |  * @freeze_owner: owner of the freeze | ||||||
|  * |  * | ||||||
|  * Syncs the super to make sure the filesystem is consistent and calls the fs's |  * Syncs the super to make sure the filesystem is consistent and calls the fs's | ||||||
|  * freeze_fs.  Subsequent calls to this without first thawing the fs may return |  * freeze_fs.  Subsequent calls to this without first thawing the fs may return | ||||||
|  | @ -1998,7 +2122,7 @@ static inline bool may_freeze(struct super_block *sb, enum freeze_holder who) | ||||||
|  * Return: If the freeze was successful zero is returned. If the freeze |  * Return: If the freeze was successful zero is returned. If the freeze | ||||||
|  *         failed a negative error code is returned. |  *         failed a negative error code is returned. | ||||||
|  */ |  */ | ||||||
| int freeze_super(struct super_block *sb, enum freeze_holder who) | int freeze_super(struct super_block *sb, enum freeze_holder who, const void *freeze_owner) | ||||||
| { | { | ||||||
| 	int ret; | 	int ret; | ||||||
| 
 | 
 | ||||||
|  | @ -2010,7 +2134,7 @@ int freeze_super(struct super_block *sb, enum freeze_holder who) | ||||||
| 
 | 
 | ||||||
| retry: | retry: | ||||||
| 	if (sb->s_writers.frozen == SB_FREEZE_COMPLETE) { | 	if (sb->s_writers.frozen == SB_FREEZE_COMPLETE) { | ||||||
| 		if (may_freeze(sb, who)) | 		if (may_freeze(sb, who, freeze_owner)) | ||||||
| 			ret = !!WARN_ON_ONCE(freeze_inc(sb, who) == 1); | 			ret = !!WARN_ON_ONCE(freeze_inc(sb, who) == 1); | ||||||
| 		else | 		else | ||||||
| 			ret = -EBUSY; | 			ret = -EBUSY; | ||||||
|  | @ -2032,6 +2156,7 @@ retry: | ||||||
| 	if (sb_rdonly(sb)) { | 	if (sb_rdonly(sb)) { | ||||||
| 		/* Nothing to do really... */ | 		/* Nothing to do really... */ | ||||||
| 		WARN_ON_ONCE(freeze_inc(sb, who) > 1); | 		WARN_ON_ONCE(freeze_inc(sb, who) > 1); | ||||||
|  | 		sb->s_writers.freeze_owner = freeze_owner; | ||||||
| 		sb->s_writers.frozen = SB_FREEZE_COMPLETE; | 		sb->s_writers.frozen = SB_FREEZE_COMPLETE; | ||||||
| 		wake_up_var(&sb->s_writers.frozen); | 		wake_up_var(&sb->s_writers.frozen); | ||||||
| 		super_unlock_excl(sb); | 		super_unlock_excl(sb); | ||||||
|  | @ -2079,6 +2204,7 @@ retry: | ||||||
| 	 * when frozen is set to SB_FREEZE_COMPLETE, and for thaw_super(). | 	 * when frozen is set to SB_FREEZE_COMPLETE, and for thaw_super(). | ||||||
| 	 */ | 	 */ | ||||||
| 	WARN_ON_ONCE(freeze_inc(sb, who) > 1); | 	WARN_ON_ONCE(freeze_inc(sb, who) > 1); | ||||||
|  | 	sb->s_writers.freeze_owner = freeze_owner; | ||||||
| 	sb->s_writers.frozen = SB_FREEZE_COMPLETE; | 	sb->s_writers.frozen = SB_FREEZE_COMPLETE; | ||||||
| 	wake_up_var(&sb->s_writers.frozen); | 	wake_up_var(&sb->s_writers.frozen); | ||||||
| 	lockdep_sb_freeze_release(sb); | 	lockdep_sb_freeze_release(sb); | ||||||
|  | @ -2093,13 +2219,17 @@ EXPORT_SYMBOL(freeze_super); | ||||||
|  * removes that state without releasing the other state or unlocking the |  * removes that state without releasing the other state or unlocking the | ||||||
|  * filesystem. |  * filesystem. | ||||||
|  */ |  */ | ||||||
| static int thaw_super_locked(struct super_block *sb, enum freeze_holder who) | static int thaw_super_locked(struct super_block *sb, enum freeze_holder who, | ||||||
|  | 			     const void *freeze_owner) | ||||||
| { | { | ||||||
| 	int error = -EINVAL; | 	int error = -EINVAL; | ||||||
| 
 | 
 | ||||||
| 	if (sb->s_writers.frozen != SB_FREEZE_COMPLETE) | 	if (sb->s_writers.frozen != SB_FREEZE_COMPLETE) | ||||||
| 		goto out_unlock; | 		goto out_unlock; | ||||||
| 
 | 
 | ||||||
|  | 	if (!may_unfreeze(sb, who, freeze_owner)) | ||||||
|  | 		goto out_unlock; | ||||||
|  | 
 | ||||||
| 	/*
 | 	/*
 | ||||||
| 	 * All freezers share a single active reference. | 	 * All freezers share a single active reference. | ||||||
| 	 * So just unlock in case there are any left. | 	 * So just unlock in case there are any left. | ||||||
|  | @ -2109,6 +2239,7 @@ static int thaw_super_locked(struct super_block *sb, enum freeze_holder who) | ||||||
| 
 | 
 | ||||||
| 	if (sb_rdonly(sb)) { | 	if (sb_rdonly(sb)) { | ||||||
| 		sb->s_writers.frozen = SB_UNFROZEN; | 		sb->s_writers.frozen = SB_UNFROZEN; | ||||||
|  | 		sb->s_writers.freeze_owner = NULL; | ||||||
| 		wake_up_var(&sb->s_writers.frozen); | 		wake_up_var(&sb->s_writers.frozen); | ||||||
| 		goto out_deactivate; | 		goto out_deactivate; | ||||||
| 	} | 	} | ||||||
|  | @ -2126,6 +2257,7 @@ static int thaw_super_locked(struct super_block *sb, enum freeze_holder who) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	sb->s_writers.frozen = SB_UNFROZEN; | 	sb->s_writers.frozen = SB_UNFROZEN; | ||||||
|  | 	sb->s_writers.freeze_owner = NULL; | ||||||
| 	wake_up_var(&sb->s_writers.frozen); | 	wake_up_var(&sb->s_writers.frozen); | ||||||
| 	sb_freeze_unlock(sb, SB_FREEZE_FS); | 	sb_freeze_unlock(sb, SB_FREEZE_FS); | ||||||
| out_deactivate: | out_deactivate: | ||||||
|  | @ -2141,6 +2273,7 @@ out_unlock: | ||||||
|  * thaw_super -- unlock filesystem |  * thaw_super -- unlock filesystem | ||||||
|  * @sb: the super to thaw |  * @sb: the super to thaw | ||||||
|  * @who: context that wants to freeze |  * @who: context that wants to freeze | ||||||
|  |  * @freeze_owner: owner of the freeze | ||||||
|  * |  * | ||||||
|  * Unlocks the filesystem and marks it writeable again after freeze_super() |  * Unlocks the filesystem and marks it writeable again after freeze_super() | ||||||
|  * if there are no remaining freezes on the filesystem. |  * if there are no remaining freezes on the filesystem. | ||||||
|  | @ -2154,13 +2287,14 @@ out_unlock: | ||||||
|  * have been frozen through the block layer via multiple block devices. |  * have been frozen through the block layer via multiple block devices. | ||||||
|  * The filesystem remains frozen until all block devices are unfrozen. |  * The filesystem remains frozen until all block devices are unfrozen. | ||||||
|  */ |  */ | ||||||
| int thaw_super(struct super_block *sb, enum freeze_holder who) | int thaw_super(struct super_block *sb, enum freeze_holder who, | ||||||
|  | 	       const void *freeze_owner) | ||||||
| { | { | ||||||
| 	if (!super_lock_excl(sb)) { | 	if (!super_lock_excl(sb)) { | ||||||
| 		WARN_ON_ONCE("Dying superblock while thawing!"); | 		WARN_ON_ONCE("Dying superblock while thawing!"); | ||||||
| 		return -EINVAL; | 		return -EINVAL; | ||||||
| 	} | 	} | ||||||
| 	return thaw_super_locked(sb, who); | 	return thaw_super_locked(sb, who, freeze_owner); | ||||||
| } | } | ||||||
| EXPORT_SYMBOL(thaw_super); | EXPORT_SYMBOL(thaw_super); | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -123,7 +123,7 @@ xchk_fsfreeze( | ||||||
| { | { | ||||||
| 	int			error; | 	int			error; | ||||||
| 
 | 
 | ||||||
| 	error = freeze_super(sc->mp->m_super, FREEZE_HOLDER_KERNEL); | 	error = freeze_super(sc->mp->m_super, FREEZE_HOLDER_KERNEL, NULL); | ||||||
| 	trace_xchk_fsfreeze(sc, error); | 	trace_xchk_fsfreeze(sc, error); | ||||||
| 	return error; | 	return error; | ||||||
| } | } | ||||||
|  | @ -135,7 +135,7 @@ xchk_fsthaw( | ||||||
| 	int			error; | 	int			error; | ||||||
| 
 | 
 | ||||||
| 	/* This should always succeed, we have a kernel freeze */ | 	/* This should always succeed, we have a kernel freeze */ | ||||||
| 	error = thaw_super(sc->mp->m_super, FREEZE_HOLDER_KERNEL); | 	error = thaw_super(sc->mp->m_super, FREEZE_HOLDER_KERNEL, NULL); | ||||||
| 	trace_xchk_fsthaw(sc, error); | 	trace_xchk_fsthaw(sc, error); | ||||||
| 	return error; | 	return error; | ||||||
| } | } | ||||||
|  |  | ||||||
|  | @ -127,7 +127,7 @@ xfs_dax_notify_failure_freeze( | ||||||
| 	struct super_block	*sb = mp->m_super; | 	struct super_block	*sb = mp->m_super; | ||||||
| 	int			error; | 	int			error; | ||||||
| 
 | 
 | ||||||
| 	error = freeze_super(sb, FREEZE_HOLDER_KERNEL); | 	error = freeze_super(sb, FREEZE_HOLDER_KERNEL, NULL); | ||||||
| 	if (error) | 	if (error) | ||||||
| 		xfs_emerg(mp, "already frozen by kernel, err=%d", error); | 		xfs_emerg(mp, "already frozen by kernel, err=%d", error); | ||||||
| 
 | 
 | ||||||
|  | @ -143,7 +143,7 @@ xfs_dax_notify_failure_thaw( | ||||||
| 	int			error; | 	int			error; | ||||||
| 
 | 
 | ||||||
| 	if (kernel_frozen) { | 	if (kernel_frozen) { | ||||||
| 		error = thaw_super(sb, FREEZE_HOLDER_KERNEL); | 		error = thaw_super(sb, FREEZE_HOLDER_KERNEL, NULL); | ||||||
| 		if (error) | 		if (error) | ||||||
| 			xfs_emerg(mp, "still frozen after notify failure, err=%d", | 			xfs_emerg(mp, "still frozen after notify failure, err=%d", | ||||||
| 				error); | 				error); | ||||||
|  | @ -153,7 +153,7 @@ xfs_dax_notify_failure_thaw( | ||||||
| 	 * Also thaw userspace call anyway because the device is about to be | 	 * Also thaw userspace call anyway because the device is about to be | ||||||
| 	 * removed immediately. | 	 * removed immediately. | ||||||
| 	 */ | 	 */ | ||||||
| 	thaw_super(sb, FREEZE_HOLDER_USERSPACE); | 	thaw_super(sb, FREEZE_HOLDER_USERSPACE, NULL); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static int | static int | ||||||
|  |  | ||||||
|  | @ -1316,6 +1316,7 @@ struct sb_writers { | ||||||
| 	unsigned short			frozen;		/* Is sb frozen? */ | 	unsigned short			frozen;		/* Is sb frozen? */ | ||||||
| 	int				freeze_kcount;	/* How many kernel freeze requests? */ | 	int				freeze_kcount;	/* How many kernel freeze requests? */ | ||||||
| 	int				freeze_ucount;	/* How many userspace freeze requests? */ | 	int				freeze_ucount;	/* How many userspace freeze requests? */ | ||||||
|  | 	const void			*freeze_owner;	/* Owner of the freeze */ | ||||||
| 	struct percpu_rw_semaphore	rw_sem[SB_FREEZE_LEVELS]; | 	struct percpu_rw_semaphore	rw_sem[SB_FREEZE_LEVELS]; | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
|  | @ -1789,7 +1790,7 @@ static inline void __sb_end_write(struct super_block *sb, int level) | ||||||
| 
 | 
 | ||||||
| static inline void __sb_start_write(struct super_block *sb, int level) | static inline void __sb_start_write(struct super_block *sb, int level) | ||||||
| { | { | ||||||
| 	percpu_down_read(sb->s_writers.rw_sem + level - 1); | 	percpu_down_read_freezable(sb->s_writers.rw_sem + level - 1, true); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static inline bool __sb_start_write_trylock(struct super_block *sb, int level) | static inline bool __sb_start_write_trylock(struct super_block *sb, int level) | ||||||
|  | @ -2288,6 +2289,7 @@ extern loff_t vfs_dedupe_file_range_one(struct file *src_file, loff_t src_pos, | ||||||
|  * @FREEZE_HOLDER_KERNEL: kernel wants to freeze or thaw filesystem |  * @FREEZE_HOLDER_KERNEL: kernel wants to freeze or thaw filesystem | ||||||
|  * @FREEZE_HOLDER_USERSPACE: userspace wants to freeze or thaw filesystem |  * @FREEZE_HOLDER_USERSPACE: userspace wants to freeze or thaw filesystem | ||||||
|  * @FREEZE_MAY_NEST: whether nesting freeze and thaw requests is allowed |  * @FREEZE_MAY_NEST: whether nesting freeze and thaw requests is allowed | ||||||
|  |  * @FREEZE_EXCL: a freeze that can only be undone by the owner | ||||||
|  * |  * | ||||||
|  * Indicate who the owner of the freeze or thaw request is and whether |  * Indicate who the owner of the freeze or thaw request is and whether | ||||||
|  * the freeze needs to be exclusive or can nest. |  * the freeze needs to be exclusive or can nest. | ||||||
|  | @ -2301,6 +2303,7 @@ enum freeze_holder { | ||||||
| 	FREEZE_HOLDER_KERNEL	= (1U << 0), | 	FREEZE_HOLDER_KERNEL	= (1U << 0), | ||||||
| 	FREEZE_HOLDER_USERSPACE	= (1U << 1), | 	FREEZE_HOLDER_USERSPACE	= (1U << 1), | ||||||
| 	FREEZE_MAY_NEST		= (1U << 2), | 	FREEZE_MAY_NEST		= (1U << 2), | ||||||
|  | 	FREEZE_EXCL		= (1U << 3), | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| struct super_operations { | struct super_operations { | ||||||
|  | @ -2314,9 +2317,9 @@ struct super_operations { | ||||||
| 	void (*evict_inode) (struct inode *); | 	void (*evict_inode) (struct inode *); | ||||||
| 	void (*put_super) (struct super_block *); | 	void (*put_super) (struct super_block *); | ||||||
| 	int (*sync_fs)(struct super_block *sb, int wait); | 	int (*sync_fs)(struct super_block *sb, int wait); | ||||||
| 	int (*freeze_super) (struct super_block *, enum freeze_holder who); | 	int (*freeze_super) (struct super_block *, enum freeze_holder who, const void *owner); | ||||||
| 	int (*freeze_fs) (struct super_block *); | 	int (*freeze_fs) (struct super_block *); | ||||||
| 	int (*thaw_super) (struct super_block *, enum freeze_holder who); | 	int (*thaw_super) (struct super_block *, enum freeze_holder who, const void *owner); | ||||||
| 	int (*unfreeze_fs) (struct super_block *); | 	int (*unfreeze_fs) (struct super_block *); | ||||||
| 	int (*statfs) (struct dentry *, struct kstatfs *); | 	int (*statfs) (struct dentry *, struct kstatfs *); | ||||||
| 	int (*remount_fs) (struct super_block *, int *, char *); | 	int (*remount_fs) (struct super_block *, int *, char *); | ||||||
|  | @ -2726,8 +2729,10 @@ extern int unregister_filesystem(struct file_system_type *); | ||||||
| extern int vfs_statfs(const struct path *, struct kstatfs *); | extern int vfs_statfs(const struct path *, struct kstatfs *); | ||||||
| extern int user_statfs(const char __user *, struct kstatfs *); | extern int user_statfs(const char __user *, struct kstatfs *); | ||||||
| extern int fd_statfs(int, struct kstatfs *); | extern int fd_statfs(int, struct kstatfs *); | ||||||
| int freeze_super(struct super_block *super, enum freeze_holder who); | int freeze_super(struct super_block *super, enum freeze_holder who, | ||||||
| int thaw_super(struct super_block *super, enum freeze_holder who); | 		 const void *freeze_owner); | ||||||
|  | int thaw_super(struct super_block *super, enum freeze_holder who, | ||||||
|  | 	       const void *freeze_owner); | ||||||
| extern __printf(2, 3) | extern __printf(2, 3) | ||||||
| int super_setup_bdi_name(struct super_block *sb, char *fmt, ...); | int super_setup_bdi_name(struct super_block *sb, char *fmt, ...); | ||||||
| extern int super_setup_bdi(struct super_block *sb); | extern int super_setup_bdi(struct super_block *sb); | ||||||
|  | @ -3536,9 +3541,11 @@ extern void put_filesystem(struct file_system_type *fs); | ||||||
| extern struct file_system_type *get_fs_type(const char *name); | extern struct file_system_type *get_fs_type(const char *name); | ||||||
| extern void drop_super(struct super_block *sb); | extern void drop_super(struct super_block *sb); | ||||||
| extern void drop_super_exclusive(struct super_block *sb); | extern void drop_super_exclusive(struct super_block *sb); | ||||||
| extern void iterate_supers(void (*)(struct super_block *, void *), void *); | extern void iterate_supers(void (*f)(struct super_block *, void *), void *arg); | ||||||
| extern void iterate_supers_type(struct file_system_type *, | extern void iterate_supers_type(struct file_system_type *, | ||||||
| 			        void (*)(struct super_block *, void *), void *); | 			        void (*)(struct super_block *, void *), void *); | ||||||
|  | void filesystems_freeze(void); | ||||||
|  | void filesystems_thaw(void); | ||||||
| 
 | 
 | ||||||
| extern int dcache_dir_open(struct inode *, struct file *); | extern int dcache_dir_open(struct inode *, struct file *); | ||||||
| extern int dcache_dir_close(struct inode *, struct file *); | extern int dcache_dir_close(struct inode *, struct file *); | ||||||
|  |  | ||||||
|  | @ -43,9 +43,10 @@ is_static struct percpu_rw_semaphore name = {				\ | ||||||
| #define DEFINE_STATIC_PERCPU_RWSEM(name)	\ | #define DEFINE_STATIC_PERCPU_RWSEM(name)	\ | ||||||
| 	__DEFINE_PERCPU_RWSEM(name, static) | 	__DEFINE_PERCPU_RWSEM(name, static) | ||||||
| 
 | 
 | ||||||
| extern bool __percpu_down_read(struct percpu_rw_semaphore *, bool); | extern bool __percpu_down_read(struct percpu_rw_semaphore *, bool, bool); | ||||||
| 
 | 
 | ||||||
| static inline void percpu_down_read(struct percpu_rw_semaphore *sem) | static inline void percpu_down_read_internal(struct percpu_rw_semaphore *sem, | ||||||
|  | 					     bool freezable) | ||||||
| { | { | ||||||
| 	might_sleep(); | 	might_sleep(); | ||||||
| 
 | 
 | ||||||
|  | @ -63,7 +64,7 @@ static inline void percpu_down_read(struct percpu_rw_semaphore *sem) | ||||||
| 	if (likely(rcu_sync_is_idle(&sem->rss))) | 	if (likely(rcu_sync_is_idle(&sem->rss))) | ||||||
| 		this_cpu_inc(*sem->read_count); | 		this_cpu_inc(*sem->read_count); | ||||||
| 	else | 	else | ||||||
| 		__percpu_down_read(sem, false); /* Unconditional memory barrier */ | 		__percpu_down_read(sem, false, freezable); /* Unconditional memory barrier */ | ||||||
| 	/*
 | 	/*
 | ||||||
| 	 * The preempt_enable() prevents the compiler from | 	 * The preempt_enable() prevents the compiler from | ||||||
| 	 * bleeding the critical section out. | 	 * bleeding the critical section out. | ||||||
|  | @ -71,6 +72,17 @@ static inline void percpu_down_read(struct percpu_rw_semaphore *sem) | ||||||
| 	preempt_enable(); | 	preempt_enable(); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | static inline void percpu_down_read(struct percpu_rw_semaphore *sem) | ||||||
|  | { | ||||||
|  | 	percpu_down_read_internal(sem, false); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | static inline void percpu_down_read_freezable(struct percpu_rw_semaphore *sem, | ||||||
|  | 					      bool freeze) | ||||||
|  | { | ||||||
|  | 	percpu_down_read_internal(sem, freeze); | ||||||
|  | } | ||||||
|  | 
 | ||||||
| static inline bool percpu_down_read_trylock(struct percpu_rw_semaphore *sem) | static inline bool percpu_down_read_trylock(struct percpu_rw_semaphore *sem) | ||||||
| { | { | ||||||
| 	bool ret = true; | 	bool ret = true; | ||||||
|  | @ -82,7 +94,7 @@ static inline bool percpu_down_read_trylock(struct percpu_rw_semaphore *sem) | ||||||
| 	if (likely(rcu_sync_is_idle(&sem->rss))) | 	if (likely(rcu_sync_is_idle(&sem->rss))) | ||||||
| 		this_cpu_inc(*sem->read_count); | 		this_cpu_inc(*sem->read_count); | ||||||
| 	else | 	else | ||||||
| 		ret = __percpu_down_read(sem, true); /* Unconditional memory barrier */ | 		ret = __percpu_down_read(sem, true, false); /* Unconditional memory barrier */ | ||||||
| 	preempt_enable(); | 	preempt_enable(); | ||||||
| 	/*
 | 	/*
 | ||||||
| 	 * The barrier() from preempt_enable() prevents the compiler from | 	 * The barrier() from preempt_enable() prevents the compiler from | ||||||
|  |  | ||||||
|  | @ -138,7 +138,8 @@ static int percpu_rwsem_wake_function(struct wait_queue_entry *wq_entry, | ||||||
| 	return !reader; /* wake (readers until) 1 writer */ | 	return !reader; /* wake (readers until) 1 writer */ | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| static void percpu_rwsem_wait(struct percpu_rw_semaphore *sem, bool reader) | static void percpu_rwsem_wait(struct percpu_rw_semaphore *sem, bool reader, | ||||||
|  | 			      bool freeze) | ||||||
| { | { | ||||||
| 	DEFINE_WAIT_FUNC(wq_entry, percpu_rwsem_wake_function); | 	DEFINE_WAIT_FUNC(wq_entry, percpu_rwsem_wake_function); | ||||||
| 	bool wait; | 	bool wait; | ||||||
|  | @ -156,7 +157,8 @@ static void percpu_rwsem_wait(struct percpu_rw_semaphore *sem, bool reader) | ||||||
| 	spin_unlock_irq(&sem->waiters.lock); | 	spin_unlock_irq(&sem->waiters.lock); | ||||||
| 
 | 
 | ||||||
| 	while (wait) { | 	while (wait) { | ||||||
| 		set_current_state(TASK_UNINTERRUPTIBLE); | 		set_current_state(TASK_UNINTERRUPTIBLE | | ||||||
|  | 				  (freeze ? TASK_FREEZABLE : 0)); | ||||||
| 		if (!smp_load_acquire(&wq_entry.private)) | 		if (!smp_load_acquire(&wq_entry.private)) | ||||||
| 			break; | 			break; | ||||||
| 		schedule(); | 		schedule(); | ||||||
|  | @ -164,7 +166,8 @@ static void percpu_rwsem_wait(struct percpu_rw_semaphore *sem, bool reader) | ||||||
| 	__set_current_state(TASK_RUNNING); | 	__set_current_state(TASK_RUNNING); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| bool __sched __percpu_down_read(struct percpu_rw_semaphore *sem, bool try) | bool __sched __percpu_down_read(struct percpu_rw_semaphore *sem, bool try, | ||||||
|  | 				bool freeze) | ||||||
| { | { | ||||||
| 	if (__percpu_down_read_trylock(sem)) | 	if (__percpu_down_read_trylock(sem)) | ||||||
| 		return true; | 		return true; | ||||||
|  | @ -174,7 +177,7 @@ bool __sched __percpu_down_read(struct percpu_rw_semaphore *sem, bool try) | ||||||
| 
 | 
 | ||||||
| 	trace_contention_begin(sem, LCB_F_PERCPU | LCB_F_READ); | 	trace_contention_begin(sem, LCB_F_PERCPU | LCB_F_READ); | ||||||
| 	preempt_enable(); | 	preempt_enable(); | ||||||
| 	percpu_rwsem_wait(sem, /* .reader = */ true); | 	percpu_rwsem_wait(sem, /* .reader = */ true, freeze); | ||||||
| 	preempt_disable(); | 	preempt_disable(); | ||||||
| 	trace_contention_end(sem, 0); | 	trace_contention_end(sem, 0); | ||||||
| 
 | 
 | ||||||
|  | @ -237,7 +240,7 @@ void __sched percpu_down_write(struct percpu_rw_semaphore *sem) | ||||||
| 	 */ | 	 */ | ||||||
| 	if (!__percpu_down_write_trylock(sem)) { | 	if (!__percpu_down_write_trylock(sem)) { | ||||||
| 		trace_contention_begin(sem, LCB_F_PERCPU | LCB_F_WRITE); | 		trace_contention_begin(sem, LCB_F_PERCPU | LCB_F_WRITE); | ||||||
| 		percpu_rwsem_wait(sem, /* .reader = */ false); | 		percpu_rwsem_wait(sem, /* .reader = */ false, false); | ||||||
| 		contended = true; | 		contended = true; | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -778,6 +778,8 @@ int hibernate(void) | ||||||
| 		goto Restore; | 		goto Restore; | ||||||
| 
 | 
 | ||||||
| 	ksys_sync_helper(); | 	ksys_sync_helper(); | ||||||
|  | 	if (filesystem_freeze_enabled) | ||||||
|  | 		filesystems_freeze(); | ||||||
| 
 | 
 | ||||||
| 	error = freeze_processes(); | 	error = freeze_processes(); | ||||||
| 	if (error) | 	if (error) | ||||||
|  | @ -846,6 +848,7 @@ int hibernate(void) | ||||||
| 	/* Don't bother checking whether freezer_test_done is true */ | 	/* Don't bother checking whether freezer_test_done is true */ | ||||||
| 	freezer_test_done = false; | 	freezer_test_done = false; | ||||||
|  Exit: |  Exit: | ||||||
|  | 	filesystems_thaw(); | ||||||
| 	pm_notifier_call_chain(PM_POST_HIBERNATION); | 	pm_notifier_call_chain(PM_POST_HIBERNATION); | ||||||
|  Restore: |  Restore: | ||||||
| 	pm_restore_console(); | 	pm_restore_console(); | ||||||
|  | @ -882,6 +885,9 @@ int hibernate_quiet_exec(int (*func)(void *data), void *data) | ||||||
| 	if (error) | 	if (error) | ||||||
| 		goto restore; | 		goto restore; | ||||||
| 
 | 
 | ||||||
|  | 	if (filesystem_freeze_enabled) | ||||||
|  | 		filesystems_freeze(); | ||||||
|  | 
 | ||||||
| 	error = freeze_processes(); | 	error = freeze_processes(); | ||||||
| 	if (error) | 	if (error) | ||||||
| 		goto exit; | 		goto exit; | ||||||
|  | @ -941,6 +947,7 @@ thaw: | ||||||
| 	thaw_processes(); | 	thaw_processes(); | ||||||
| 
 | 
 | ||||||
| exit: | exit: | ||||||
|  | 	filesystems_thaw(); | ||||||
| 	pm_notifier_call_chain(PM_POST_HIBERNATION); | 	pm_notifier_call_chain(PM_POST_HIBERNATION); | ||||||
| 
 | 
 | ||||||
| restore: | restore: | ||||||
|  | @ -1029,19 +1036,26 @@ static int software_resume(void) | ||||||
| 	if (error) | 	if (error) | ||||||
| 		goto Restore; | 		goto Restore; | ||||||
| 
 | 
 | ||||||
|  | 	if (filesystem_freeze_enabled) | ||||||
|  | 		filesystems_freeze(); | ||||||
|  | 
 | ||||||
| 	pm_pr_dbg("Preparing processes for hibernation restore.\n"); | 	pm_pr_dbg("Preparing processes for hibernation restore.\n"); | ||||||
| 	error = freeze_processes(); | 	error = freeze_processes(); | ||||||
| 	if (error) | 	if (error) { | ||||||
|  | 		filesystems_thaw(); | ||||||
| 		goto Close_Finish; | 		goto Close_Finish; | ||||||
|  | 	} | ||||||
| 
 | 
 | ||||||
| 	error = freeze_kernel_threads(); | 	error = freeze_kernel_threads(); | ||||||
| 	if (error) { | 	if (error) { | ||||||
| 		thaw_processes(); | 		thaw_processes(); | ||||||
|  | 		filesystems_thaw(); | ||||||
| 		goto Close_Finish; | 		goto Close_Finish; | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	error = load_image_and_restore(); | 	error = load_image_and_restore(); | ||||||
| 	thaw_processes(); | 	thaw_processes(); | ||||||
|  | 	filesystems_thaw(); | ||||||
|  Finish: |  Finish: | ||||||
| 	pm_notifier_call_chain(PM_POST_RESTORE); | 	pm_notifier_call_chain(PM_POST_RESTORE); | ||||||
|  Restore: |  Restore: | ||||||
|  |  | ||||||
|  | @ -962,6 +962,34 @@ power_attr(pm_freeze_timeout); | ||||||
| 
 | 
 | ||||||
| #endif	/* CONFIG_FREEZER*/ | #endif	/* CONFIG_FREEZER*/ | ||||||
| 
 | 
 | ||||||
|  | #if defined(CONFIG_SUSPEND) || defined(CONFIG_HIBERNATION) | ||||||
|  | bool filesystem_freeze_enabled = false; | ||||||
|  | 
 | ||||||
|  | static ssize_t freeze_filesystems_show(struct kobject *kobj, | ||||||
|  | 				       struct kobj_attribute *attr, char *buf) | ||||||
|  | { | ||||||
|  | 	return sysfs_emit(buf, "%d\n", filesystem_freeze_enabled); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | static ssize_t freeze_filesystems_store(struct kobject *kobj, | ||||||
|  | 					struct kobj_attribute *attr, | ||||||
|  | 					const char *buf, size_t n) | ||||||
|  | { | ||||||
|  | 	unsigned long val; | ||||||
|  | 
 | ||||||
|  | 	if (kstrtoul(buf, 10, &val)) | ||||||
|  | 		return -EINVAL; | ||||||
|  | 
 | ||||||
|  | 	if (val > 1) | ||||||
|  | 		return -EINVAL; | ||||||
|  | 
 | ||||||
|  | 	filesystem_freeze_enabled = !!val; | ||||||
|  | 	return n; | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | power_attr(freeze_filesystems); | ||||||
|  | #endif /* CONFIG_SUSPEND || CONFIG_HIBERNATION */ | ||||||
|  | 
 | ||||||
| static struct attribute * g[] = { | static struct attribute * g[] = { | ||||||
| 	&state_attr.attr, | 	&state_attr.attr, | ||||||
| #ifdef CONFIG_PM_TRACE | #ifdef CONFIG_PM_TRACE | ||||||
|  | @ -991,6 +1019,9 @@ static struct attribute * g[] = { | ||||||
| #endif | #endif | ||||||
| #ifdef CONFIG_FREEZER | #ifdef CONFIG_FREEZER | ||||||
| 	&pm_freeze_timeout_attr.attr, | 	&pm_freeze_timeout_attr.attr, | ||||||
|  | #endif | ||||||
|  | #if defined(CONFIG_SUSPEND) || defined(CONFIG_HIBERNATION) | ||||||
|  | 	&freeze_filesystems_attr.attr, | ||||||
| #endif | #endif | ||||||
| 	NULL, | 	NULL, | ||||||
| }; | }; | ||||||
|  |  | ||||||
|  | @ -18,6 +18,10 @@ struct swsusp_info { | ||||||
| 	unsigned long		size; | 	unsigned long		size; | ||||||
| } __aligned(PAGE_SIZE); | } __aligned(PAGE_SIZE); | ||||||
| 
 | 
 | ||||||
|  | #if defined(CONFIG_SUSPEND) || defined(CONFIG_HIBERNATION) | ||||||
|  | extern bool filesystem_freeze_enabled; | ||||||
|  | #endif | ||||||
|  | 
 | ||||||
| #ifdef CONFIG_HIBERNATION | #ifdef CONFIG_HIBERNATION | ||||||
| /* kernel/power/snapshot.c */ | /* kernel/power/snapshot.c */ | ||||||
| extern void __init hibernate_reserved_size_init(void); | extern void __init hibernate_reserved_size_init(void); | ||||||
|  |  | ||||||
|  | @ -30,6 +30,7 @@ | ||||||
| #include <trace/events/power.h> | #include <trace/events/power.h> | ||||||
| #include <linux/compiler.h> | #include <linux/compiler.h> | ||||||
| #include <linux/moduleparam.h> | #include <linux/moduleparam.h> | ||||||
|  | #include <linux/fs.h> | ||||||
| 
 | 
 | ||||||
| #include "power.h" | #include "power.h" | ||||||
| 
 | 
 | ||||||
|  | @ -374,6 +375,8 @@ static int suspend_prepare(suspend_state_t state) | ||||||
| 	if (error) | 	if (error) | ||||||
| 		goto Restore; | 		goto Restore; | ||||||
| 
 | 
 | ||||||
|  | 	if (filesystem_freeze_enabled) | ||||||
|  | 		filesystems_freeze(); | ||||||
| 	trace_suspend_resume(TPS("freeze_processes"), 0, true); | 	trace_suspend_resume(TPS("freeze_processes"), 0, true); | ||||||
| 	error = suspend_freeze_processes(); | 	error = suspend_freeze_processes(); | ||||||
| 	trace_suspend_resume(TPS("freeze_processes"), 0, false); | 	trace_suspend_resume(TPS("freeze_processes"), 0, false); | ||||||
|  | @ -550,6 +553,7 @@ int suspend_devices_and_enter(suspend_state_t state) | ||||||
| static void suspend_finish(void) | static void suspend_finish(void) | ||||||
| { | { | ||||||
| 	suspend_thaw_processes(); | 	suspend_thaw_processes(); | ||||||
|  | 	filesystems_thaw(); | ||||||
| 	pm_notifier_call_chain(PM_POST_SUSPEND); | 	pm_notifier_call_chain(PM_POST_SUSPEND); | ||||||
| 	pm_restore_console(); | 	pm_restore_console(); | ||||||
| } | } | ||||||
|  | @ -588,6 +592,8 @@ static int enter_state(suspend_state_t state) | ||||||
| 		ksys_sync_helper(); | 		ksys_sync_helper(); | ||||||
| 		trace_suspend_resume(TPS("sync_filesystems"), 0, false); | 		trace_suspend_resume(TPS("sync_filesystems"), 0, false); | ||||||
| 	} | 	} | ||||||
|  | 	if (filesystem_freeze_enabled) | ||||||
|  | 		filesystems_freeze(); | ||||||
| 
 | 
 | ||||||
| 	pm_pr_dbg("Preparing system for sleep (%s)\n", mem_sleep_labels[state]); | 	pm_pr_dbg("Preparing system for sleep (%s)\n", mem_sleep_labels[state]); | ||||||
| 	pm_suspend_clear_flags(); | 	pm_suspend_clear_flags(); | ||||||
|  | @ -609,6 +615,7 @@ static int enter_state(suspend_state_t state) | ||||||
| 	pm_pr_dbg("Finishing wakeup.\n"); | 	pm_pr_dbg("Finishing wakeup.\n"); | ||||||
| 	suspend_finish(); | 	suspend_finish(); | ||||||
|  Unlock: |  Unlock: | ||||||
|  | 	filesystems_thaw(); | ||||||
| 	mutex_unlock(&system_transition_mutex); | 	mutex_unlock(&system_transition_mutex); | ||||||
| 	return error; | 	return error; | ||||||
| } | } | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		
		Reference in a new issue
	
	 Linus Torvalds
						Linus Torvalds