mirror of
				https://github.com/torvalds/linux.git
				synced 2025-10-31 08:38:45 +02:00 
			
		
		
		
	 453a73c306
			
		
	
	
		453a73c306
		
	
	
	
	
		
			
			In zoned mode, a region that has been used and then freed is still not reusable after the freeing. The underlying zone needs to be reset before it can be reused. Btrfs resets a zone when it removes a block group, and then a new block group is allocated on those zones to reuse them. But this is sometimes too late to keep up with the write side. This commit introduces a new space-info reclaim method, ZONE_RESET. It picks a block group from the unused list and resets its zone to reuse the zone_unusable space. This is faster than removing the block group and re-creating a new block group on the same zones. For the first implementation, ZONE_RESET is only applied to a block group whose region is fully zone_unusable. Reclaiming a partially zone_unusable block group could be implemented later. Signed-off-by: Naohiro Aota <naohiro.aota@wdc.com> Signed-off-by: David Sterba <dsterba@suse.com>
		
			
				
	
	
		
			415 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			415 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* SPDX-License-Identifier: GPL-2.0 */
 | |
| 
 | |
| #ifndef BTRFS_ZONED_H
 | |
| #define BTRFS_ZONED_H
 | |
| 
 | |
| #include <linux/types.h>
 | |
| #include <linux/atomic.h>
 | |
| #include <linux/blkdev.h>
 | |
| #include <linux/blkzoned.h>
 | |
| #include <linux/errno.h>
 | |
| #include <linux/spinlock.h>
 | |
| #include <linux/mutex.h>
 | |
| #include "messages.h"
 | |
| #include "volumes.h"
 | |
| #include "disk-io.h"
 | |
| #include "block-group.h"
 | |
| #include "btrfs_inode.h"
 | |
| #include "fs.h"
 | |
| 
 | |
| struct block_device;
 | |
| struct extent_buffer;
 | |
| struct btrfs_bio;
 | |
| struct btrfs_ordered_extent;
 | |
| struct btrfs_fs_info;
 | |
| struct btrfs_space_info;
 | |
| struct btrfs_eb_write_context;
 | |
| struct btrfs_fs_devices;
 | |
| 
 | |
/* NOTE(review): presumably a percentage used as the default reclaim threshold - confirm at the users. */
#define BTRFS_DEFAULT_RECLAIM_THRESH	(75)
 | |
| 
 | |
| struct btrfs_zoned_device_info {
 | |
| 	/*
 | |
| 	 * Number of zones, zone size and types of zones if bdev is a
 | |
| 	 * zoned block device.
 | |
| 	 */
 | |
| 	u64 zone_size;
 | |
| 	u8  zone_size_shift;
 | |
| 	u32 nr_zones;
 | |
| 	unsigned int max_active_zones;
 | |
| 	/*
 | |
| 	 * Reserved active zones for one metadata and one system block group.
 | |
| 	 * It can vary per-device depending on the allocation status.
 | |
| 	 */
 | |
| 	int reserved_active_zones;
 | |
| 	atomic_t active_zones_left;
 | |
| 	unsigned long *seq_zones;
 | |
| 	unsigned long *empty_zones;
 | |
| 	unsigned long *active_zones;
 | |
| 	struct blk_zone *zone_cache;
 | |
| 	struct blk_zone sb_zones[2 * BTRFS_SUPER_MIRROR_MAX];
 | |
| };
 | |
| 
 | |
/* Declared unconditionally, i.e. outside the CONFIG_BLK_DEV_ZONED switch below. */
void btrfs_finish_ordered_zoned(struct btrfs_ordered_extent *ordered);
 | |
| 
 | |
| #ifdef CONFIG_BLK_DEV_ZONED
 | |
| int btrfs_get_dev_zone_info_all_devices(struct btrfs_fs_info *fs_info);
 | |
| int btrfs_get_dev_zone_info(struct btrfs_device *device, bool populate_cache);
 | |
| void btrfs_destroy_dev_zone_info(struct btrfs_device *device);
 | |
| struct btrfs_zoned_device_info *btrfs_clone_dev_zone_info(struct btrfs_device *orig_dev);
 | |
| int btrfs_check_zoned_mode(struct btrfs_fs_info *fs_info);
 | |
| int btrfs_check_mountopts_zoned(const struct btrfs_fs_info *info,
 | |
| 				unsigned long long *mount_opt);
 | |
| int btrfs_sb_log_location_bdev(struct block_device *bdev, int mirror, int rw,
 | |
| 			       u64 *bytenr_ret);
 | |
| int btrfs_sb_log_location(struct btrfs_device *device, int mirror, int rw,
 | |
| 			  u64 *bytenr_ret);
 | |
| int btrfs_advance_sb_log(struct btrfs_device *device, int mirror);
 | |
| int btrfs_reset_sb_log_zones(struct block_device *bdev, int mirror);
 | |
| u64 btrfs_find_allocatable_zones(struct btrfs_device *device, u64 hole_start,
 | |
| 				 u64 hole_end, u64 num_bytes);
 | |
| int btrfs_reset_device_zone(struct btrfs_device *device, u64 physical,
 | |
| 			    u64 length, u64 *bytes);
 | |
| int btrfs_ensure_empty_zones(struct btrfs_device *device, u64 start, u64 size);
 | |
| int btrfs_load_block_group_zone_info(struct btrfs_block_group *cache, bool new);
 | |
| void btrfs_calc_zone_unusable(struct btrfs_block_group *cache);
 | |
| bool btrfs_use_zone_append(struct btrfs_bio *bbio);
 | |
| void btrfs_record_physical_zoned(struct btrfs_bio *bbio);
 | |
| int btrfs_check_meta_write_pointer(struct btrfs_fs_info *fs_info,
 | |
| 				   struct btrfs_eb_write_context *ctx);
 | |
| int btrfs_zoned_issue_zeroout(struct btrfs_device *device, u64 physical, u64 length);
 | |
| int btrfs_sync_zone_write_pointer(struct btrfs_device *tgt_dev, u64 logical,
 | |
| 				  u64 physical_start, u64 physical_pos);
 | |
| bool btrfs_zone_activate(struct btrfs_block_group *block_group);
 | |
| int btrfs_zone_finish(struct btrfs_block_group *block_group);
 | |
| bool btrfs_can_activate_zone(struct btrfs_fs_devices *fs_devices, u64 flags);
 | |
| void btrfs_zone_finish_endio(struct btrfs_fs_info *fs_info, u64 logical,
 | |
| 			     u64 length);
 | |
| void btrfs_schedule_zone_finish_bg(struct btrfs_block_group *bg,
 | |
| 				   struct extent_buffer *eb);
 | |
| void btrfs_clear_data_reloc_bg(struct btrfs_block_group *bg);
 | |
| void btrfs_free_zone_cache(struct btrfs_fs_info *fs_info);
 | |
| bool btrfs_zoned_should_reclaim(const struct btrfs_fs_info *fs_info);
 | |
| void btrfs_zoned_release_data_reloc_bg(struct btrfs_fs_info *fs_info, u64 logical,
 | |
| 				       u64 length);
 | |
| int btrfs_zone_finish_one_bg(struct btrfs_fs_info *fs_info);
 | |
| int btrfs_zoned_activate_one_bg(struct btrfs_fs_info *fs_info,
 | |
| 				struct btrfs_space_info *space_info, bool do_finish);
 | |
| void btrfs_check_active_zone_reservation(struct btrfs_fs_info *fs_info);
 | |
| int btrfs_reset_unused_block_groups(struct btrfs_space_info *space_info, u64 num_bytes);
 | |
| #else /* CONFIG_BLK_DEV_ZONED */
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: does nothing and always returns 0. */
static inline int
btrfs_get_dev_zone_info_all_devices(struct btrfs_fs_info *fs_info)
{
	return 0;
}
 | |
| 
 | |
| static inline int btrfs_get_dev_zone_info(struct btrfs_device *device,
 | |
| 					  bool populate_cache)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: intentionally empty. */
static inline void btrfs_destroy_dev_zone_info(struct btrfs_device *device)
{
}
 | |
| 
 | |
| /*
 | |
|  * In case the kernel is compiled without CONFIG_BLK_DEV_ZONED we'll never call
 | |
|  * into btrfs_clone_dev_zone_info() so it's safe to return NULL here.
 | |
|  */
 | |
| static inline struct btrfs_zoned_device_info *btrfs_clone_dev_zone_info(
 | |
| 						 struct btrfs_device *orig_dev)
 | |
| {
 | |
| 	return NULL;
 | |
| }
 | |
| 
 | |
| static inline int btrfs_check_zoned_mode(const struct btrfs_fs_info *fs_info)
 | |
| {
 | |
| 	if (!btrfs_is_zoned(fs_info))
 | |
| 		return 0;
 | |
| 
 | |
| 	btrfs_err(fs_info, "zoned block devices support is not enabled");
 | |
| 	return -EOPNOTSUPP;
 | |
| }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: @mount_opt is left untouched; always returns 0. */
static inline int
btrfs_check_mountopts_zoned(const struct btrfs_fs_info *info,
			    unsigned long long *mount_opt)
{
	return 0;
}
 | |
| 
 | |
| static inline int btrfs_sb_log_location_bdev(struct block_device *bdev,
 | |
| 					     int mirror, int rw, u64 *bytenr_ret)
 | |
| {
 | |
| 	*bytenr_ret = btrfs_sb_offset(mirror);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline int btrfs_sb_log_location(struct btrfs_device *device, int mirror,
 | |
| 					int rw, u64 *bytenr_ret)
 | |
| {
 | |
| 	*bytenr_ret = btrfs_sb_offset(mirror);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: does nothing and always returns 0. */
static inline int btrfs_advance_sb_log(struct btrfs_device *device,
				       int mirror)
{
	return 0;
}
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: does nothing and always returns 0. */
static inline int btrfs_reset_sb_log_zones(struct block_device *bdev,
					   int mirror)
{
	return 0;
}
 | |
| 
 | |
| static inline u64 btrfs_find_allocatable_zones(struct btrfs_device *device,
 | |
| 					       u64 hole_start, u64 hole_end,
 | |
| 					       u64 num_bytes)
 | |
| {
 | |
| 	return hole_start;
 | |
| }
 | |
| 
 | |
| static inline int btrfs_reset_device_zone(struct btrfs_device *device,
 | |
| 					  u64 physical, u64 length, u64 *bytes)
 | |
| {
 | |
| 	*bytes = 0;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline int btrfs_ensure_empty_zones(struct btrfs_device *device,
 | |
| 					   u64 start, u64 size)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline int btrfs_load_block_group_zone_info(
 | |
| 		struct btrfs_block_group *cache, bool new)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: intentionally empty. */
static inline void btrfs_calc_zone_unusable(struct btrfs_block_group *cache)
{
}
 | |
| 
 | |
| static inline bool btrfs_use_zone_append(struct btrfs_bio *bbio)
 | |
| {
 | |
| 	return false;
 | |
| }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: intentionally empty. */
static inline void btrfs_record_physical_zoned(struct btrfs_bio *bbio) { }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: performs no check and always returns 0. */
static inline int
btrfs_check_meta_write_pointer(struct btrfs_fs_info *fs_info,
			       struct btrfs_eb_write_context *ctx)
{
	return 0;
}
 | |
| 
 | |
| static inline int btrfs_zoned_issue_zeroout(struct btrfs_device *device,
 | |
| 					    u64 physical, u64 length)
 | |
| {
 | |
| 	return -EOPNOTSUPP;
 | |
| }
 | |
| 
 | |
| static inline int btrfs_sync_zone_write_pointer(struct btrfs_device *tgt_dev,
 | |
| 						u64 logical, u64 physical_start,
 | |
| 						u64 physical_pos)
 | |
| {
 | |
| 	return -EOPNOTSUPP;
 | |
| }
 | |
| 
 | |
| static inline bool btrfs_zone_activate(struct btrfs_block_group *block_group)
 | |
| {
 | |
| 	return true;
 | |
| }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: does nothing and always returns 0. */
static inline int
btrfs_zone_finish(struct btrfs_block_group *block_group)
{
	return 0;
}
 | |
| 
 | |
| static inline bool btrfs_can_activate_zone(struct btrfs_fs_devices *fs_devices,
 | |
| 					   u64 flags)
 | |
| {
 | |
| 	return true;
 | |
| }
 | |
| 
 | |
| static inline void btrfs_zone_finish_endio(struct btrfs_fs_info *fs_info,
 | |
| 					   u64 logical, u64 length) { }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: intentionally empty. */
static inline void btrfs_schedule_zone_finish_bg(struct btrfs_block_group *bg,
						 struct extent_buffer *eb)
{
}
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: intentionally empty. */
static inline void btrfs_clear_data_reloc_bg(struct btrfs_block_group *bg)
{
}
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: intentionally empty. */
static inline void btrfs_free_zone_cache(struct btrfs_fs_info *fs_info)
{
}
 | |
| 
 | |
| static inline bool btrfs_zoned_should_reclaim(const struct btrfs_fs_info *fs_info)
 | |
| {
 | |
| 	return false;
 | |
| }
 | |
| 
 | |
| static inline void btrfs_zoned_release_data_reloc_bg(struct btrfs_fs_info *fs_info,
 | |
| 						     u64 logical, u64 length) { }
 | |
| 
 | |
/*
 * !CONFIG_BLK_DEV_ZONED stub: always returns 1 (unlike most stubs in this
 * section, which return 0).
 */
static inline int
btrfs_zone_finish_one_bg(struct btrfs_fs_info *fs_info)
{
	return 1;
}
 | |
| 
 | |
| static inline int btrfs_zoned_activate_one_bg(struct btrfs_fs_info *fs_info,
 | |
| 					      struct btrfs_space_info *space_info,
 | |
| 					      bool do_finish)
 | |
| {
 | |
| 	/* Consider all the block groups are active */
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
/* !CONFIG_BLK_DEV_ZONED stub: intentionally empty. */
static inline void
btrfs_check_active_zone_reservation(struct btrfs_fs_info *fs_info)
{
}
 | |
| 
 | |
| static inline int btrfs_reset_unused_block_groups(struct btrfs_space_info *space_info,
 | |
| 						  u64 num_bytes)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| static inline bool btrfs_dev_is_sequential(struct btrfs_device *device, u64 pos)
 | |
| {
 | |
| 	struct btrfs_zoned_device_info *zone_info = device->zone_info;
 | |
| 
 | |
| 	if (!zone_info)
 | |
| 		return false;
 | |
| 
 | |
| 	return test_bit(pos >> zone_info->zone_size_shift, zone_info->seq_zones);
 | |
| }
 | |
| 
 | |
| static inline bool btrfs_dev_is_empty_zone(struct btrfs_device *device, u64 pos)
 | |
| {
 | |
| 	struct btrfs_zoned_device_info *zone_info = device->zone_info;
 | |
| 
 | |
| 	if (!zone_info)
 | |
| 		return true;
 | |
| 
 | |
| 	return test_bit(pos >> zone_info->zone_size_shift, zone_info->empty_zones);
 | |
| }
 | |
| 
 | |
| static inline void btrfs_dev_set_empty_zone_bit(struct btrfs_device *device,
 | |
| 						u64 pos, bool set)
 | |
| {
 | |
| 	struct btrfs_zoned_device_info *zone_info = device->zone_info;
 | |
| 	unsigned int zno;
 | |
| 
 | |
| 	if (!zone_info)
 | |
| 		return;
 | |
| 
 | |
| 	zno = pos >> zone_info->zone_size_shift;
 | |
| 	if (set)
 | |
| 		set_bit(zno, zone_info->empty_zones);
 | |
| 	else
 | |
| 		clear_bit(zno, zone_info->empty_zones);
 | |
| }
 | |
| 
 | |
| static inline void btrfs_dev_set_zone_empty(struct btrfs_device *device, u64 pos)
 | |
| {
 | |
| 	btrfs_dev_set_empty_zone_bit(device, pos, true);
 | |
| }
 | |
| 
 | |
| static inline void btrfs_dev_clear_zone_empty(struct btrfs_device *device, u64 pos)
 | |
| {
 | |
| 	btrfs_dev_set_empty_zone_bit(device, pos, false);
 | |
| }
 | |
| 
 | |
| static inline bool btrfs_check_device_zone_type(const struct btrfs_fs_info *fs_info,
 | |
| 						struct block_device *bdev)
 | |
| {
 | |
| 	if (btrfs_is_zoned(fs_info)) {
 | |
| 		/*
 | |
| 		 * We can allow a regular device on a zoned filesystem, because
 | |
| 		 * we will emulate the zoned capabilities.
 | |
| 		 */
 | |
| 		if (!bdev_is_zoned(bdev))
 | |
| 			return true;
 | |
| 
 | |
| 		return fs_info->zone_size ==
 | |
| 			(bdev_zone_sectors(bdev) << SECTOR_SHIFT);
 | |
| 	}
 | |
| 
 | |
| 	/* Do not allow Host Managed zoned device. */
 | |
| 	return !bdev_is_zoned(bdev);
 | |
| }
 | |
| 
 | |
| static inline bool btrfs_check_super_location(struct btrfs_device *device, u64 pos)
 | |
| {
 | |
| 	/*
 | |
| 	 * On a non-zoned device, any address is OK. On a zoned device,
 | |
| 	 * non-SEQUENTIAL WRITE REQUIRED zones are capable.
 | |
| 	 */
 | |
| 	return device->zone_info == NULL || !btrfs_dev_is_sequential(device, pos);
 | |
| }
 | |
| 
 | |
| static inline bool btrfs_can_zone_reset(struct btrfs_device *device,
 | |
| 					u64 physical, u64 length)
 | |
| {
 | |
| 	u64 zone_size;
 | |
| 
 | |
| 	if (!btrfs_dev_is_sequential(device, physical))
 | |
| 		return false;
 | |
| 
 | |
| 	zone_size = device->zone_info->zone_size;
 | |
| 	if (!IS_ALIGNED(physical, zone_size) || !IS_ALIGNED(length, zone_size))
 | |
| 		return false;
 | |
| 
 | |
| 	return true;
 | |
| }
 | |
| 
 | |
| static inline void btrfs_zoned_meta_io_lock(struct btrfs_fs_info *fs_info)
 | |
| {
 | |
| 	if (!btrfs_is_zoned(fs_info))
 | |
| 		return;
 | |
| 	mutex_lock(&fs_info->zoned_meta_io_lock);
 | |
| }
 | |
| 
 | |
| static inline void btrfs_zoned_meta_io_unlock(struct btrfs_fs_info *fs_info)
 | |
| {
 | |
| 	if (!btrfs_is_zoned(fs_info))
 | |
| 		return;
 | |
| 	mutex_unlock(&fs_info->zoned_meta_io_lock);
 | |
| }
 | |
| 
 | |
| static inline void btrfs_clear_treelog_bg(struct btrfs_block_group *bg)
 | |
| {
 | |
| 	struct btrfs_fs_info *fs_info = bg->fs_info;
 | |
| 
 | |
| 	if (!btrfs_is_zoned(fs_info))
 | |
| 		return;
 | |
| 
 | |
| 	spin_lock(&fs_info->treelog_bg_lock);
 | |
| 	if (fs_info->treelog_bg == bg->start)
 | |
| 		fs_info->treelog_bg = 0;
 | |
| 	spin_unlock(&fs_info->treelog_bg_lock);
 | |
| }
 | |
| 
 | |
| static inline void btrfs_zoned_data_reloc_lock(struct btrfs_inode *inode)
 | |
| {
 | |
| 	struct btrfs_root *root = inode->root;
 | |
| 
 | |
| 	if (btrfs_is_data_reloc_root(root) && btrfs_is_zoned(root->fs_info))
 | |
| 		mutex_lock(&root->fs_info->zoned_data_reloc_io_lock);
 | |
| }
 | |
| 
 | |
| static inline void btrfs_zoned_data_reloc_unlock(struct btrfs_inode *inode)
 | |
| {
 | |
| 	struct btrfs_root *root = inode->root;
 | |
| 
 | |
| 	if (btrfs_is_data_reloc_root(root) && btrfs_is_zoned(root->fs_info))
 | |
| 		mutex_unlock(&root->fs_info->zoned_data_reloc_io_lock);
 | |
| }
 | |
| 
 | |
| static inline bool btrfs_zoned_bg_is_full(const struct btrfs_block_group *bg)
 | |
| {
 | |
| 	ASSERT(btrfs_is_zoned(bg->fs_info));
 | |
| 	return (bg->alloc_offset == bg->zone_capacity);
 | |
| }
 | |
| 
 | |
| #endif
 |