/* * Block Translation Table library * Copyright (c) 2014-2015, Intel Corporation. * * This program is free software; you can redistribute it and/or modify it * under the terms and conditions of the GNU General Public License, * version 2, as published by the Free Software Foundation. * * This program is distributed in the hope it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for * more details. */ #ifndef _LINUX_BTT_H #define _LINUX_BTT_H #include <linux/badblocks.h> #include <linux/types.h> #define BTT_SIG_LEN 16 #define BTT_SIG "BTT_ARENA_INFO\0" #define MAP_ENT_SIZE 4 #define MAP_TRIM_SHIFT 31 #define MAP_TRIM_MASK (1 << MAP_TRIM_SHIFT) #define MAP_ERR_SHIFT 30 #define MAP_ERR_MASK (1 << MAP_ERR_SHIFT) #define MAP_LBA_MASK (~((1 << MAP_TRIM_SHIFT) | (1 << MAP_ERR_SHIFT))) #define MAP_ENT_NORMAL 0xC0000000 #define LOG_GRP_SIZE sizeof(struct log_group) #define LOG_ENT_SIZE sizeof(struct log_entry) #define ARENA_MIN_SIZE (1UL << 24) /* 16 MB */ #define ARENA_MAX_SIZE (1ULL << 39) /* 512 GB */ #define RTT_VALID (1UL << 31) #define RTT_INVALID 0 #define BTT_PG_SIZE 4096 #define BTT_DEFAULT_NFREE ND_MAX_LANES #define LOG_SEQ_INIT 1 #define IB_FLAG_ERROR 0x00000001 #define IB_FLAG_ERROR_MASK 0x00000001 #define ent_lba(ent) (ent & MAP_LBA_MASK) #define ent_e_flag(ent) (!!(ent & MAP_ERR_MASK)) #define ent_z_flag(ent) (!!(ent & MAP_TRIM_MASK)) #define set_e_flag(ent) (ent |= MAP_ERR_MASK) enum btt_init_state { INIT_UNCHECKED = 0, INIT_NOTFOUND, INIT_READY }; /* * A log group represents one log 'lane', and consists of four log entries. * Two of the four entries are valid entries, and the remaining two are * padding. Due to an old bug in the padding location, we need to perform a * test to determine the padding scheme being used, and use that scheme * thereafter. * * In kernels prior to 4.15, 'log group' would have actual log entries at * indices (0, 2) and padding at indices (1, 3), where as the correct/updated * format has log entries at indices (0, 1) and padding at indices (2, 3). * * Old (pre 4.15) format: * +-----------------+-----------------+ * | ent[0] | ent[1] | * | 16B | 16B | * | lba/old/new/seq | pad | * +-----------------------------------+ * | ent[2] | ent[3] | * | 16B | 16B | * | lba/old/new/seq | pad | * +-----------------+-----------------+ * * New format: * +-----------------+-----------------+ * | ent[0] | ent[1] | * | 16B | 16B | * | lba/old/new/seq | lba/old/new/seq | * +-----------------------------------+ * | ent[2] | ent[3] | * | 16B | 16B | * | pad | pad | * +-----------------+-----------------+ * * We detect during start-up which format is in use, and set * arena->log_index[(0, 1)] with the detected format. */ struct log_entry { __le32 lba; __le32 old_map; __le32 new_map; __le32 seq; }; struct log_group { struct log_entry ent[4]; }; struct btt_sb { u8 signature[BTT_SIG_LEN]; u8 uuid[16]; u8 parent_uuid[16]; __le32 flags; __le16 version_major; __le16 version_minor; __le32 external_lbasize; __le32 external_nlba; __le32 internal_lbasize; __le32 internal_nlba; __le32 nfree; __le32 infosize; __le64 nextoff; __le64 dataoff; __le64 mapoff; __le64 logoff; __le64 info2off; u8 padding[3968]; __le64 checksum; }; struct free_entry { u32 block; u8 sub; u8 seq; u8 has_err; }; struct aligned_lock { union { spinlock_t lock; u8 cacheline_padding[L1_CACHE_BYTES]; }; }; /** * struct arena_info - handle for an arena * @size: Size in bytes this arena occupies on the raw device. * This includes arena metadata. * @external_lba_start: The first external LBA in this arena. * @internal_nlba: Number of internal blocks available in the arena * including nfree reserved blocks * @internal_lbasize: Internal and external lba sizes may be different as * we can round up 'odd' external lbasizes such as 520B * to be aligned. * @external_nlba: Number of blocks contributed by the arena to the number * reported to upper layers. (internal_nlba - nfree) * @external_lbasize: LBA size as exposed to upper layers. * @nfree: A reserve number of 'free' blocks that is used to * handle incoming writes. * @version_major: Metadata layout version major. * @version_minor: Metadata layout version minor. * @sector_size: The Linux sector size - 512 or 4096 * @nextoff: Offset in bytes to the start of the next arena. * @infooff: Offset in bytes to the info block of this arena. * @dataoff: Offset in bytes to the data area of this arena. * @mapoff: Offset in bytes to the map area of this arena. * @logoff: Offset in bytes to the log area of this arena. * @info2off: Offset in bytes to the backup info block of this arena. * @freelist: Pointer to in-memory list of free blocks * @rtt: Pointer to in-memory "Read Tracking Table" * @map_locks: Spinlocks protecting concurrent map writes * @nd_btt: Pointer to parent nd_btt structure. * @list: List head for list of arenas * @debugfs_dir: Debugfs dentry * @flags: Arena flags - may signify error states. * @err_lock: Mutex for synchronizing error clearing. * @log_index: Indices of the valid log entries in a log_group * * arena_info is a per-arena handle. Once an arena is narrowed down for an * IO, this struct is passed around for the duration of the IO. */ struct arena_info { u64 size; /* Total bytes for this arena */ u64 external_lba_start; u32 internal_nlba; u32 internal_lbasize; u32 external_nlba; u32 external_lbasize; u32 nfree; u16 version_major; u16 version_minor; u32 sector_size; /* Byte offsets to the different on-media structures */ u64 nextoff; u64 infooff; u64 dataoff; u64 mapoff; u64 logoff; u64 info2off; /* Pointers to other in-memory structures for this arena */ struct free_entry *freelist; u32 *rtt; struct aligned_lock *map_locks; struct nd_btt *nd_btt; struct list_head list; struct dentry *debugfs_dir; /* Arena flags */ u32 flags; struct mutex err_lock; int log_index[2]; }; /** * struct btt - handle for a BTT instance * @btt_disk: Pointer to the gendisk for BTT device * @btt_queue: Pointer to the request queue for the BTT device * @arena_list: Head of the list of arenas * @debugfs_dir: Debugfs dentry * @nd_btt: Parent nd_btt struct * @nlba: Number of logical blocks exposed to the upper layers * after removing the amount of space needed by metadata * @rawsize: Total size in bytes of the available backing device * @lbasize: LBA size as requested and presented to upper layers. * This is sector_size + size of any metadata. * @sector_size: The Linux sector size - 512 or 4096 * @lanes: Per-lane spinlocks * @init_lock: Mutex used for the BTT initialization * @init_state: Flag describing the initialization state for the BTT * @num_arenas: Number of arenas in the BTT instance * @phys_bb: Pointer to the namespace's badblocks structure */ struct btt { struct gendisk *btt_disk; struct request_queue *btt_queue; struct list_head arena_list; struct dentry *debugfs_dir; struct nd_btt *nd_btt; u64 nlba; unsigned long long rawsize; u32 lbasize; u32 sector_size; struct nd_region *nd_region; struct mutex init_lock; int init_state; int num_arenas; struct badblocks *phys_bb; }; bool nd_btt_arena_is_valid(struct nd_btt *nd_btt, struct btt_sb *super); int nd_btt_version(struct nd_btt *nd_btt, struct nd_namespace_common *ndns, struct btt_sb *btt_sb); #endif