247 строки
7.6 KiB
C
247 строки
7.6 KiB
C
/*
 * Block Translation Table library
 * Copyright (c) 2014-2015, Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 */
|
|
|
|
#ifndef _LINUX_BTT_H
|
|
#define _LINUX_BTT_H
|
|
|
|
#include <linux/badblocks.h>
|
|
#include <linux/types.h>
|
|
|
|
/* Length in bytes of the signature field, and the signature string itself. */
#define BTT_SIG_LEN 16
#define BTT_SIG "BTT_ARENA_INFO\0"

/*
 * Map entry encoding: each entry is MAP_ENT_SIZE bytes. Bit 31 is the trim
 * flag, bit 30 is the error flag, and the remaining low bits hold the LBA.
 *
 * The masks are built from unsigned constants: shifting a signed 1 into
 * bit 31 overflows 'int', and the resulting negative value would
 * sign-extend if it were ever combined with a 64-bit operand.
 */
#define MAP_ENT_SIZE 4
#define MAP_TRIM_SHIFT 31
#define MAP_TRIM_MASK (1U << MAP_TRIM_SHIFT)
#define MAP_ERR_SHIFT 30
#define MAP_ERR_MASK (1U << MAP_ERR_SHIFT)
#define MAP_LBA_MASK (~(MAP_TRIM_MASK | MAP_ERR_MASK))
/* Both the trim and the error bit set. */
#define MAP_ENT_NORMAL 0xC0000000

/* Sizes of the log structures declared later in this header. */
#define LOG_GRP_SIZE sizeof(struct log_group)
#define LOG_ENT_SIZE sizeof(struct log_entry)

#define ARENA_MIN_SIZE (1UL << 24)	/* 16 MB */
#define ARENA_MAX_SIZE (1ULL << 39)	/* 512 GB */
#define RTT_VALID (1UL << 31)
#define RTT_INVALID 0
#define BTT_PG_SIZE 4096
#define BTT_DEFAULT_NFREE ND_MAX_LANES
#define LOG_SEQ_INIT 1

#define IB_FLAG_ERROR 0x00000001
#define IB_FLAG_ERROR_MASK 0x00000001

/*
 * Map entry accessors. The argument is parenthesized so that compound
 * expressions (e.g. "a | b") are masked as a whole.
 *
 * ent_lba()    - LBA bits of a map entry
 * ent_e_flag() - 1 if the error bit is set, else 0
 * ent_z_flag() - 1 if the trim bit is set, else 0
 * set_e_flag() - set the error bit in the lvalue @ent
 */
#define ent_lba(ent) ((ent) & MAP_LBA_MASK)
#define ent_e_flag(ent) (!!((ent) & MAP_ERR_MASK))
#define ent_z_flag(ent) (!!((ent) & MAP_TRIM_MASK))
#define set_e_flag(ent) ((ent) |= MAP_ERR_MASK)
|
|
|
|
/*
 * Initialization states for a BTT instance.
 * NOTE(review): presumably the values stored in btt->init_state -- confirm
 * against the users of that field.
 */
enum btt_init_state {
	INIT_UNCHECKED = 0,
	INIT_NOTFOUND = 1,
	INIT_READY = 2
};
|
|
|
|
/*
 * A log group represents one log 'lane', and consists of four log entries.
 * Two of the four entries are valid entries, and the remaining two are
 * padding. Due to an old bug in the padding location, we need to perform a
 * test to determine the padding scheme being used, and use that scheme
 * thereafter.
 *
 * In kernels prior to 4.15, 'log group' would have actual log entries at
 * indices (0, 2) and padding at indices (1, 3), whereas the correct/updated
 * format has log entries at indices (0, 1) and padding at indices (2, 3).
 *
 * Old (pre 4.15) format:
 * +-----------------+-----------------+
 * |      ent[0]     |      ent[1]     |
 * |       16B       |       16B       |
 * | lba/old/new/seq |       pad       |
 * +-----------------------------------+
 * |      ent[2]     |      ent[3]     |
 * |       16B       |       16B       |
 * | lba/old/new/seq |       pad       |
 * +-----------------+-----------------+
 *
 * New format:
 * +-----------------+-----------------+
 * |      ent[0]     |      ent[1]     |
 * |       16B       |       16B       |
 * | lba/old/new/seq | lba/old/new/seq |
 * +-----------------------------------+
 * |      ent[2]     |      ent[3]     |
 * |       16B       |       16B       |
 * |       pad       |       pad       |
 * +-----------------+-----------------+
 *
 * We detect during start-up which format is in use, and set
 * arena->log_index[(0, 1)] with the detected format.
 */
|
|
|
|
struct log_entry {
|
|
__le32 lba;
|
|
__le32 old_map;
|
|
__le32 new_map;
|
|
__le32 seq;
|
|
};
|
|
|
|
struct log_group {
|
|
struct log_entry ent[4];
|
|
};
|
|
|
|
struct btt_sb {
|
|
u8 signature[BTT_SIG_LEN];
|
|
u8 uuid[16];
|
|
u8 parent_uuid[16];
|
|
__le32 flags;
|
|
__le16 version_major;
|
|
__le16 version_minor;
|
|
__le32 external_lbasize;
|
|
__le32 external_nlba;
|
|
__le32 internal_lbasize;
|
|
__le32 internal_nlba;
|
|
__le32 nfree;
|
|
__le32 infosize;
|
|
__le64 nextoff;
|
|
__le64 dataoff;
|
|
__le64 mapoff;
|
|
__le64 logoff;
|
|
__le64 info2off;
|
|
u8 padding[3968];
|
|
__le64 checksum;
|
|
};
|
|
|
|
struct free_entry {
|
|
u32 block;
|
|
u8 sub;
|
|
u8 seq;
|
|
u8 has_err;
|
|
};
|
|
|
|
struct aligned_lock {
|
|
union {
|
|
spinlock_t lock;
|
|
u8 cacheline_padding[L1_CACHE_BYTES];
|
|
};
|
|
};
|
|
|
|
/**
|
|
* struct arena_info - handle for an arena
|
|
* @size: Size in bytes this arena occupies on the raw device.
|
|
* This includes arena metadata.
|
|
* @external_lba_start: The first external LBA in this arena.
|
|
* @internal_nlba: Number of internal blocks available in the arena
|
|
* including nfree reserved blocks
|
|
* @internal_lbasize: Internal and external lba sizes may be different as
|
|
* we can round up 'odd' external lbasizes such as 520B
|
|
* to be aligned.
|
|
* @external_nlba: Number of blocks contributed by the arena to the number
|
|
* reported to upper layers. (internal_nlba - nfree)
|
|
* @external_lbasize: LBA size as exposed to upper layers.
|
|
* @nfree: A reserve number of 'free' blocks that is used to
|
|
* handle incoming writes.
|
|
* @version_major: Metadata layout version major.
|
|
* @version_minor: Metadata layout version minor.
|
|
* @sector_size: The Linux sector size - 512 or 4096
|
|
* @nextoff: Offset in bytes to the start of the next arena.
|
|
* @infooff: Offset in bytes to the info block of this arena.
|
|
* @dataoff: Offset in bytes to the data area of this arena.
|
|
* @mapoff: Offset in bytes to the map area of this arena.
|
|
* @logoff: Offset in bytes to the log area of this arena.
|
|
* @info2off: Offset in bytes to the backup info block of this arena.
|
|
* @freelist: Pointer to in-memory list of free blocks
|
|
* @rtt: Pointer to in-memory "Read Tracking Table"
|
|
* @map_locks: Spinlocks protecting concurrent map writes
|
|
* @nd_btt: Pointer to parent nd_btt structure.
|
|
* @list: List head for list of arenas
|
|
* @debugfs_dir: Debugfs dentry
|
|
* @flags: Arena flags - may signify error states.
|
|
* @err_lock: Mutex for synchronizing error clearing.
|
|
* @log_index: Indices of the valid log entries in a log_group
|
|
*
|
|
* arena_info is a per-arena handle. Once an arena is narrowed down for an
|
|
* IO, this struct is passed around for the duration of the IO.
|
|
*/
|
|
struct arena_info {
|
|
u64 size; /* Total bytes for this arena */
|
|
u64 external_lba_start;
|
|
u32 internal_nlba;
|
|
u32 internal_lbasize;
|
|
u32 external_nlba;
|
|
u32 external_lbasize;
|
|
u32 nfree;
|
|
u16 version_major;
|
|
u16 version_minor;
|
|
u32 sector_size;
|
|
/* Byte offsets to the different on-media structures */
|
|
u64 nextoff;
|
|
u64 infooff;
|
|
u64 dataoff;
|
|
u64 mapoff;
|
|
u64 logoff;
|
|
u64 info2off;
|
|
/* Pointers to other in-memory structures for this arena */
|
|
struct free_entry *freelist;
|
|
u32 *rtt;
|
|
struct aligned_lock *map_locks;
|
|
struct nd_btt *nd_btt;
|
|
struct list_head list;
|
|
struct dentry *debugfs_dir;
|
|
/* Arena flags */
|
|
u32 flags;
|
|
struct mutex err_lock;
|
|
int log_index[2];
|
|
};
|
|
|
|
/**
|
|
* struct btt - handle for a BTT instance
|
|
* @btt_disk: Pointer to the gendisk for BTT device
|
|
* @btt_queue: Pointer to the request queue for the BTT device
|
|
* @arena_list: Head of the list of arenas
|
|
* @debugfs_dir: Debugfs dentry
|
|
* @nd_btt: Parent nd_btt struct
|
|
* @nlba: Number of logical blocks exposed to the upper layers
|
|
* after removing the amount of space needed by metadata
|
|
* @rawsize: Total size in bytes of the available backing device
|
|
* @lbasize: LBA size as requested and presented to upper layers.
|
|
* This is sector_size + size of any metadata.
|
|
* @sector_size: The Linux sector size - 512 or 4096
|
|
* @lanes: Per-lane spinlocks
|
|
* @init_lock: Mutex used for the BTT initialization
|
|
* @init_state: Flag describing the initialization state for the BTT
|
|
* @num_arenas: Number of arenas in the BTT instance
|
|
* @phys_bb: Pointer to the namespace's badblocks structure
|
|
*/
|
|
struct btt {
|
|
struct gendisk *btt_disk;
|
|
struct request_queue *btt_queue;
|
|
struct list_head arena_list;
|
|
struct dentry *debugfs_dir;
|
|
struct nd_btt *nd_btt;
|
|
u64 nlba;
|
|
unsigned long long rawsize;
|
|
u32 lbasize;
|
|
u32 sector_size;
|
|
struct nd_region *nd_region;
|
|
struct mutex init_lock;
|
|
int init_state;
|
|
int num_arenas;
|
|
struct badblocks *phys_bb;
|
|
};
|
|
|
|
/*
 * Forward declarations so that the struct tags named in the prototypes
 * below have file scope rather than prototype scope when this header is
 * included before their definitions.
 */
struct nd_btt;
struct nd_namespace_common;

/*
 * Implemented outside this header.
 * NOTE(review): presumably nd_btt_arena_is_valid() checks the info block
 * @super against @nd_btt, and nd_btt_version() determines the BTT version
 * for namespace @ndns using @btt_sb -- confirm against the definitions.
 */
bool nd_btt_arena_is_valid(struct nd_btt *nd_btt, struct btt_sb *super);
int nd_btt_version(struct nd_btt *nd_btt, struct nd_namespace_common *ndns,
		   struct btt_sb *btt_sb);
|
|
|
|
#endif
|