2017-03-16 22:18:50 -08:00
// SPDX-License-Identifier: GPL-2.0
/*
 * Code for manipulating bucket marks for garbage collection.
 *
 * Copyright 2014 Datera, Inc.
 *
 * Bucket states:
 * - free bucket: mark == 0
 *   The bucket contains no data and will not be read
 *
 * - allocator bucket: owned_by_allocator == 1
 *   The bucket is on a free list, or it is an open bucket
 *
 * - cached bucket: owned_by_allocator == 0 &&
 *                  dirty_sectors == 0 &&
 *                  cached_sectors > 0
 *   The bucket contains data but may be safely discarded as there are
 *   enough replicas of the data on other cache devices, or it has been
 *   written back to the backing device
 *
 * - dirty bucket: owned_by_allocator == 0 &&
 *                 dirty_sectors > 0
 *   The bucket contains data that we must not discard (either only copy,
 *   or one of the 'main copies' for data requiring multiple replicas)
 *
 * - metadata bucket: owned_by_allocator == 0 && is_metadata == 1
 *   This is a btree node, journal or gen/prio bucket
 *
 * Lifecycle:
 *
 * bucket invalidated => bucket on freelist => open bucket =>
 * [dirty bucket =>] cached bucket => bucket invalidated => ...
 *
 * Note that cache promotion can skip the dirty bucket step, as data
 * is copied from a deeper tier to a shallower tier, onto a cached
 * bucket.
 * Note also that a cached bucket can spontaneously become dirty --
 * see below.
 *
 * Only a traversal of the key space can determine whether a bucket is
 * truly dirty or cached.
 *
 * Transitions:
 *
 * - free => allocator: bucket was invalidated
 * - cached => allocator: bucket was invalidated
 *
 * - allocator => dirty: open bucket was filled up
 * - allocator => cached: open bucket was filled up
 * - allocator => metadata: metadata was allocated
 *
 * - dirty => cached: dirty sectors were copied to a deeper tier
 * - dirty => free: dirty sectors were overwritten or moved (copy gc)
 * - cached => free: cached sectors were overwritten
 *
 * - metadata => free: metadata was freed
 *
 * Oddities:
 * - cached => dirty: a device was removed so formerly replicated data
 *   is no longer sufficiently replicated
 * - free => cached: cannot happen
 * - free => dirty: cannot happen
 * - free => metadata: cannot happen
 */
# include "bcachefs.h"
2018-10-06 00:46:55 -04:00
# include "alloc_background.h"
2018-11-05 02:31:48 -05:00
# include "bset.h"
2017-03-16 22:18:50 -08:00
# include "btree_gc.h"
2018-11-05 02:31:48 -05:00
# include "btree_update.h"
2017-03-16 22:18:50 -08:00
# include "buckets.h"
2018-11-01 15:13:19 -04:00
# include "ec.h"
2017-03-16 22:18:50 -08:00
# include "error.h"
# include "movinggc.h"
2019-01-21 15:32:13 -05:00
# include "replicas.h"
2017-03-16 22:18:50 -08:00
# include "trace.h"
# include <linux/preempt.h>
2020-07-09 18:31:51 -04:00
/*
 * Add @sectors to the filesystem-wide summary counter matching @data_type:
 * btree, data (user and parity both land here) or cached.  Any other data
 * type leaves @fs_usage untouched.
 */
static inline void fs_usage_data_type_to_base(struct bch_fs_usage *fs_usage,
					      enum bch_data_type data_type,
					      s64 sectors)
{
	if (data_type == BCH_DATA_btree)
		fs_usage->btree += sectors;
	else if (data_type == BCH_DATA_user ||
		 data_type == BCH_DATA_parity)
		fs_usage->data += sectors;
	else if (data_type == BCH_DATA_cached)
		fs_usage->cached += sectors;
}
2017-03-16 22:18:50 -08:00
/*
* Clear journal_seq_valid for buckets for which it ' s not needed , to prevent
* wraparound :
*/
void bch2_bucket_seq_cleanup ( struct bch_fs * c )
{
2018-07-21 22:57:20 -04:00
u64 journal_seq = atomic64_read ( & c - > journal . seq ) ;
2017-03-16 22:18:50 -08:00
u16 last_seq_ondisk = c - > journal . last_seq_ondisk ;
struct bch_dev * ca ;
struct bucket_array * buckets ;
struct bucket * g ;
struct bucket_mark m ;
unsigned i ;
2018-07-21 22:57:20 -04:00
if ( journal_seq - c - > last_bucket_seq_cleanup <
( 1U < < ( BUCKET_JOURNAL_SEQ_BITS - 2 ) ) )
return ;
c - > last_bucket_seq_cleanup = journal_seq ;
2017-03-16 22:18:50 -08:00
for_each_member_device ( ca , c , i ) {
down_read ( & ca - > bucket_lock ) ;
buckets = bucket_array ( ca ) ;
for_each_bucket ( g , buckets ) {
bucket_cmpxchg ( g , m , ( {
if ( ! m . journal_seq_valid | |
bucket_needs_journal_commit ( m , last_seq_ondisk ) )
break ;
m . journal_seq_valid = 0 ;
} ) ) ;
}
up_read ( & ca - > bucket_lock ) ;
}
}
2019-01-24 20:25:40 -05:00
void bch2_fs_usage_initialize ( struct bch_fs * c )
{
struct bch_fs_usage * usage ;
2021-01-21 21:52:06 -05:00
struct bch_dev * ca ;
2019-02-14 20:39:17 -05:00
unsigned i ;
2019-01-24 20:25:40 -05:00
percpu_down_write ( & c - > mark_lock ) ;
2019-02-10 19:34:47 -05:00
usage = c - > usage_base ;
for ( i = 0 ; i < ARRAY_SIZE ( c - > usage ) ; i + + )
bch2_fs_usage_acc_to_base ( c , i ) ;
2019-01-24 20:25:40 -05:00
2019-02-09 19:20:57 -05:00
for ( i = 0 ; i < BCH_REPLICAS_MAX ; i + + )
2019-02-14 18:38:52 -05:00
usage - > reserved + = usage - > persistent_reserved [ i ] ;
2019-02-09 19:20:57 -05:00
2019-01-24 20:25:40 -05:00
for ( i = 0 ; i < c - > replicas . nr ; i + + ) {
struct bch_replicas_entry * e =
cpu_replicas_entry ( & c - > replicas , i ) ;
2020-07-09 18:31:51 -04:00
fs_usage_data_type_to_base ( usage , e - > data_type , usage - > replicas [ i ] ) ;
2019-01-24 20:25:40 -05:00
}
2021-01-21 21:52:06 -05:00
for_each_member_device ( ca , c , i ) {
struct bch_dev_usage dev = bch2_dev_usage_read ( ca ) ;
usage - > hidden + = ( dev . d [ BCH_DATA_sb ] . buckets +
dev . d [ BCH_DATA_journal ] . buckets ) *
ca - > mi . bucket_size ;
}
2019-01-24 20:25:40 -05:00
percpu_up_write ( & c - > mark_lock ) ;
}
2021-01-21 21:52:06 -05:00
/*
 * Return this CPU's device usage counters: the gc copy when @gc is set,
 * otherwise the buffer selected by @journal_seq & JOURNAL_BUF_MASK.
 */
static inline struct bch_dev_usage *dev_usage_ptr(struct bch_dev *ca,
						  unsigned journal_seq,
						  bool gc)
{
	if (gc)
		return this_cpu_ptr(ca->usage_gc);

	return this_cpu_ptr(ca->usage[journal_seq & JOURNAL_BUF_MASK]);
}
2020-07-22 13:27:00 -04:00
struct bch_dev_usage bch2_dev_usage_read ( struct bch_dev * ca )
2017-03-16 22:18:50 -08:00
{
2021-01-21 21:52:06 -05:00
struct bch_fs * c = ca - > fs ;
2019-02-14 18:38:52 -05:00
struct bch_dev_usage ret ;
2021-01-21 21:52:06 -05:00
unsigned seq , i , u64s = dev_usage_u64s ( ) ;
2019-02-14 18:38:52 -05:00
2021-01-21 21:52:06 -05:00
do {
seq = read_seqcount_begin ( & c - > usage_lock ) ;
memcpy ( & ret , ca - > usage_base , u64s * sizeof ( u64 ) ) ;
for ( i = 0 ; i < ARRAY_SIZE ( ca - > usage ) ; i + + )
acc_u64s_percpu ( ( u64 * ) & ret , ( u64 __percpu * ) ca - > usage [ i ] , u64s ) ;
} while ( read_seqcount_retry ( & c - > usage_lock , seq ) ) ;
2019-02-14 18:38:52 -05:00
return ret ;
2017-03-16 22:18:50 -08:00
}
2019-02-10 19:34:47 -05:00
/*
 * Return this CPU's filesystem usage counters: the gc copy when @gc is set,
 * otherwise the buffer selected by @journal_seq & JOURNAL_BUF_MASK.
 */
static inline struct bch_fs_usage *fs_usage_ptr(struct bch_fs *c,
						unsigned journal_seq,
						bool gc)
{
	if (gc)
		return this_cpu_ptr(c->usage_gc);

	return this_cpu_ptr(c->usage[journal_seq & JOURNAL_BUF_MASK]);
}
/*
 * Read a single filesystem usage counter.
 *
 * @v must point at a u64 inside c->usage_base (enforced with BUG_ON); the
 * result is that base value plus the matching slot of every per-cpu buffer
 * in c->usage[].  mark_lock must be held by the caller.
 */
u64 bch2_fs_usage_read_one(struct bch_fs *c, u64 *v)
{
	ssize_t offset = v - (u64 *) c->usage_base;
	unsigned buf, seq;
	u64 total;

	BUG_ON(offset < 0 || offset >= fs_usage_u64s(c));
	percpu_rwsem_assert_held(&c->mark_lock);

	for (;;) {
		seq = read_seqcount_begin(&c->usage_lock);

		total = *v;
		for (buf = 0; buf < ARRAY_SIZE(c->usage); buf++)
			total += percpu_u64_get((u64 __percpu *) c->usage[buf] + offset);

		if (!read_seqcount_retry(&c->usage_lock, seq))
			break;
	}

	return total;
}
struct bch_fs_usage_online * bch2_fs_usage_read ( struct bch_fs * c )
{
struct bch_fs_usage_online * ret ;
2021-04-13 10:30:58 -04:00
unsigned seq , i , v , u64s = fs_usage_u64s ( c ) + 1 ;
2020-11-13 18:36:33 -05:00
retry :
ret = kmalloc ( u64s * sizeof ( u64 ) , GFP_NOFS ) ;
if ( unlikely ( ! ret ) )
return NULL ;
2019-01-21 15:32:13 -05:00
percpu_down_read ( & c - > mark_lock ) ;
2021-04-13 10:30:58 -04:00
v = fs_usage_u64s ( c ) + 1 ;
2020-11-13 18:36:33 -05:00
if ( unlikely ( u64s ! = v ) ) {
u64s = v ;
2019-01-21 15:32:13 -05:00
percpu_up_read ( & c - > mark_lock ) ;
2020-11-13 18:36:33 -05:00
kfree ( ret ) ;
goto retry ;
2019-01-21 15:32:13 -05:00
}
2019-02-10 19:34:47 -05:00
ret - > online_reserved = percpu_u64_get ( c - > online_reserved ) ;
do {
seq = read_seqcount_begin ( & c - > usage_lock ) ;
2021-03-28 20:56:25 -04:00
memcpy ( & ret - > u , c - > usage_base , u64s * sizeof ( u64 ) ) ;
2019-02-10 19:34:47 -05:00
for ( i = 0 ; i < ARRAY_SIZE ( c - > usage ) ; i + + )
acc_u64s_percpu ( ( u64 * ) & ret - > u , ( u64 __percpu * ) c - > usage [ i ] , u64s ) ;
} while ( read_seqcount_retry ( & c - > usage_lock , seq ) ) ;
2019-01-21 15:32:13 -05:00
return ret ;
2017-03-16 22:18:50 -08:00
}
2019-02-10 19:34:47 -05:00
void bch2_fs_usage_acc_to_base ( struct bch_fs * c , unsigned idx )
{
2021-01-21 21:52:06 -05:00
struct bch_dev * ca ;
unsigned i , u64s = fs_usage_u64s ( c ) ;
2019-02-10 19:34:47 -05:00
BUG_ON ( idx > = ARRAY_SIZE ( c - > usage ) ) ;
preempt_disable ( ) ;
write_seqcount_begin ( & c - > usage_lock ) ;
acc_u64s_percpu ( ( u64 * ) c - > usage_base ,
( u64 __percpu * ) c - > usage [ idx ] , u64s ) ;
percpu_memset ( c - > usage [ idx ] , 0 , u64s * sizeof ( u64 ) ) ;
2021-01-21 21:52:06 -05:00
rcu_read_lock ( ) ;
for_each_member_device_rcu ( ca , c , i , NULL ) {
u64s = dev_usage_u64s ( ) ;
acc_u64s_percpu ( ( u64 * ) ca - > usage_base ,
( u64 __percpu * ) ca - > usage [ idx ] , u64s ) ;
percpu_memset ( ca - > usage [ idx ] , 0 , u64s * sizeof ( u64 ) ) ;
}
rcu_read_unlock ( ) ;
2019-02-10 19:34:47 -05:00
write_seqcount_end ( & c - > usage_lock ) ;
preempt_enable ( ) ;
}
void bch2_fs_usage_to_text ( struct printbuf * out ,
struct bch_fs * c ,
struct bch_fs_usage_online * fs_usage )
{
unsigned i ;
pr_buf ( out , " capacity: \t \t \t %llu \n " , c - > capacity ) ;
pr_buf ( out , " hidden: \t \t \t \t %llu \n " ,
fs_usage - > u . hidden ) ;
pr_buf ( out , " data: \t \t \t \t %llu \n " ,
fs_usage - > u . data ) ;
pr_buf ( out , " cached: \t \t \t \t %llu \n " ,
fs_usage - > u . cached ) ;
pr_buf ( out , " reserved: \t \t \t %llu \n " ,
fs_usage - > u . reserved ) ;
pr_buf ( out , " nr_inodes: \t \t \t %llu \n " ,
fs_usage - > u . nr_inodes ) ;
pr_buf ( out , " online reserved: \t \t %llu \n " ,
fs_usage - > online_reserved ) ;
for ( i = 0 ;
i < ARRAY_SIZE ( fs_usage - > u . persistent_reserved ) ;
i + + ) {
pr_buf ( out , " %u replicas: \n " , i + 1 ) ;
pr_buf ( out , " \t reserved: \t \t %llu \n " ,
fs_usage - > u . persistent_reserved [ i ] ) ;
}
for ( i = 0 ; i < c - > replicas . nr ; i + + ) {
struct bch_replicas_entry * e =
cpu_replicas_entry ( & c - > replicas , i ) ;
pr_buf ( out , " \t " ) ;
bch2_replicas_entry_to_text ( out , e ) ;
pr_buf ( out , " : \t %llu \n " , fs_usage - > u . replicas [ i ] ) ;
}
}
2017-03-16 22:18:50 -08:00
#define RESERVE_FACTOR	6

/*
 * Pad a reservation of @r sectors: @r is rounded up to a multiple of
 * 2^RESERVE_FACTOR and 1/2^RESERVE_FACTOR of that rounded value is added on
 * top of the original @r.
 */
static u64 reserve_factor(u64 r)
{
	u64 rounded = round_up(r, (1 << RESERVE_FACTOR));

	return r + (rounded >> RESERVE_FACTOR);
}
/*
 * Scale @r by 2^RESERVE_FACTOR / (2^RESERVE_FACTOR + 1), rounding down.
 */
static u64 avail_factor(u64 r)
{
	u64 scaled = r << RESERVE_FACTOR;

	return div_u64(scaled, (1 << RESERVE_FACTOR) + 1);
}
2019-02-10 19:34:47 -05:00
u64 bch2_fs_sectors_used ( struct bch_fs * c , struct bch_fs_usage_online * fs_usage )
2017-03-16 22:18:50 -08:00
{
2019-02-10 19:34:47 -05:00
return min ( fs_usage - > u . hidden +
fs_usage - > u . btree +
fs_usage - > u . data +
reserve_factor ( fs_usage - > u . reserved +
2019-02-14 18:38:52 -05:00
fs_usage - > online_reserved ) ,
2019-01-21 15:32:13 -05:00
c - > capacity ) ;
2018-11-27 08:23:22 -05:00
}
2019-02-14 18:38:52 -05:00
static struct bch_fs_usage_short
__bch2_fs_usage_read_short ( struct bch_fs * c )
{
struct bch_fs_usage_short ret ;
u64 data , reserved ;
ret . capacity = c - > capacity -
2019-02-10 19:34:47 -05:00
bch2_fs_usage_read_one ( c , & c - > usage_base - > hidden ) ;
2019-02-14 18:38:52 -05:00
2019-02-10 19:34:47 -05:00
data = bch2_fs_usage_read_one ( c , & c - > usage_base - > data ) +
bch2_fs_usage_read_one ( c , & c - > usage_base - > btree ) ;
reserved = bch2_fs_usage_read_one ( c , & c - > usage_base - > reserved ) +
percpu_u64_get ( c - > online_reserved ) ;
2019-02-14 18:38:52 -05:00
ret . used = min ( ret . capacity , data + reserve_factor ( reserved ) ) ;
ret . free = ret . capacity - ret . used ;
2019-02-10 19:34:47 -05:00
ret . nr_inodes = bch2_fs_usage_read_one ( c , & c - > usage_base - > nr_inodes ) ;
2019-02-14 18:38:52 -05:00
return ret ;
}
2018-11-27 08:23:22 -05:00
struct bch_fs_usage_short
bch2_fs_usage_read_short ( struct bch_fs * c )
{
struct bch_fs_usage_short ret ;
2019-02-14 18:38:52 -05:00
percpu_down_read ( & c - > mark_lock ) ;
ret = __bch2_fs_usage_read_short ( c ) ;
percpu_up_read ( & c - > mark_lock ) ;
2018-11-27 08:23:22 -05:00
return ret ;
2017-03-16 22:18:50 -08:00
}
/* Returns 1 when is_available_bucket() rejects @m, 0 otherwise. */
static inline int is_unavailable_bucket(struct bucket_mark m)
{
	return is_available_bucket(m) ? 0 : 1;
}
2021-01-21 20:51:51 -05:00
static inline int bucket_sectors_fragmented ( struct bch_dev * ca ,
struct bucket_mark m )
2017-03-16 22:18:50 -08:00
{
2021-01-21 20:51:51 -05:00
return bucket_sectors_used ( m )
? max ( 0 , ( int ) ca - > mi . bucket_size - ( int ) bucket_sectors_used ( m ) )
: 0 ;
2017-03-16 22:18:50 -08:00
}
2020-07-09 18:31:51 -04:00
static inline int is_stripe_data_bucket ( struct bucket_mark m )
{
return m . stripe & & m . data_type ! = BCH_DATA_parity ;
}
2017-03-16 22:18:50 -08:00
static inline enum bch_data_type bucket_type ( struct bucket_mark m )
{
return m . cached_sectors & & ! m . dirty_sectors
2020-07-09 18:28:11 -04:00
? BCH_DATA_cached
2017-03-16 22:18:50 -08:00
: m . data_type ;
}
2018-07-23 05:32:01 -04:00
static bool bucket_became_unavailable ( struct bucket_mark old ,
2017-03-16 22:18:50 -08:00
struct bucket_mark new )
{
return is_available_bucket ( old ) & &
2018-07-23 05:32:01 -04:00
! is_available_bucket ( new ) ;
2017-03-16 22:18:50 -08:00
}
2018-12-01 11:32:12 -05:00
/*
 * Account @nr buckets of @type against @dev_usage.  Superblock and journal
 * buckets additionally add @size to the filesystem's hidden counter.
 */
static inline void account_bucket(struct bch_fs_usage *fs_usage,
				  struct bch_dev_usage *dev_usage,
				  enum bch_data_type type,
				  int nr, s64 size)
{
	switch (type) {
	case BCH_DATA_sb:
	case BCH_DATA_journal:
		fs_usage->hidden += size;
		break;
	default:
		break;
	}

	dev_usage->d[type].buckets += nr;
}
2017-03-16 22:18:50 -08:00
static void bch2_dev_usage_update ( struct bch_fs * c , struct bch_dev * ca ,
2018-07-23 05:32:01 -04:00
struct bch_fs_usage * fs_usage ,
struct bucket_mark old , struct bucket_mark new ,
2021-01-21 21:52:06 -05:00
u64 journal_seq , bool gc )
2017-03-16 22:18:50 -08:00
{
2020-06-18 21:06:42 -04:00
struct bch_dev_usage * u ;
2017-03-16 22:18:50 -08:00
2018-11-26 00:13:33 -05:00
percpu_rwsem_assert_held ( & c - > mark_lock ) ;
2017-03-16 22:18:50 -08:00
preempt_disable ( ) ;
2021-04-03 20:29:05 -04:00
if ( ! fs_usage )
fs_usage = fs_usage_ptr ( c , journal_seq , gc ) ;
2021-01-21 21:52:06 -05:00
u = dev_usage_ptr ( ca , journal_seq , gc ) ;
2017-03-16 22:18:50 -08:00
2018-12-01 11:32:12 -05:00
if ( bucket_type ( old ) )
2020-06-18 21:06:42 -04:00
account_bucket ( fs_usage , u , bucket_type ( old ) ,
2018-12-01 11:32:12 -05:00
- 1 , - ca - > mi . bucket_size ) ;
2018-11-24 17:09:44 -05:00
2018-12-01 11:32:12 -05:00
if ( bucket_type ( new ) )
2020-06-18 21:06:42 -04:00
account_bucket ( fs_usage , u , bucket_type ( new ) ,
2018-12-01 11:32:12 -05:00
1 , ca - > mi . bucket_size ) ;
2017-03-16 22:18:50 -08:00
2020-06-18 21:06:42 -04:00
u - > buckets_unavailable + =
2017-03-16 22:18:50 -08:00
is_unavailable_bucket ( new ) - is_unavailable_bucket ( old ) ;
2021-01-21 20:51:51 -05:00
u - > d [ old . data_type ] . sectors - = old . dirty_sectors ;
u - > d [ new . data_type ] . sectors + = new . dirty_sectors ;
u - > d [ BCH_DATA_cached ] . sectors + =
2017-03-16 22:18:50 -08:00
( int ) new . cached_sectors - ( int ) old . cached_sectors ;
2021-01-21 20:51:51 -05:00
u - > d [ old . data_type ] . fragmented - = bucket_sectors_fragmented ( ca , old ) ;
u - > d [ new . data_type ] . fragmented + = bucket_sectors_fragmented ( ca , new ) ;
2017-03-16 22:18:50 -08:00
preempt_enable ( ) ;
if ( ! is_available_bucket ( old ) & & is_available_bucket ( new ) )
bch2_wake_allocator ( ca ) ;
}
2021-04-03 20:29:05 -04:00
/*
 * Add @sectors to the counter for replicas entry @r and to the summary
 * counter for its data type.  @r must already have an index in the
 * filesystem's replicas table; a missing entry is a BUG.
 */
static inline void update_replicas(struct bch_fs *c,
				   struct bch_fs_usage *fs_usage,
				   struct bch_replicas_entry *r,
				   s64 sectors)
{
	int slot = bch2_replicas_entry_idx(c, r);

	BUG_ON(slot < 0);

	fs_usage->replicas[slot] += sectors;
	fs_usage_data_type_to_base(fs_usage, r->data_type, sectors);
}
/*
 * Add @sectors to the usage counters of the "cached" replicas entry built
 * for device @dev.
 */
static inline void update_cached_sectors(struct bch_fs *c,
					 struct bch_fs_usage *fs_usage,
					 unsigned dev, s64 sectors)
{
	struct bch_replicas_padded cached;

	bch2_replicas_entry_cached(&cached.e, dev);

	update_replicas(c, fs_usage, &cached.e, sectors);
}
2019-05-24 11:56:20 -04:00
static struct replicas_delta_list *
replicas_deltas_realloc ( struct btree_trans * trans , unsigned more )
{
struct replicas_delta_list * d = trans - > fs_usage_deltas ;
unsigned new_size = d ? ( d - > size + more ) * 2 : 128 ;
2021-04-24 00:24:25 -04:00
unsigned alloc_size = sizeof ( * d ) + new_size ;
WARN_ON_ONCE ( alloc_size > REPLICAS_DELTA_LIST_MAX ) ;
2019-05-24 11:56:20 -04:00
if ( ! d | | d - > used + more > d - > size ) {
2021-04-24 00:24:25 -04:00
d = krealloc ( d , alloc_size , GFP_NOIO | __GFP_ZERO ) ;
BUG_ON ( ! d & & alloc_size > REPLICAS_DELTA_LIST_MAX ) ;
if ( ! d ) {
d = mempool_alloc ( & trans - > c - > replicas_delta_pool , GFP_NOIO ) ;
memset ( d , 0 , REPLICAS_DELTA_LIST_MAX ) ;
if ( trans - > fs_usage_deltas )
memcpy ( d , trans - > fs_usage_deltas ,
trans - > fs_usage_deltas - > size + sizeof ( * d ) ) ;
new_size = REPLICAS_DELTA_LIST_MAX - sizeof ( * d ) ;
kfree ( trans - > fs_usage_deltas ) ;
}
2019-05-24 11:56:20 -04:00
d - > size = new_size ;
trans - > fs_usage_deltas = d ;
}
return d ;
}
/*
 * Append a (delta, replicas entry) record for @r to @trans's replicas delta
 * list, growing the list if needed.  The copied entry is sorted in place.
 * A zero @sectors delta is dropped without touching the list.
 */
static inline void update_replicas_list(struct btree_trans *trans,
					struct bch_replicas_entry *r,
					s64 sectors)
{
	struct replicas_delta_list *list;
	struct replicas_delta *rec;
	unsigned rec_bytes;

	if (!sectors)
		return;

	/*
	 * NOTE(review): the extra 8 bytes presumably cover the delta field
	 * that precedes the entry in struct replicas_delta - confirm against
	 * the struct definition.
	 */
	rec_bytes = replicas_entry_bytes(r) + 8;

	list = replicas_deltas_realloc(trans, rec_bytes);
	rec = (void *) list->d + list->used;

	rec->delta = sectors;
	memcpy((void *) rec + offsetof(struct replicas_delta, r),
	       r, replicas_entry_bytes(r));
	bch2_replicas_entry_sort(&rec->r);

	list->used += rec_bytes;
}
/*
 * Queue a @sectors delta for the "cached" replicas entry of device @dev on
 * @trans's replicas delta list.
 */
static inline void update_cached_sectors_list(struct btree_trans *trans,
					      unsigned dev, s64 sectors)
{
	struct bch_replicas_padded cached;

	bch2_replicas_entry_cached(&cached.e, dev);

	update_replicas_list(trans, &cached.e, sectors);
}
2019-02-12 15:03:47 -05:00
/*
 * Run mark function @fn against the regular bucket state, the gc bucket
 * state, or both, and evaluate to its result.
 *
 * @fn is called as fn(c, <varargs>, gc) for gc = 0 and then gc = 1:
 *  - the pass whose gc value matches whether BTREE_TRIGGER_GC is set in
 *    @flags always runs;
 *  - the gc = 1 pass also runs when gc_visited(c, pos) is true.
 * Iteration stops at the first nonzero return, which becomes the value of
 * the whole expression (0 otherwise).
 *
 * mark_lock must be held.  @c and the variadic arguments may be evaluated
 * more than once, so they must be free of side effects.
 *
 * Macro arguments are parenthesized and the internal variables carry a
 * leading underscore so that expressions such as "a | b" for @flags, or
 * caller variables named gc/ret, expand correctly.
 */
#define do_mark_fn(fn, c, pos, flags, ...)				\
({									\
	int _gc, _ret = 0;						\
									\
	percpu_rwsem_assert_held(&(c)->mark_lock);			\
									\
	for (_gc = 0; _gc < 2 && !_ret; _gc++)				\
		if (!_gc == !((flags) & BTREE_TRIGGER_GC) ||		\
		    (_gc && gc_visited(c, pos)))			\
			_ret = fn(c, __VA_ARGS__, _gc);			\
	_ret;								\
})
/*
 * Set the owned_by_allocator bit of bucket @b on @ca (gc copy when @gc).
 * Outside of gc, clearing the bit on a bucket that did not have it set is a
 * BUG.  Always returns 0.
 */
static int __bch2_mark_alloc_bucket(struct bch_fs *c, struct bch_dev *ca,
				    size_t b, bool owned_by_allocator,
				    bool gc)
{
	struct bucket *g = __bucket(ca, b, gc);
	struct bucket_mark prev, new;

	prev = bucket_cmpxchg(g, new, ({
		new.owned_by_allocator	= owned_by_allocator;
	}));

	BUG_ON(!(gc || owned_by_allocator || prev.owned_by_allocator));

	return 0;
}
/*
 * Mark bucket @b on @ca as owned (or no longer owned) by the allocator,
 * dispatching through do_mark_fn() so the regular and/or gc bucket state is
 * updated according to @flags and @pos.  Runs with preemption disabled; the
 * result of the mark function is discarded.
 */
void bch2_mark_alloc_bucket(struct bch_fs *c, struct bch_dev *ca,
			    size_t b, bool owned_by_allocator,
			    struct gc_pos pos, unsigned flags)
{
	preempt_disable();

	do_mark_fn(__bch2_mark_alloc_bucket, c, pos, flags,
		   ca, b, owned_by_allocator);

	preempt_enable();
}
2020-07-06 19:16:25 -04:00
static int bch2_mark_alloc ( struct bch_fs * c ,
struct bkey_s_c old , struct bkey_s_c new ,
2019-02-13 14:46:32 -05:00
struct bch_fs_usage * fs_usage ,
2019-05-24 11:56:20 -04:00
u64 journal_seq , unsigned flags )
2019-02-13 14:46:32 -05:00
{
2019-12-31 16:17:42 -05:00
bool gc = flags & BTREE_TRIGGER_GC ;
2019-02-13 14:46:32 -05:00
struct bkey_alloc_unpacked u ;
struct bch_dev * ca ;
struct bucket * g ;
2020-07-06 19:16:25 -04:00
struct bucket_mark old_m , m ;
/* We don't do anything for deletions - do we?: */
2021-01-22 18:01:07 -05:00
if ( new . k - > type ! = KEY_TYPE_alloc & &
new . k - > type ! = KEY_TYPE_alloc_v2 )
2020-07-06 19:16:25 -04:00
return 0 ;
2019-02-13 14:46:32 -05:00
/*
* alloc btree is read in by bch2_alloc_read , not gc :
*/
2019-12-31 16:17:42 -05:00
if ( ( flags & BTREE_TRIGGER_GC ) & &
! ( flags & BTREE_TRIGGER_BUCKET_INVALIDATE ) )
2019-02-13 14:46:32 -05:00
return 0 ;
2020-07-06 19:16:25 -04:00
ca = bch_dev_bkey_exists ( c , new . k - > p . inode ) ;
2019-04-17 18:14:46 -04:00
2020-07-06 19:16:25 -04:00
if ( new . k - > p . offset > = ca - > mi . nbuckets )
2019-04-17 18:14:46 -04:00
return 0 ;
2020-07-06 19:16:25 -04:00
g = __bucket ( ca , new . k - > p . offset , gc ) ;
u = bch2_alloc_unpack ( new ) ;
2019-02-13 14:46:32 -05:00
2020-07-06 19:16:25 -04:00
old_m = bucket_cmpxchg ( g , m , ( {
2019-02-13 14:46:32 -05:00
m . gen = u . gen ;
m . data_type = u . data_type ;
m . dirty_sectors = u . dirty_sectors ;
m . cached_sectors = u . cached_sectors ;
2021-01-22 18:01:07 -05:00
m . stripe = u . stripe ! = 0 ;
2019-03-11 14:59:58 -04:00
2019-05-24 11:56:20 -04:00
if ( journal_seq ) {
2019-03-11 14:59:58 -04:00
m . journal_seq_valid = 1 ;
m . journal_seq = journal_seq ;
}
2019-02-13 14:46:32 -05:00
} ) ) ;
2021-01-21 21:52:06 -05:00
bch2_dev_usage_update ( c , ca , fs_usage , old_m , m , journal_seq , gc ) ;
2019-05-14 14:37:11 -04:00
2019-02-13 14:46:32 -05:00
g - > io_time [ READ ] = u . read_time ;
g - > io_time [ WRITE ] = u . write_time ;
g - > oldest_gen = u . oldest_gen ;
g - > gen_valid = 1 ;
2021-01-22 18:01:07 -05:00
g - > stripe = u . stripe ;
g - > stripe_redundancy = u . stripe_redundancy ;
2019-02-13 14:46:32 -05:00
2019-03-11 14:59:58 -04:00
/*
* need to know if we ' re getting called from the invalidate path or
* not :
*/
2019-12-31 16:17:42 -05:00
if ( ( flags & BTREE_TRIGGER_BUCKET_INVALIDATE ) & &
2020-07-06 19:16:25 -04:00
old_m . cached_sectors ) {
2019-02-13 14:46:32 -05:00
update_cached_sectors ( c , fs_usage , ca - > dev_idx ,
2020-07-06 19:16:25 -04:00
- old_m . cached_sectors ) ;
trace_invalidate ( ca , bucket_to_sector ( ca , new . k - > p . offset ) ,
old_m . cached_sectors ) ;
2019-02-13 14:46:32 -05:00
}
return 0 ;
}
2018-07-22 06:10:52 -04:00
/*
 * Saturating add for 16 bit sector counters: stores min(a + b, U16_MAX)
 * into @a and evaluates to true if the sum had to be clamped.
 * @a is evaluated twice.
 */
#define checked_add(a, b)					\
({								\
	unsigned _sum = (unsigned) (a) + (b);			\
	bool _clamped = _sum > U16_MAX;				\
								\
	if (_clamped)						\
		_sum = U16_MAX;					\
	(a) = _sum;						\
	_clamped;						\
})
2017-03-16 22:18:50 -08:00
2019-02-12 15:03:47 -05:00
static int __bch2_mark_metadata_bucket ( struct bch_fs * c , struct bch_dev * ca ,
2020-05-24 14:20:00 -04:00
size_t b , enum bch_data_type data_type ,
2019-02-12 15:03:47 -05:00
unsigned sectors , bool gc )
2018-07-23 05:32:01 -04:00
{
struct bucket * g = __bucket ( ca , b , gc ) ;
2019-03-07 16:33:56 -05:00
struct bucket_mark old , new ;
bool overflow ;
2018-07-23 05:32:01 -04:00
2020-07-09 18:28:11 -04:00
BUG_ON ( data_type ! = BCH_DATA_sb & &
data_type ! = BCH_DATA_journal ) ;
2018-07-23 05:32:01 -04:00
2019-03-07 16:33:56 -05:00
old = bucket_cmpxchg ( g , new , ( {
2020-05-24 14:20:00 -04:00
new . data_type = data_type ;
2019-03-07 16:33:56 -05:00
overflow = checked_add ( new . dirty_sectors , sectors ) ;
2018-07-23 05:32:01 -04:00
} ) ) ;
2019-02-12 15:03:47 -05:00
2019-08-29 11:34:01 -04:00
bch2_fs_inconsistent_on ( old . data_type & &
2020-05-24 14:20:00 -04:00
old . data_type ! = data_type , c ,
2019-08-29 11:34:01 -04:00
" different types of data in same bucket: %s, %s " ,
bch2_data_types [ old . data_type ] ,
2020-05-24 14:20:00 -04:00
bch2_data_types [ data_type ] ) ;
2019-08-29 11:34:01 -04:00
2019-03-07 16:33:56 -05:00
bch2_fs_inconsistent_on ( overflow , c ,
2020-05-24 14:20:00 -04:00
" bucket %u:%zu gen %u data type %s sector count overflow: %u + %u > U16_MAX " ,
ca - > dev_idx , b , new . gen ,
bch2_data_types [ old . data_type ? : data_type ] ,
2019-03-07 16:33:56 -05:00
old . dirty_sectors , sectors ) ;
if ( c )
2019-02-10 19:34:47 -05:00
bch2_dev_usage_update ( c , ca , fs_usage_ptr ( c , 0 , gc ) ,
2021-01-21 21:52:06 -05:00
old , new , 0 , gc ) ;
2019-03-07 16:33:56 -05:00
2019-02-12 15:03:47 -05:00
return 0 ;
2018-07-23 05:32:01 -04:00
}
2017-03-16 22:18:50 -08:00
/*
 * Mark @sectors of superblock or journal data in bucket @b on @ca; any other
 * @type is a BUG.
 *
 * With a filesystem (@c non-NULL) the update goes through do_mark_fn() so
 * the regular and/or gc bucket state is updated according to @flags and
 * @pos; with @c == NULL only the regular bucket state is updated.  Runs with
 * preemption disabled.
 */
void bch2_mark_metadata_bucket(struct bch_fs *c, struct bch_dev *ca,
			       size_t b, enum bch_data_type type,
			       unsigned sectors, struct gc_pos pos,
			       unsigned flags)
{
	BUG_ON(!(type == BCH_DATA_sb ||
		 type == BCH_DATA_journal));

	preempt_disable();

	if (likely(c))
		do_mark_fn(__bch2_mark_metadata_bucket, c, pos, flags,
			   ca, b, type, sectors);
	else
		__bch2_mark_metadata_bucket(c, ca, b, type, sectors, 0);

	preempt_enable();
}
2019-10-07 15:57:47 -04:00
/*
 * Scale @sectors by the ratio @n / @d, rounding up.  The multiplication is
 * done in unsigned arithmetic before the result is widened to s64.
 */
static s64 disk_sectors_scaled(unsigned n, unsigned d, unsigned sectors)
{
	unsigned product = sectors * n;

	return DIV_ROUND_UP(product, d);
}
/*
 * Compute the change in on-disk sectors for a change of @delta sectors to an
 * extent of @old_size sectors, where sizes are scaled by @n / @d (both must
 * be nonzero):
 *
 *  - BTREE_TRIGGER_OVERWRITE_SPLIT: the extent is replaced by two pieces,
 *    [0, @offset) and the remainder shrunk by -@delta; the result is the
 *    scaled size of both pieces minus the scaled old size.
 *  - BTREE_TRIGGER_OVERWRITE: the extent shrinks to @old_size + @delta.
 *  - otherwise: simply the scaled @delta.
 *
 * Because each piece is rounded up separately, the result is not
 * necessarily the scaled value of @delta itself.
 */
static s64 __ptr_disk_sectors_delta(unsigned old_size,
				    unsigned offset, s64 delta,
				    unsigned flags,
				    unsigned n, unsigned d)
{
	BUG_ON(!n || !d);

	if (flags & BTREE_TRIGGER_OVERWRITE_SPLIT) {
		BUG_ON(offset + -delta > old_size);

		return -disk_sectors_scaled(n, d, old_size) +
			disk_sectors_scaled(n, d, offset) +
			disk_sectors_scaled(n, d, old_size - offset + delta);
	}

	if (flags & BTREE_TRIGGER_OVERWRITE) {
		BUG_ON(offset + -delta > old_size);

		return -disk_sectors_scaled(n, d, old_size) +
			disk_sectors_scaled(n, d, old_size + delta);
	}

	return disk_sectors_scaled(n, d, delta);
}
2019-10-07 15:57:47 -04:00
/*
 * On-disk sector delta for decoded pointer @p: __ptr_disk_sectors_delta()
 * applied to the pointer's live size, scaled by its
 * compressed_size / uncompressed_size ratio.
 */
static s64 ptr_disk_sectors_delta(struct extent_ptr_decoded p,
				  unsigned offset, s64 delta,
				  unsigned flags)
{
	unsigned live_size	= p.crc.live_size;
	unsigned compressed	= p.crc.compressed_size;
	unsigned uncompressed	= p.crc.uncompressed_size;

	return __ptr_disk_sectors_delta(live_size, offset, delta, flags,
					compressed, uncompressed);
}
2020-10-19 22:36:24 -04:00
/*
 * Validate pointer @ptr (from key @k) against the state of the bucket it
 * points into, before @sectors are added to that bucket.
 *
 * Returns:
 *   0     the reference is consistent and may be applied
 *   1     the pointer's gen differs from the bucket's and the pointer is
 *         cached (stale cached pointer)
 *   -EIO  an inconsistency was found and reported through bch2_fsck_err():
 *         pointer gen newer than the bucket gen, pointer gen more than
 *         BUCKET_GC_GEN_MAX behind, stale dirty pointer, mismatching data
 *         types, or the resulting sector count not fitting in 16 bits.
 */
static int check_bucket_ref(struct bch_fs *c, struct bkey_s_c k,
			    const struct bch_extent_ptr *ptr,
			    s64 sectors, enum bch_data_type ptr_data_type,
			    u8 bucket_gen, u8 bucket_data_type,
			    u16 dirty_sectors, u16 cached_sectors)
{
	size_t bucket_nr = PTR_BUCKET_NR(bch_dev_bkey_exists(c, ptr->dev), ptr);
	/* The counter this pointer contributes to */
	u16 bucket_sectors = ptr->cached
		? cached_sectors
		: dirty_sectors;
	char buf[200];

	if (gen_after(ptr->gen, bucket_gen)) {
		bch2_fsck_err(c, FSCK_CAN_IGNORE|FSCK_NEED_FSCK,
			" bucket %u:%zu gen %u data type %s: ptr gen %u newer than bucket gen \n "
			" while marking %s ",
			ptr->dev, bucket_nr, bucket_gen,
			bch2_data_types[bucket_data_type ?: ptr_data_type],
			ptr->gen,
			(bch2_bkey_val_to_text(&PBUF(buf), c, k), buf));
		return -EIO;
	}

	if (gen_cmp(bucket_gen, ptr->gen) > BUCKET_GC_GEN_MAX) {
		bch2_fsck_err(c, FSCK_CAN_IGNORE|FSCK_NEED_FSCK,
			" bucket %u:%zu gen %u data type %s: ptr gen %u too stale \n "
			" while marking %s ",
			ptr->dev, bucket_nr, bucket_gen,
			bch2_data_types[bucket_data_type ?: ptr_data_type],
			ptr->gen,
			(bch2_bkey_val_to_text(&PBUF(buf), c, k), buf));
		return -EIO;
	}

	if (bucket_gen != ptr->gen) {
		/* A stale cached pointer is fine; a stale dirty one is not */
		if (ptr->cached)
			return 1;

		bch2_fsck_err(c, FSCK_CAN_IGNORE|FSCK_NEED_FSCK,
			" bucket %u:%zu gen %u data type %s: stale dirty ptr (gen %u) \n "
			" while marking %s ",
			ptr->dev, bucket_nr, bucket_gen,
			bch2_data_types[bucket_data_type ?: ptr_data_type],
			ptr->gen,
			(bch2_bkey_val_to_text(&PBUF(buf), c, k), buf));
		return -EIO;
	}

	if (bucket_data_type && ptr_data_type &&
	    bucket_data_type != ptr_data_type) {
		bch2_fsck_err(c, FSCK_CAN_IGNORE|FSCK_NEED_FSCK,
			" bucket %u:%zu gen %u different types of data in same bucket: %s, %s \n "
			" while marking %s ",
			ptr->dev, bucket_nr, bucket_gen,
			bch2_data_types[bucket_data_type],
			bch2_data_types[ptr_data_type],
			(bch2_bkey_val_to_text(&PBUF(buf), c, k), buf));
		return -EIO;
	}

	/* The cast makes a negative (underflowed) sum fail this check too */
	if ((unsigned) (bucket_sectors + sectors) > U16_MAX) {
		bch2_fsck_err(c, FSCK_CAN_IGNORE|FSCK_NEED_FSCK,
			" bucket %u:%zu gen %u data type %s sector count overflow: %u + %lli > U16_MAX \n "
			" while marking %s ",
			ptr->dev, bucket_nr, bucket_gen,
			bch2_data_types[bucket_data_type ?: ptr_data_type],
			bucket_sectors, sectors,
			(bch2_bkey_val_to_text(&PBUF(buf), c, k), buf));
		return -EIO;
	}

	return 0;
}
2021-01-22 18:01:07 -05:00
static int mark_stripe_bucket ( struct bch_fs * c , struct bkey_s_c k ,
2020-07-09 18:31:51 -04:00
unsigned ptr_idx ,
2020-10-19 22:36:24 -04:00
struct bch_fs_usage * fs_usage ,
2021-01-22 18:01:07 -05:00
u64 journal_seq , unsigned flags )
2020-10-19 22:36:24 -04:00
{
2020-07-09 18:31:51 -04:00
const struct bch_stripe * s = bkey_s_c_to_stripe ( k ) . v ;
unsigned nr_data = s - > nr_blocks - s - > nr_redundant ;
bool parity = ptr_idx > = nr_data ;
const struct bch_extent_ptr * ptr = s - > ptrs + ptr_idx ;
2020-10-19 22:36:24 -04:00
bool gc = flags & BTREE_TRIGGER_GC ;
struct bch_dev * ca = bch_dev_bkey_exists ( c , ptr - > dev ) ;
struct bucket * g = PTR_BUCKET ( ca , ptr , gc ) ;
struct bucket_mark new , old ;
char buf [ 200 ] ;
int ret ;
2021-01-22 18:01:07 -05:00
if ( g - > stripe & & g - > stripe ! = k . k - > p . offset ) {
bch2_fs_inconsistent ( c ,
" bucket %u:%zu gen %u: multiple stripes using same bucket \n %s " ,
2021-04-04 22:38:07 -04:00
ptr - > dev , PTR_BUCKET_NR ( ca , ptr ) , g - > mark . gen ,
2021-01-22 18:01:07 -05:00
( bch2_bkey_val_to_text ( & PBUF ( buf ) , c , k ) , buf ) ) ;
return - EINVAL ;
}
2020-07-22 23:11:48 -04:00
2020-10-19 22:36:24 -04:00
old = bucket_cmpxchg ( g , new , ( {
ret = check_bucket_ref ( c , k , ptr , 0 , 0 , new . gen , new . data_type ,
new . dirty_sectors , new . cached_sectors ) ;
if ( ret )
return ret ;
2021-01-22 18:01:07 -05:00
if ( parity ) {
new . data_type = BCH_DATA_parity ;
new . dirty_sectors = le16_to_cpu ( s - > sectors ) ;
2020-07-09 18:31:51 -04:00
}
2020-10-19 22:36:24 -04:00
if ( journal_seq ) {
new . journal_seq_valid = 1 ;
new . journal_seq = journal_seq ;
}
} ) ) ;
2021-01-22 18:01:07 -05:00
g - > stripe = k . k - > p . offset ;
g - > stripe_redundancy = s - > nr_redundant ;
2020-07-22 23:11:48 -04:00
2021-01-21 21:52:06 -05:00
bch2_dev_usage_update ( c , ca , fs_usage , old , new , journal_seq , gc ) ;
2020-10-19 22:36:24 -04:00
return 0 ;
}
/*
 * Apply a sector delta for @ptr to a bucket's counters.
 *
 * check_bucket_ref() is called with the current counter values; a nonzero
 * result is returned without touching anything.  Otherwise @sectors is added
 * to *@cached_sectors for a cached pointer or *@dirty_sectors for any other
 * pointer, and *@bucket_data_type becomes @ptr_data_type while either
 * counter is nonzero, or 0 once both are zero.  Returns 0 on success.
 */
static int __mark_pointer(struct bch_fs *c, struct bkey_s_c k,
			  const struct bch_extent_ptr *ptr,
			  s64 sectors, enum bch_data_type ptr_data_type,
			  u8 bucket_gen, u8 *bucket_data_type,
			  u16 *dirty_sectors, u16 *cached_sectors)
{
	u16 *counter;
	int ret;

	ret = check_bucket_ref(c, k, ptr, sectors, ptr_data_type,
			       bucket_gen, *bucket_data_type,
			       *dirty_sectors, *cached_sectors);
	if (ret)
		return ret;

	counter = ptr->cached ? cached_sectors : dirty_sectors;
	*counter += sectors;

	if (*dirty_sectors || *cached_sectors)
		*bucket_data_type = ptr_data_type;
	else
		*bucket_data_type = 0;

	return 0;
}
/*
 * Account @sectors of @data_type against the in-memory bucket that the
 * decoded pointer @p refers to.
 *
 * The 64-bit bucket mark is read, modified by __mark_pointer() and written
 * back with atomic64_cmpxchg(), retrying until the exchange succeeds.  With
 * BTREE_TRIGGER_NOATOMIC the new mark is stored directly instead.  Any
 * nonzero result from __mark_pointer() is returned unchanged and nothing is
 * written.  After a successful update device usage is refreshed and 0 is
 * returned.
 */
static int bch2_mark_pointer(struct bch_fs *c, struct bkey_s_c k,
			     struct extent_ptr_decoded p,
			     s64 sectors, enum bch_data_type data_type,
			     struct bch_fs_usage *fs_usage,
			     u64 journal_seq, unsigned flags)
{
	bool gc = flags & BTREE_TRIGGER_GC;
	struct bch_dev *ca = bch_dev_bkey_exists(c, p.ptr.dev);
	struct bucket *g = PTR_BUCKET(ca, &p.ptr, gc);
	struct bucket_mark old, new;
	u64 seen = atomic64_read(&g->_mark.v);

	for (;;) {
		u8 type;
		int ret;

		/* Start both copies from the value we last observed */
		old.v.counter = seen;
		new.v.counter = seen;

		type = new.data_type;

		ret = __mark_pointer(c, k, &p.ptr, sectors, data_type,
				     new.gen, &type,
				     &new.dirty_sectors,
				     &new.cached_sectors);
		if (ret)
			return ret;

		new.data_type = type;

		if (journal_seq) {
			new.journal_seq_valid	= 1;
			new.journal_seq		= journal_seq;
		}

		if (flags & BTREE_TRIGGER_NOATOMIC) {
			g->_mark = new;
			break;
		}

		seen = atomic64_cmpxchg(&g->_mark.v,
					old.v.counter,
					new.v.counter);
		if (seen == old.v.counter)
			break;
	}

	bch2_dev_usage_update(c, ca, fs_usage, old, new, journal_seq, gc);

	BUG_ON(!gc && bucket_became_unavailable(old, new));

	return 0;
}
2018-11-24 17:09:44 -05:00
static int bch2_mark_stripe_ptr ( struct bch_fs * c ,
struct bch_extent_stripe_ptr p ,
2019-01-21 15:32:13 -05:00
enum bch_data_type data_type ,
struct bch_fs_usage * fs_usage ,
2020-07-09 18:31:51 -04:00
s64 sectors , unsigned flags )
2018-11-01 15:13:19 -04:00
{
2019-12-31 16:17:42 -05:00
bool gc = flags & BTREE_TRIGGER_GC ;
2020-07-09 18:31:51 -04:00
struct bch_replicas_padded r ;
2018-11-24 17:09:44 -05:00
struct stripe * m ;
2020-07-06 20:18:13 -04:00
unsigned i , blocks_nonempty = 0 ;
2018-11-25 20:53:51 -05:00
2018-11-24 17:09:44 -05:00
m = genradix_ptr ( & c - > stripes [ gc ] , p . idx ) ;
2018-11-01 15:13:19 -04:00
2018-11-25 20:53:51 -05:00
spin_lock ( & c - > ec_stripes_heap_lock ) ;
2018-11-24 17:09:44 -05:00
if ( ! m | | ! m - > alive ) {
2018-11-25 20:53:51 -05:00
spin_unlock ( & c - > ec_stripes_heap_lock ) ;
2018-11-24 17:09:44 -05:00
bch_err_ratelimited ( c , " pointer to nonexistent stripe %llu " ,
( u64 ) p . idx ) ;
2019-08-16 09:59:56 -04:00
return - EIO ;
2018-11-24 17:09:44 -05:00
}
2018-11-01 15:13:19 -04:00
2018-11-25 20:53:51 -05:00
m - > block_sectors [ p . block ] + = sectors ;
2018-11-01 15:13:19 -04:00
2020-07-09 18:31:51 -04:00
r = m - > r ;
2020-07-06 20:18:13 -04:00
for ( i = 0 ; i < m - > nr_blocks ; i + + )
blocks_nonempty + = m - > block_sectors [ i ] ! = 0 ;
2018-11-01 15:13:19 -04:00
2020-07-06 20:18:13 -04:00
if ( m - > blocks_nonempty ! = blocks_nonempty ) {
m - > blocks_nonempty = blocks_nonempty ;
2018-11-25 20:53:51 -05:00
if ( ! gc )
bch2_stripes_heap_update ( c , m , p . idx ) ;
}
2018-11-01 15:13:19 -04:00
2018-11-25 20:53:51 -05:00
spin_unlock ( & c - > ec_stripes_heap_lock ) ;
2018-11-24 17:09:44 -05:00
2020-07-09 18:31:51 -04:00
r . e . data_type = data_type ;
update_replicas ( c , fs_usage , & r . e , sectors ) ;
2018-11-24 17:09:44 -05:00
return 0 ;
2018-11-01 15:13:19 -04:00
}
2020-07-06 19:16:25 -04:00
static int bch2_mark_extent ( struct bch_fs * c ,
struct bkey_s_c old , struct bkey_s_c new ,
2019-08-09 13:01:10 -04:00
unsigned offset , s64 sectors ,
enum bch_data_type data_type ,
2018-11-27 08:23:22 -05:00
struct bch_fs_usage * fs_usage ,
2019-05-24 11:56:20 -04:00
unsigned journal_seq , unsigned flags )
2017-03-16 22:18:50 -08:00
{
2020-07-06 19:16:25 -04:00
struct bkey_s_c k = flags & BTREE_TRIGGER_INSERT ? new : old ;
2018-11-01 15:10:01 -04:00
struct bkey_ptrs_c ptrs = bch2_bkey_ptrs_c ( k ) ;
const union bch_extent_entry * entry ;
struct extent_ptr_decoded p ;
2019-01-21 15:32:13 -05:00
struct bch_replicas_padded r ;
s64 dirty_sectors = 0 ;
2020-06-03 18:27:07 -04:00
bool stale ;
2018-11-01 15:10:01 -04:00
int ret ;
2019-01-21 15:32:13 -05:00
r . e . data_type = data_type ;
r . e . nr_devs = 0 ;
r . e . nr_required = 1 ;
2018-11-01 15:21:48 -04:00
BUG_ON ( ! sectors ) ;
2018-11-01 15:10:01 -04:00
bkey_for_each_ptr_decode ( k . k , ptrs , p , entry ) {
2020-07-09 18:28:11 -04:00
s64 disk_sectors = data_type = = BCH_DATA_btree
2018-12-06 11:52:58 -05:00
? sectors
2019-08-09 13:01:10 -04:00
: ptr_disk_sectors_delta ( p , offset , sectors , flags ) ;
2020-06-03 18:27:07 -04:00
ret = bch2_mark_pointer ( c , k , p , disk_sectors , data_type ,
fs_usage , journal_seq , flags ) ;
if ( ret < 0 )
return ret ;
stale = ret > 0 ;
2018-11-05 02:31:48 -05:00
2019-01-21 15:32:13 -05:00
if ( p . ptr . cached ) {
2019-08-22 13:20:38 -04:00
if ( ! stale )
2019-02-14 15:42:41 -05:00
update_cached_sectors ( c , fs_usage , p . ptr . dev ,
disk_sectors ) ;
2019-10-08 18:45:29 -04:00
} else if ( ! p . has_ec ) {
2019-01-21 15:32:13 -05:00
dirty_sectors + = disk_sectors ;
r . e . devs [ r . e . nr_devs + + ] = p . ptr . dev ;
} else {
2019-10-07 15:57:47 -04:00
ret = bch2_mark_stripe_ptr ( c , p . ec , data_type ,
2020-07-09 18:31:51 -04:00
fs_usage , disk_sectors , flags ) ;
2019-10-08 18:45:29 -04:00
if ( ret )
return ret ;
2018-11-01 15:10:01 -04:00
2019-10-07 15:57:47 -04:00
/*
* There may be other dirty pointers in this extent , but
* if so they ' re not required for mounting if we have an
* erasure coded pointer in this extent :
*/
2019-01-21 15:32:13 -05:00
r . e . nr_required = 0 ;
}
2018-11-01 15:21:48 -04:00
}
2018-11-05 02:31:48 -05:00
2019-10-08 21:33:56 -04:00
if ( r . e . nr_devs )
update_replicas ( c , fs_usage , & r . e , dirty_sectors ) ;
2018-11-24 17:09:44 -05:00
return 0 ;
2018-11-01 15:21:48 -04:00
}
2018-07-24 14:54:39 -04:00
2020-07-06 19:16:25 -04:00
static int bch2_mark_stripe ( struct bch_fs * c ,
struct bkey_s_c old , struct bkey_s_c new ,
2018-11-24 17:09:44 -05:00
struct bch_fs_usage * fs_usage ,
2019-05-24 11:56:20 -04:00
u64 journal_seq , unsigned flags )
2018-11-01 15:13:19 -04:00
{
2019-12-31 16:17:42 -05:00
bool gc = flags & BTREE_TRIGGER_GC ;
2020-07-06 19:16:25 -04:00
size_t idx = new . k - > p . offset ;
const struct bch_stripe * old_s = old . k - > type = = KEY_TYPE_stripe
? bkey_s_c_to_stripe ( old ) . v : NULL ;
const struct bch_stripe * new_s = new . k - > type = = KEY_TYPE_stripe
? bkey_s_c_to_stripe ( new ) . v : NULL ;
2018-11-01 15:10:01 -04:00
struct stripe * m = genradix_ptr ( & c - > stripes [ gc ] , idx ) ;
unsigned i ;
2020-10-19 22:36:24 -04:00
int ret ;
2018-11-01 15:13:19 -04:00
2021-01-22 18:01:07 -05:00
BUG_ON ( gc & & old_s ) ;
2020-07-06 19:16:25 -04:00
if ( ! m | | ( old_s & & ! m - > alive ) ) {
2018-11-01 15:10:01 -04:00
bch_err_ratelimited ( c , " error marking nonexistent stripe %zu " ,
idx ) ;
return - 1 ;
}
2018-11-01 15:13:19 -04:00
2020-07-06 19:16:25 -04:00
if ( ! new_s ) {
2021-01-22 18:01:07 -05:00
spin_lock ( & c - > ec_stripes_heap_lock ) ;
bch2_stripes_heap_del ( c , m , idx ) ;
spin_unlock ( & c - > ec_stripes_heap_lock ) ;
2020-07-09 18:31:51 -04:00
2020-07-06 19:16:25 -04:00
memset ( m , 0 , sizeof ( * m ) ) ;
} else {
2020-07-06 20:18:13 -04:00
m - > alive = true ;
2020-07-06 19:16:25 -04:00
m - > sectors = le16_to_cpu ( new_s - > sectors ) ;
m - > algorithm = new_s - > algorithm ;
m - > nr_blocks = new_s - > nr_blocks ;
m - > nr_redundant = new_s - > nr_redundant ;
2020-10-23 18:40:30 -04:00
m - > blocks_nonempty = 0 ;
for ( i = 0 ; i < new_s - > nr_blocks ; i + + ) {
2021-01-22 18:01:07 -05:00
m - > block_sectors [ i ] =
stripe_blockcount_get ( new_s , i ) ;
m - > blocks_nonempty + = ! ! m - > block_sectors [ i ] ;
2021-03-12 16:55:28 -05:00
m - > ptrs [ i ] = new_s - > ptrs [ i ] ;
2020-10-23 18:40:30 -04:00
}
2020-07-06 19:16:25 -04:00
bch2_bkey_to_replicas ( & m - > r . e , new ) ;
2019-01-21 15:32:13 -05:00
2020-07-06 19:16:25 -04:00
if ( ! gc ) {
spin_lock ( & c - > ec_stripes_heap_lock ) ;
2019-05-24 11:56:20 -04:00
bch2_stripes_heap_update ( c , m , idx ) ;
2020-07-06 19:16:25 -04:00
spin_unlock ( & c - > ec_stripes_heap_lock ) ;
}
2018-11-01 15:13:19 -04:00
}
2018-11-24 17:09:44 -05:00
2021-01-22 18:01:07 -05:00
if ( gc ) {
/*
* gc recalculates this field from stripe ptr
* references :
*/
memset ( m - > block_sectors , 0 , sizeof ( m - > block_sectors ) ) ;
m - > blocks_nonempty = 0 ;
for ( i = 0 ; i < new_s - > nr_blocks ; i + + ) {
ret = mark_stripe_bucket ( c , new , i , fs_usage ,
journal_seq , flags ) ;
if ( ret )
return ret ;
}
update_replicas ( c , fs_usage , & m - > r . e ,
( ( s64 ) m - > sectors * m - > nr_redundant ) ) ;
}
2018-11-24 17:09:44 -05:00
return 0 ;
2018-11-01 15:13:19 -04:00
}
2020-05-25 14:57:06 -04:00
/*
 * Dispatch an in-memory marking trigger according to key type.
 *
 * The key inspected is @new when BTREE_TRIGGER_INSERT is set in @flags and
 * @old otherwise; at least one of BTREE_TRIGGER_INSERT and
 * BTREE_TRIGGER_OVERWRITE must be set.  The whole dispatch runs with
 * preemption disabled.  When no @fs_usage was supplied, or for a gc pass, it
 * is looked up with fs_usage_ptr().
 *
 * Returns whatever the per-type handler returned; key types handled inline
 * (inode, reservation) and unlisted types return 0.
 */
static int bch2_mark_key_locked(struct bch_fs *c,
				struct bkey_s_c old,
				struct bkey_s_c new,
				unsigned offset, s64 sectors,
				struct bch_fs_usage *fs_usage,
				u64 journal_seq, unsigned flags)
{
	struct bkey_s_c k = (flags & BTREE_TRIGGER_INSERT) ? new : old;
	int ret = 0;

	BUG_ON(!(flags & (BTREE_TRIGGER_INSERT|BTREE_TRIGGER_OVERWRITE)));

	preempt_disable();

	if (!fs_usage || (flags & BTREE_TRIGGER_GC))
		fs_usage = fs_usage_ptr(c, journal_seq,
					flags & BTREE_TRIGGER_GC);

	switch (k.k->type) {
	case KEY_TYPE_alloc:
	case KEY_TYPE_alloc_v2:
		ret = bch2_mark_alloc(c, old, new, fs_usage,
				      journal_seq, flags);
		break;

	case KEY_TYPE_btree_ptr:
	case KEY_TYPE_btree_ptr_v2:
		/* Btree nodes always account a whole node, signed by direction */
		sectors = !(flags & BTREE_TRIGGER_OVERWRITE)
			?  c->opts.btree_node_size
			: -c->opts.btree_node_size;

		ret = bch2_mark_extent(c, old, new, offset, sectors,
				       BCH_DATA_btree, fs_usage,
				       journal_seq, flags);
		break;

	case KEY_TYPE_extent:
	case KEY_TYPE_reflink_v:
		ret = bch2_mark_extent(c, old, new, offset, sectors,
				       BCH_DATA_user, fs_usage,
				       journal_seq, flags);
		break;

	case KEY_TYPE_stripe:
		ret = bch2_mark_stripe(c, old, new, fs_usage,
				       journal_seq, flags);
		break;

	case KEY_TYPE_inode:
		fs_usage->nr_inodes += new.k->type == KEY_TYPE_inode;
		fs_usage->nr_inodes -= old.k->type == KEY_TYPE_inode;
		break;

	case KEY_TYPE_reservation: {
		unsigned nr = bkey_s_c_to_reservation(k).v->nr_replicas;

		/* Scale by the unclamped replica count, then clamp for indexing */
		sectors *= nr;
		nr = clamp_t(unsigned, nr, 1,
			     ARRAY_SIZE(fs_usage->persistent_reserved));

		fs_usage->reserved			+= sectors;
		fs_usage->persistent_reserved[nr - 1]	+= sectors;
		break;
	}
	}

	preempt_enable();

	return ret;
}
2020-07-06 19:16:25 -04:00
int bch2_mark_key ( struct bch_fs * c , struct bkey_s_c new ,
2019-08-09 13:01:10 -04:00
unsigned offset , s64 sectors ,
2018-11-27 08:23:22 -05:00
struct bch_fs_usage * fs_usage ,
2018-11-22 22:50:35 -05:00
u64 journal_seq , unsigned flags )
{
2020-07-06 19:16:25 -04:00
struct bkey deleted ;
struct bkey_s_c old = ( struct bkey_s_c ) { & deleted , NULL } ;
2018-11-22 22:50:35 -05:00
int ret ;
2020-07-06 19:16:25 -04:00
bkey_init ( & deleted ) ;
2018-11-26 00:13:33 -05:00
percpu_down_read ( & c - > mark_lock ) ;
2020-07-06 19:16:25 -04:00
ret = bch2_mark_key_locked ( c , old , new , offset , sectors ,
fs_usage , journal_seq ,
BTREE_TRIGGER_INSERT | flags ) ;
2018-11-26 00:13:33 -05:00
percpu_up_read ( & c - > mark_lock ) ;
2018-11-24 17:09:44 -05:00
return ret ;
2017-03-16 22:18:50 -08:00
}
2019-04-17 15:49:28 -04:00
/*
 * Run the in-memory marking triggers for inserting @new at @iter.
 *
 * Returns 0 without doing anything when BTREE_TRIGGER_NORUN is set in @flags
 * or when btree_node_type_needs_gc() is false for the iterator's btree.
 *
 * Non-extent btrees: the existing key is taken from the iterator's slot (or
 * from the key cache entry for a cached iterator) and marked against @new.
 * The results of those bch2_mark_key_locked() calls are not stored, so this
 * path always returns 0.
 *
 * Extent btrees: @new is marked as an insert of new->k.size sectors, then a
 * copy of the iterator is walked over existing keys, marking each overlapped
 * portion as an overwrite with a negative sector count.
 */
int bch2_mark_update ( struct btree_trans * trans ,
2019-12-30 13:08:26 -05:00
struct btree_iter * iter ,
2020-07-06 19:16:25 -04:00
struct bkey_i * new ,
2019-04-17 15:49:28 -04:00
struct bch_fs_usage * fs_usage ,
unsigned flags )
2018-11-05 02:31:48 -05:00
{
struct bch_fs * c = trans - > c ;
2020-07-06 19:16:25 -04:00
struct bkey_s_c old ;
struct bkey unpacked ;
2019-04-17 15:49:28 -04:00
int ret = 0 ;
2018-11-05 02:31:48 -05:00
2019-12-31 16:17:42 -05:00
if ( unlikely ( flags & BTREE_TRIGGER_NORUN ) )
return 0 ;
2018-11-01 15:10:01 -04:00
if ( ! btree_node_type_needs_gc ( iter - > btree_id ) )
2019-04-17 15:49:28 -04:00
return 0 ;
2018-11-22 22:50:35 -05:00
2020-07-06 19:16:25 -04:00
/* Default "old" key: a freshly initialised key with no value */
bkey_init ( & unpacked ) ;
old = ( struct bkey_s_c ) { & unpacked , NULL } ;
2019-04-15 14:58:00 -04:00
2020-07-06 19:16:25 -04:00
if ( ! btree_node_type_is_extents ( iter - > btree_id ) ) {
2020-12-10 13:13:56 -05:00
/* iterators should be uptodate, shouldn't get errors here: */
2020-07-06 19:16:25 -04:00
if ( btree_iter_type ( iter ) ! = BTREE_ITER_CACHED ) {
2020-12-10 13:13:56 -05:00
old = bch2_btree_iter_peek_slot ( iter ) ;
BUG_ON ( bkey_err ( old ) ) ;
2020-07-06 19:16:25 -04:00
} else {
/* Cached iterator: level 0 holds a struct bkey_cached */
struct bkey_cached * ck = ( void * ) iter - > l [ 0 ] . b ;
2019-04-17 15:49:45 -04:00
2020-07-06 19:16:25 -04:00
/* An invalid cache entry leaves "old" as the empty key */
if ( ck - > valid )
old = bkey_i_to_s_c ( ck - > k ) ;
}
2018-11-05 02:31:48 -05:00
2020-07-06 19:16:25 -04:00
/*
 * Same key type on both sides: one combined insert+overwrite call.
 * Different types: mark the insert and the overwrite separately.
 * The return values are discarded in both cases.
 */
if ( old . k - > type = = new - > k . type ) {
bch2_mark_key_locked ( c , old , bkey_i_to_s_c ( new ) , 0 , 0 ,
fs_usage , trans - > journal_res . seq ,
BTREE_TRIGGER_INSERT | BTREE_TRIGGER_OVERWRITE | flags ) ;
} else {
bch2_mark_key_locked ( c , old , bkey_i_to_s_c ( new ) , 0 , 0 ,
fs_usage , trans - > journal_res . seq ,
BTREE_TRIGGER_INSERT | flags ) ;
bch2_mark_key_locked ( c , old , bkey_i_to_s_c ( new ) , 0 , 0 ,
fs_usage , trans - > journal_res . seq ,
BTREE_TRIGGER_OVERWRITE | flags ) ;
}
} else {
2021-02-10 16:13:57 -05:00
struct btree_iter * copy ;
2020-07-06 19:16:25 -04:00
BUG_ON ( btree_iter_type ( iter ) = = BTREE_ITER_CACHED ) ;
/* Mark the whole new extent as inserted; result is not checked */
bch2_mark_key_locked ( c , old , bkey_i_to_s_c ( new ) ,
0 , new - > k . size ,
fs_usage , trans - > journal_res . seq ,
BTREE_TRIGGER_INSERT | flags ) ;
2021-02-10 16:13:57 -05:00
/* Walk existing keys on a copy so @iter itself is not reassigned here */
copy = bch2_trans_copy_iter ( trans , iter ) ;
2020-07-06 19:16:25 -04:00
2021-02-10 16:13:57 -05:00
for_each_btree_key_continue ( copy , 0 , old , ret ) {
unsigned offset = 0 ;
s64 sectors = - ( ( s64 ) old . k - > size ) ;
2020-07-06 19:16:25 -04:00
/* flags is modified in place, so bits set here persist across iterations */
flags | = BTREE_TRIGGER_OVERWRITE ;
/* Stop at the first existing key that starts at or after the end of @new */
if ( bkey_cmp ( new - > k . p , bkey_start_pos ( old . k ) ) < = 0 )
2021-02-10 16:13:57 -05:00
break ;
2020-07-06 19:16:25 -04:00
/*
 * offset: where the overwritten range starts within the old key;
 * sectors: minus the number of sectors being overwritten.
 */
switch ( bch2_extent_overlap ( & new - > k , old . k ) ) {
case BCH_EXTENT_OVERLAP_ALL :
offset = 0 ;
sectors = - ( ( s64 ) old . k - > size ) ;
break ;
case BCH_EXTENT_OVERLAP_BACK :
offset = bkey_start_offset ( & new - > k ) -
bkey_start_offset ( old . k ) ;
sectors = bkey_start_offset ( & new - > k ) -
old . k - > p . offset ;
break ;
case BCH_EXTENT_OVERLAP_FRONT :
offset = 0 ;
sectors = bkey_start_offset ( old . k ) -
new - > k . p . offset ;
break ;
case BCH_EXTENT_OVERLAP_MIDDLE :
offset = bkey_start_offset ( & new - > k ) -
bkey_start_offset ( old . k ) ;
sectors = - ( ( s64 ) new - > k . size ) ;
flags | = BTREE_TRIGGER_OVERWRITE_SPLIT ;
break ;
}
BUG_ON ( sectors > = 0 ) ;
2018-11-05 02:31:48 -05:00
2020-07-06 19:16:25 -04:00
/*
 * "?: 1" turns a 0 result into 1, so only a negative result
 * terminates the walk here.
 * NOTE(review): the value of ret after the loop depends on how
 * for_each_btree_key_continue() assigns it - confirm against the macro.
 */
ret = bch2_mark_key_locked ( c , old , bkey_i_to_s_c ( new ) ,
offset , sectors , fs_usage ,
trans - > journal_res . seq , flags ) ? : 1 ;
if ( ret < = 0 )
break ;
}
2021-02-10 16:13:57 -05:00
bch2_trans_iter_put ( trans , copy ) ;
2018-11-05 02:31:48 -05:00
}
2019-04-17 15:49:28 -04:00
return ret ;
2019-03-15 18:20:46 -04:00
}
2018-11-05 02:31:48 -05:00
2021-04-03 20:29:05 -04:00
static noinline __cold
void fs_usage_apply_warn ( struct btree_trans * trans ,
unsigned disk_res_sectors )
2019-03-15 18:20:46 -04:00
{
struct bch_fs * c = trans - > c ;
struct btree_insert_entry * i ;
char buf [ 200 ] ;
2021-04-03 20:29:05 -04:00
bch_err ( c , " disk usage increased more than %u sectors reserved " ,
2019-08-16 09:59:56 -04:00
disk_res_sectors ) ;
2019-03-15 18:20:46 -04:00
2019-09-22 18:49:16 -04:00
trans_for_each_update ( trans , i ) {
2019-01-21 15:32:13 -05:00
pr_err ( " while inserting " ) ;
2019-03-15 18:20:46 -04:00
bch2_bkey_val_to_text ( & PBUF ( buf ) , c , bkey_i_to_s_c ( i - > k ) ) ;
2019-01-21 15:32:13 -05:00
pr_err ( " %s " , buf ) ;
pr_err ( " overlapping with " ) ;
2020-06-28 18:11:12 -04:00
if ( btree_iter_type ( i - > iter ) ! = BTREE_ITER_CACHED ) {
2021-02-10 16:13:57 -05:00
struct btree_iter * copy = bch2_trans_copy_iter ( trans , i - > iter ) ;
struct bkey_s_c k ;
int ret ;
2018-11-22 22:50:35 -05:00
2021-02-10 16:13:57 -05:00
for_each_btree_key_continue ( copy , 0 , k , ret ) {
if ( btree_node_type_is_extents ( i - > iter - > btree_id )
2020-06-28 18:11:12 -04:00
? bkey_cmp ( i - > k - > k . p , bkey_start_pos ( k . k ) ) < = 0
: bkey_cmp ( i - > k - > k . p , k . k - > p ) )
break ;
bch2_bkey_val_to_text ( & PBUF ( buf ) , c , k ) ;
pr_err ( " %s " , buf ) ;
}
2021-02-10 16:13:57 -05:00
bch2_trans_iter_put ( trans , copy ) ;
2020-06-28 18:11:12 -04:00
} else {
struct bkey_cached * ck = ( void * ) i - > iter - > l [ 0 ] . b ;
2020-07-06 19:16:25 -04:00
if ( ck - > valid ) {
bch2_bkey_val_to_text ( & PBUF ( buf ) , c , bkey_i_to_s_c ( ck - > k ) ) ;
pr_err ( " %s " , buf ) ;
}
2019-01-21 15:32:13 -05:00
}
}
2018-11-05 02:31:48 -05:00
}
2021-04-03 20:29:05 -04:00
void bch2_trans_fs_usage_apply ( struct btree_trans * trans ,
struct replicas_delta_list * deltas )
{
struct bch_fs * c = trans - > c ;
static int warned_disk_usage = 0 ;
bool warn = false ;
unsigned disk_res_sectors = trans - > disk_res ? trans - > disk_res - > sectors : 0 ;
struct replicas_delta * d = deltas - > d ;
struct replicas_delta * top = ( void * ) deltas - > d + deltas - > used ;
struct bch_fs_usage * dst ;
s64 added = 0 , should_not_have_added ;
unsigned i ;
percpu_rwsem_assert_held ( & c - > mark_lock ) ;
preempt_disable ( ) ;
dst = fs_usage_ptr ( c , trans - > journal_res . seq , false ) ;
for ( d = deltas - > d ; d ! = top ; d = replicas_delta_next ( d ) ) {
switch ( d - > r . data_type ) {
case BCH_DATA_btree :
case BCH_DATA_user :
case BCH_DATA_parity :
added + = d - > delta ;
}
update_replicas ( c , dst , & d - > r , d - > delta ) ;
}
dst - > nr_inodes + = deltas - > nr_inodes ;
for ( i = 0 ; i < BCH_REPLICAS_MAX ; i + + ) {
added + = deltas - > persistent_reserved [ i ] ;
dst - > reserved + = deltas - > persistent_reserved [ i ] ;
dst - > persistent_reserved [ i ] + = deltas - > persistent_reserved [ i ] ;
}
/*
* Not allowed to reduce sectors_available except by getting a
* reservation :
*/
should_not_have_added = added - ( s64 ) disk_res_sectors ;
if ( unlikely ( should_not_have_added > 0 ) ) {
atomic64_sub ( should_not_have_added , & c - > sectors_available ) ;
added - = should_not_have_added ;
warn = true ;
}
if ( added > 0 ) {
trans - > disk_res - > sectors - = added ;
this_cpu_sub ( * c - > online_reserved , added ) ;
}
preempt_enable ( ) ;
if ( unlikely ( warn ) & & ! xchg ( & warned_disk_usage , 1 ) )
fs_usage_apply_warn ( trans , disk_res_sectors ) ;
}
2019-03-11 14:59:58 -04:00
/* trans_mark: */
2019-10-05 12:54:53 -04:00
static struct btree_iter * trans_get_update ( struct btree_trans * trans ,
enum btree_id btree_id , struct bpos pos ,
struct bkey_s_c * k )
2019-03-11 14:59:58 -04:00
{
2019-08-07 12:07:13 -04:00
struct btree_insert_entry * i ;
2019-03-11 14:59:58 -04:00
2019-09-22 18:49:16 -04:00
trans_for_each_update ( trans , i )
2019-09-07 14:16:00 -04:00
if ( i - > iter - > btree_id = = btree_id & &
2019-08-07 12:07:13 -04:00
( btree_node_type_is_extents ( btree_id )
? bkey_cmp ( pos , bkey_start_pos ( & i - > k - > k ) ) > = 0 & &
bkey_cmp ( pos , i - > k - > k . p ) < 0
: ! bkey_cmp ( pos , i - > iter - > pos ) ) ) {
2019-10-05 12:54:53 -04:00
* k = bkey_i_to_s_c ( i - > k ) ;
2021-03-19 20:40:31 -04:00
/* ugly hack.. */
BUG_ON ( btree_iter_live ( trans , i - > iter ) ) ;
trans - > iters_live | = 1ULL < < i - > iter - > idx ;
2019-10-05 12:54:53 -04:00
return i - > iter ;
2019-03-11 14:59:58 -04:00
}
2019-10-05 12:54:53 -04:00
return NULL ;
}
static int trans_get_key ( struct btree_trans * trans ,
enum btree_id btree_id , struct bpos pos ,
struct btree_iter * * iter ,
struct bkey_s_c * k )
{
2021-02-20 19:27:37 -05:00
unsigned flags = btree_id ! = BTREE_ID_alloc
2019-10-05 12:54:53 -04:00
? BTREE_ITER_SLOTS
: BTREE_ITER_CACHED ;
int ret ;
* iter = trans_get_update ( trans , btree_id , pos , k ) ;
if ( * iter )
return 1 ;
2019-09-26 22:21:39 -04:00
* iter = bch2_trans_get_iter ( trans , btree_id , pos ,
2019-10-05 12:54:53 -04:00
flags | BTREE_ITER_INTENT ) ;
* k = __bch2_btree_iter_peek ( * iter , flags ) ;
2019-03-11 14:59:58 -04:00
ret = bkey_err ( * k ) ;
if ( ret )
bch2_trans_iter_put ( trans , * iter ) ;
return ret ;
}
2021-01-22 18:01:07 -05:00
static struct bkey_alloc_buf *
bch2_trans_start_alloc_update ( struct btree_trans * trans , struct btree_iter * * _iter ,
const struct bch_extent_ptr * ptr ,
struct bkey_alloc_unpacked * u )
2019-03-11 14:59:58 -04:00
{
struct bch_fs * c = trans - > c ;
2020-10-19 22:36:24 -04:00
struct bch_dev * ca = bch_dev_bkey_exists ( c , ptr - > dev ) ;
struct bpos pos = POS ( ptr - > dev , PTR_BUCKET_NR ( ca , ptr ) ) ;
2020-06-03 23:46:15 -04:00
struct bucket * g ;
2020-10-19 22:36:24 -04:00
struct btree_iter * iter ;
struct bkey_s_c k ;
2021-01-22 18:01:07 -05:00
struct bkey_alloc_buf * a ;
2019-03-11 14:59:58 -04:00
int ret ;
2021-01-22 18:01:07 -05:00
a = bch2_trans_kmalloc ( trans , sizeof ( struct bkey_alloc_buf ) ) ;
if ( IS_ERR ( a ) )
return a ;
2021-02-20 19:27:37 -05:00
iter = trans_get_update ( trans , BTREE_ID_alloc , pos , & k ) ;
2019-10-05 12:54:53 -04:00
if ( iter ) {
2020-10-19 22:36:24 -04:00
* u = bch2_alloc_unpack ( k ) ;
2019-08-27 17:34:03 -04:00
} else {
2021-02-20 19:27:37 -05:00
iter = bch2_trans_get_iter ( trans , BTREE_ID_alloc , pos ,
2019-10-05 12:54:53 -04:00
BTREE_ITER_CACHED |
BTREE_ITER_CACHED_NOFILL |
BTREE_ITER_INTENT ) ;
ret = bch2_btree_iter_traverse ( iter ) ;
2020-10-19 22:36:24 -04:00
if ( ret ) {
bch2_trans_iter_put ( trans , iter ) ;
2021-01-22 18:01:07 -05:00
return ERR_PTR ( ret ) ;
2020-10-19 22:36:24 -04:00
}
2020-06-03 23:46:15 -04:00
2019-10-05 12:54:53 -04:00
percpu_down_read ( & c - > mark_lock ) ;
g = bucket ( ca , pos . offset ) ;
2021-01-22 18:01:07 -05:00
* u = alloc_mem_to_key ( iter , g , READ_ONCE ( g - > mark ) ) ;
2019-10-05 12:54:53 -04:00
percpu_up_read ( & c - > mark_lock ) ;
}
2020-06-03 23:46:15 -04:00
2020-10-19 22:36:24 -04:00
* _iter = iter ;
2021-01-22 18:01:07 -05:00
return a ;
2020-10-19 22:36:24 -04:00
}
/*
 * Transactional counterpart of pointer marking: apply @sectors of
 * @data_type for pointer @p to the bucket's alloc key.
 *
 * The bucket's current state is obtained with
 * bch2_trans_start_alloc_update(), adjusted by __mark_pointer(), and - only
 * if that returned 0 - packed and queued as a transaction update.  The
 * iterator is always put.  Returns the allocation error, or the result of
 * __mark_pointer().
 */
static int bch2_trans_mark_pointer(struct btree_trans *trans,
			struct bkey_s_c k, struct extent_ptr_decoded p,
			s64 sectors, enum bch_data_type data_type)
{
	struct bch_fs *c = trans->c;
	struct bkey_alloc_unpacked u;
	struct bkey_alloc_buf *a;
	struct btree_iter *iter;
	int ret;

	a = bch2_trans_start_alloc_update(trans, &iter, &p.ptr, &u);
	if (IS_ERR(a))
		return PTR_ERR(a);

	ret = __mark_pointer(c, k, &p.ptr, sectors, data_type,
			     u.gen, &u.data_type,
			     &u.dirty_sectors, &u.cached_sectors);
	if (!ret) {
		bch2_alloc_pack(c, a, u);
		bch2_trans_update(trans, iter, &a->k, 0);
	}

	bch2_trans_iter_put(trans, iter);
	return ret;
}
static int bch2_trans_mark_stripe_ptr ( struct btree_trans * trans ,
2021-01-11 13:51:23 -05:00
struct extent_ptr_decoded p ,
2020-07-09 18:31:51 -04:00
s64 sectors , enum bch_data_type data_type )
2019-03-11 14:59:58 -04:00
{
2019-08-16 09:59:56 -04:00
struct bch_fs * c = trans - > c ;
2019-03-11 14:59:58 -04:00
struct btree_iter * iter ;
struct bkey_s_c k ;
2019-12-31 19:37:10 -05:00
struct bkey_i_stripe * s ;
2020-07-09 18:31:51 -04:00
struct bch_replicas_padded r ;
2019-03-11 14:59:58 -04:00
int ret = 0 ;
2021-02-20 19:27:37 -05:00
ret = trans_get_key ( trans , BTREE_ID_stripes , POS ( 0 , p . ec . idx ) , & iter , & k ) ;
2019-08-27 17:34:03 -04:00
if ( ret < 0 )
2019-03-11 14:59:58 -04:00
return ret ;
if ( k . k - > type ! = KEY_TYPE_stripe ) {
2019-08-16 09:59:56 -04:00
bch2_fs_inconsistent ( c ,
" pointer to nonexistent stripe %llu " ,
2021-01-11 13:51:23 -05:00
( u64 ) p . ec . idx ) ;
ret = - EIO ;
goto out ;
}
if ( ! bch2_ptr_matches_stripe ( bkey_s_c_to_stripe ( k ) . v , p ) ) {
bch2_fs_inconsistent ( c ,
" stripe pointer doesn't match stripe %llu " ,
( u64 ) p . ec . idx ) ;
2019-08-16 09:59:56 -04:00
ret = - EIO ;
2019-03-11 14:59:58 -04:00
goto out ;
}
2019-12-31 19:37:10 -05:00
s = bch2_trans_kmalloc ( trans , bkey_bytes ( k . k ) ) ;
ret = PTR_ERR_OR_ZERO ( s ) ;
2019-03-11 14:59:58 -04:00
if ( ret )
goto out ;
2019-12-31 19:37:10 -05:00
bkey_reassemble ( & s - > k_i , k ) ;
2021-01-11 13:51:23 -05:00
stripe_blockcount_set ( & s - > v , p . ec . block ,
stripe_blockcount_get ( & s - > v , p . ec . block ) +
2019-10-07 15:57:47 -04:00
sectors ) ;
2019-12-31 19:37:10 -05:00
bch2_trans_update ( trans , iter , & s - > k_i , 0 ) ;
2020-07-09 18:31:51 -04:00
bch2_bkey_to_replicas ( & r . e , bkey_i_to_s_c ( & s - > k_i ) ) ;
r . e . data_type = data_type ;
update_replicas_list ( trans , & r . e , sectors ) ;
2019-03-11 14:59:58 -04:00
out :
bch2_trans_iter_put ( trans , iter ) ;
return ret ;
}
/*
 * Transactionally mark every pointer of the extent-like key @k.
 *
 * Per decoded pointer the on-disk sector delta is @sectors for
 * BCH_DATA_btree and ptr_disk_sectors_delta() otherwise; it is applied via
 * bch2_trans_mark_pointer().  A negative result aborts; a positive one marks
 * the pointer stale.  Cached pointers update the cached-sectors list unless
 * stale, plain dirty pointers are gathered into one replicas entry applied
 * after the loop, and erasure coded pointers go through
 * bch2_trans_mark_stripe_ptr() and set nr_required of that entry to 0.
 *
 * @sectors must be nonzero.  Returns 0 on success.
 */
static int bch2_trans_mark_extent(struct btree_trans *trans,
			struct bkey_s_c k, unsigned offset,
			s64 sectors, unsigned flags,
			enum bch_data_type data_type)
{
	struct bkey_ptrs_c ptrs = bch2_bkey_ptrs_c(k);
	const union bch_extent_entry *entry;
	struct extent_ptr_decoded p;
	struct bch_replicas_padded r;
	s64 dirty_total = 0;
	int ret;

	r.e.data_type	= data_type;
	r.e.nr_devs	= 0;
	r.e.nr_required	= 1;

	BUG_ON(!sectors);

	bkey_for_each_ptr_decode(k.k, ptrs, p, entry) {
		s64 disk_sectors;
		bool stale;

		if (data_type == BCH_DATA_btree)
			disk_sectors = sectors;
		else
			disk_sectors = ptr_disk_sectors_delta(p, offset,
							      sectors, flags);

		ret = bch2_trans_mark_pointer(trans, k, p, disk_sectors,
					      data_type);
		if (ret < 0)
			return ret;

		stale = ret > 0;

		if (p.ptr.cached) {
			if (!stale)
				update_cached_sectors_list(trans, p.ptr.dev,
							   disk_sectors);
		} else if (p.has_ec) {
			ret = bch2_trans_mark_stripe_ptr(trans, p,
					disk_sectors, data_type);
			if (ret)
				return ret;

			r.e.nr_required = 0;
		} else {
			dirty_total += disk_sectors;
			r.e.devs[r.e.nr_devs++] = p.ptr.dev;
		}
	}

	if (r.e.nr_devs)
		update_replicas_list(trans, &r.e, dirty_total);

	return 0;
}
2020-12-10 13:13:56 -05:00
/*
 * Transactionally add or remove stripe @s's reference on the bucket behind
 * its block @idx.
 *
 * For parity blocks (index at or past nr_blocks - nr_redundant) the stripe's
 * sector count is added to - or, when @deleting, subtracted from - the
 * bucket's dirty_sectors, and the data type becomes BCH_DATA_parity while
 * dirty_sectors is nonzero, else 0.
 *
 * When adding, a bucket that already names a different stripe flags the
 * filesystem inconsistent and yields -EIO without queueing an update;
 * otherwise the bucket records this stripe's offset and redundancy.  When
 * deleting, both fields are cleared.  The packed alloc key is then queued as
 * a transaction update.  The iterator is always put.
 */
static int bch2_trans_mark_stripe_alloc_ref(struct btree_trans *trans,
					    struct bkey_s_c_stripe s,
					    unsigned idx, bool deleting)
{
	struct bch_fs *c = trans->c;
	const struct bch_extent_ptr *ptr = &s.v->ptrs[idx];
	bool is_parity = idx >= s.v->nr_blocks - s.v->nr_redundant;
	struct bkey_alloc_unpacked u;
	struct bkey_alloc_buf *a;
	struct btree_iter *iter;
	int ret = 0;

	a = bch2_trans_start_alloc_update(trans, &iter, ptr, &u);
	if (IS_ERR(a))
		return PTR_ERR(a);

	if (is_parity) {
		s64 delta = le16_to_cpu(s.v->sectors);

		if (deleting)
			delta = -delta;

		u.dirty_sectors += delta;

		if (u.dirty_sectors)
			u.data_type = BCH_DATA_parity;
		else
			u.data_type = 0;
	}

	if (deleting) {
		u.stripe		= 0;
		u.stripe_redundancy	= 0;
	} else {
		if (bch2_fs_inconsistent_on(u.stripe && u.stripe != s.k->p.offset, c,
				" bucket %llu:%llu gen %u: multiple stripes using same bucket (%u, %llu) ",
				iter->pos.inode, iter->pos.offset, u.gen,
				u.stripe, s.k->p.offset)) {
			ret = -EIO;
			goto out;
		}

		u.stripe		= s.k->p.offset;
		u.stripe_redundancy	= s.v->nr_redundant;
	}

	bch2_alloc_pack(c, a, u);
	bch2_trans_update(trans, iter, &a->k, 0);
out:
	bch2_trans_iter_put(trans, iter);
	return ret;
}
2020-10-19 22:36:24 -04:00
static int bch2_trans_mark_stripe ( struct btree_trans * trans ,
2020-12-10 13:13:56 -05:00
struct bkey_s_c old , struct bkey_s_c new ,
2020-07-09 18:31:51 -04:00
unsigned flags )
2020-10-19 22:36:24 -04:00
{
2021-01-22 18:01:07 -05:00
struct bkey_s_c_stripe old_s = { NULL } ;
struct bkey_s_c_stripe new_s = { NULL } ;
2020-07-09 18:31:51 -04:00
struct bch_replicas_padded r ;
2020-10-19 22:36:24 -04:00
unsigned i ;
int ret = 0 ;
2021-01-22 18:01:07 -05:00
if ( old . k - > type = = KEY_TYPE_stripe )
old_s = bkey_s_c_to_stripe ( old ) ;
if ( new . k - > type = = KEY_TYPE_stripe )
new_s = bkey_s_c_to_stripe ( new ) ;
2020-10-19 22:36:24 -04:00
/*
2020-12-10 13:13:56 -05:00
* If the pointers aren ' t changing , we don ' t need to do anything :
2020-10-19 22:36:24 -04:00
*/
2021-01-22 18:01:07 -05:00
if ( new_s . k & & old_s . k & &
new_s . v - > nr_blocks = = old_s . v - > nr_blocks & &
new_s . v - > nr_redundant = = old_s . v - > nr_redundant & &
! memcmp ( old_s . v - > ptrs , new_s . v - > ptrs ,
new_s . v - > nr_blocks * sizeof ( struct bch_extent_ptr ) ) )
2020-12-10 13:13:56 -05:00
return 0 ;
2020-10-19 22:36:24 -04:00
2021-01-22 18:01:07 -05:00
if ( new_s . k ) {
s64 sectors = le16_to_cpu ( new_s . v - > sectors ) ;
2020-07-09 18:31:51 -04:00
2020-12-10 13:13:56 -05:00
bch2_bkey_to_replicas ( & r . e , new ) ;
2021-01-22 18:01:07 -05:00
update_replicas_list ( trans , & r . e , sectors * new_s . v - > nr_redundant ) ;
2020-10-19 22:36:24 -04:00
2021-01-22 18:01:07 -05:00
for ( i = 0 ; i < new_s . v - > nr_blocks ; i + + ) {
ret = bch2_trans_mark_stripe_alloc_ref ( trans , new_s ,
i , false ) ;
2020-12-10 13:13:56 -05:00
if ( ret )
return ret ;
2020-07-09 18:31:51 -04:00
}
2020-12-10 13:13:56 -05:00
}
2020-07-09 18:31:51 -04:00
2021-01-22 18:01:07 -05:00
if ( old_s . k ) {
s64 sectors = - ( ( s64 ) le16_to_cpu ( old_s . v - > sectors ) ) ;
2020-12-10 13:13:56 -05:00
bch2_bkey_to_replicas ( & r . e , old ) ;
2021-01-22 18:01:07 -05:00
update_replicas_list ( trans , & r . e , sectors * old_s . v - > nr_redundant ) ;
2020-12-10 13:13:56 -05:00
2021-01-22 18:01:07 -05:00
for ( i = 0 ; i < old_s . v - > nr_blocks ; i + + ) {
ret = bch2_trans_mark_stripe_alloc_ref ( trans , old_s ,
i , true ) ;
2020-12-10 13:13:56 -05:00
if ( ret )
return ret ;
}
2020-10-19 22:36:24 -04:00
}
return ret ;
}
2020-10-24 19:51:34 -04:00
static __le64 * bkey_refcount ( struct bkey_i * k )
{
switch ( k - > k . type ) {
case KEY_TYPE_reflink_v :
return & bkey_i_to_reflink_v ( k ) - > v . refcount ;
case KEY_TYPE_indirect_inline_data :
return & bkey_i_to_indirect_inline_data ( k ) - > v . refcount ;
default :
return NULL ;
}
}
2019-08-16 09:59:56 -04:00
/*
 * Adjust the refcount of the indirect extent found at offset @idx in the
 * reflink btree on behalf of reflink pointer @p.
 *
 * The refcount is incremented unless BTREE_TRIGGER_OVERWRITE is set, in which
 * case it is decremented; a key whose refcount reaches zero is turned into a
 * deleted key.  With BTREE_TRIGGER_OVERWRITE, an indirect extent that is not
 * fully contained in [@idx, @idx + @sectors) is left untouched and @sectors is
 * returned unchanged.
 *
 * Returns the number of sectors handled (the distance from @idx to the end of
 * the indirect extent) on success, or a negative error code.
 */
static int __bch2_trans_mark_reflink_p(struct btree_trans *trans,
			struct bkey_s_c_reflink_p p,
			u64 idx, unsigned sectors,
			unsigned flags)
{
	struct bch_fs *c = trans->c;
	bool overwrite = flags & BTREE_TRIGGER_OVERWRITE;
	struct btree_iter *iter;
	struct bkey_s_c indirect;
	struct bkey_i *update;
	__le64 *refcount;
	s64 ret;

	ret = trans_get_key(trans, BTREE_ID_reflink,
			    POS(0, idx), &iter, &indirect);
	if (ret < 0)
		return ret;

	if (overwrite &&
	    (bkey_start_offset(indirect.k) < idx ||
	     indirect.k->p.offset > idx + sectors))
		goto done;

	sectors = indirect.k->p.offset - idx;

	update = bch2_trans_kmalloc(trans, bkey_bytes(indirect.k));
	ret = PTR_ERR_OR_ZERO(update);
	if (ret)
		goto put_iter;

	bkey_reassemble(update, indirect);

	refcount = bkey_refcount(update);
	if (!refcount) {
		bch2_fs_inconsistent(c,
			" %llu:%llu len %u points to nonexistent indirect extent %llu ",
			p.k->p.inode, p.k->p.offset, p.k->size, idx);
		ret = -EIO;
		goto put_iter;
	}

	le64_add_cpu(refcount, overwrite ? -1 : 1);

	/* Last reference dropped: replace the indirect extent with a deletion */
	if (!*refcount) {
		update->k.type = KEY_TYPE_deleted;
		set_bkey_val_u64s(&update->k, 0);
	}

	bch2_btree_iter_set_pos(iter, bkey_start_pos(indirect.k));
	bch2_trans_update(trans, iter, update, 0);
done:
	ret = sectors;
put_iter:
	bch2_trans_iter_put(trans, iter);
	return ret;
}
/*
 * Walk the indirect extents referenced by reflink pointer @p, starting
 * @offset sectors into it and covering |@sectors| sectors, adjusting the
 * refcount of each via __bch2_trans_mark_reflink_p().
 *
 * Returns 0 on success or the first negative error encountered.
 */
static int bch2_trans_mark_reflink_p(struct btree_trans *trans,
			struct bkey_s_c_reflink_p p, unsigned offset,
			s64 sectors, unsigned flags)
{
	u64 idx = le64_to_cpu(p.v->idx) + offset;

	sectors = abs(sectors);
	BUG_ON(offset + sectors > p.k->size);

	while (sectors) {
		s64 done = __bch2_trans_mark_reflink_p(trans, p, idx,
						       sectors, flags);
		if (done < 0)
			return done;

		idx += done;
		/* A step may cover more than what is left; never go negative */
		sectors = max_t(s64, 0LL, sectors - done);
	}

	return 0;
}
2020-12-10 13:13:56 -05:00
/*
 * Dispatch the transactional trigger for a key, based on its type.
 *
 * The key examined is @new when BTREE_TRIGGER_INSERT is set in @flags and
 * @old otherwise; at least one of BTREE_TRIGGER_INSERT and
 * BTREE_TRIGGER_OVERWRITE must be set.  @offset and @sectors are forwarded to
 * the extent and reflink pointer handlers.
 *
 * Returns 0 on success (including key types with no trigger) or the error
 * returned by the type specific handler.
 */
int bch2_trans_mark_key(struct btree_trans *trans,
			struct bkey_s_c old,
			struct bkey_s_c new,
			unsigned offset, s64 sectors, unsigned flags)
{
	struct bch_fs *c = trans->c;
	struct bkey_s_c k = flags & BTREE_TRIGGER_INSERT ? new : old;
	struct replicas_delta_list *d;

	BUG_ON(!(flags & (BTREE_TRIGGER_INSERT|BTREE_TRIGGER_OVERWRITE)));

	switch (k.k->type) {
	case KEY_TYPE_btree_ptr:
	case KEY_TYPE_btree_ptr_v2:
		/* Btree nodes always account for a whole node's worth of sectors */
		if (!(flags & BTREE_TRIGGER_OVERWRITE))
			sectors = c->opts.btree_node_size;
		else
			sectors = -c->opts.btree_node_size;

		return bch2_trans_mark_extent(trans, k, offset, sectors,
					      flags, BCH_DATA_btree);
	case KEY_TYPE_extent:
	case KEY_TYPE_reflink_v:
		return bch2_trans_mark_extent(trans, k, offset, sectors,
					      flags, BCH_DATA_user);
	case KEY_TYPE_stripe:
		return bch2_trans_mark_stripe(trans, old, new, flags);
	case KEY_TYPE_inode: {
		/* +1 if an inode appears, -1 if one disappears, 0 otherwise */
		int nr = (new.k->type == KEY_TYPE_inode) -
			(old.k->type == KEY_TYPE_inode);

		if (nr) {
			d = replicas_deltas_realloc(trans, 0);
			d->nr_inodes += nr;
		}

		return 0;
	}
	case KEY_TYPE_reservation: {
		unsigned nr_replicas = bkey_s_c_to_reservation(k).v->nr_replicas;
		unsigned slot;

		d = replicas_deltas_realloc(trans, 0);

		sectors *= nr_replicas;
		slot = clamp_t(unsigned, nr_replicas, 1,
			       ARRAY_SIZE(d->persistent_reserved));

		d->persistent_reserved[slot - 1] += sectors;
		return 0;
	}
	case KEY_TYPE_reflink_p:
		return bch2_trans_mark_reflink_p(trans,
					bkey_s_c_to_reflink_p(k),
					offset, sectors, flags);
	default:
		return 0;
	}
}
int bch2_trans_mark_update ( struct btree_trans * trans ,
2019-06-24 17:50:52 -04:00
struct btree_iter * iter ,
2020-12-10 13:13:56 -05:00
struct bkey_i * new ,
2019-12-31 16:17:42 -05:00
unsigned flags )
2019-03-11 14:59:58 -04:00
{
2020-12-10 13:13:56 -05:00
struct bkey_s_c old ;
2019-03-11 14:59:58 -04:00
int ret ;
2019-12-31 16:17:42 -05:00
if ( unlikely ( flags & BTREE_TRIGGER_NORUN ) )
return 0 ;
2019-03-11 14:59:58 -04:00
if ( ! btree_node_type_needs_gc ( iter - > btree_id ) )
return 0 ;
2020-12-10 13:13:56 -05:00
if ( ! btree_node_type_is_extents ( iter - > btree_id ) ) {
/* iterators should be uptodate, shouldn't get errors here: */
if ( btree_iter_type ( iter ) ! = BTREE_ITER_CACHED ) {
old = bch2_btree_iter_peek_slot ( iter ) ;
BUG_ON ( bkey_err ( old ) ) ;
} else {
struct bkey_cached * ck = ( void * ) iter - > l [ 0 ] . b ;
2019-03-07 19:46:10 -05:00
2020-12-10 13:13:56 -05:00
BUG_ON ( ! ck - > valid ) ;
old = bkey_i_to_s_c ( ck - > k ) ;
}
2019-03-07 19:46:10 -05:00
2020-12-10 13:13:56 -05:00
if ( old . k - > type = = new - > k . type ) {
ret = bch2_trans_mark_key ( trans , old , bkey_i_to_s_c ( new ) , 0 , 0 ,
BTREE_TRIGGER_INSERT | BTREE_TRIGGER_OVERWRITE | flags ) ;
} else {
ret = bch2_trans_mark_key ( trans , old , bkey_i_to_s_c ( new ) , 0 , 0 ,
BTREE_TRIGGER_INSERT | flags ) ? :
bch2_trans_mark_key ( trans , old , bkey_i_to_s_c ( new ) , 0 , 0 ,
BTREE_TRIGGER_OVERWRITE | flags ) ;
}
} else {
2021-02-10 16:13:57 -05:00
struct btree_iter * copy ;
struct bkey _old ;
2019-03-11 14:59:58 -04:00
2020-12-10 13:13:56 -05:00
EBUG_ON ( btree_iter_type ( iter ) = = BTREE_ITER_CACHED ) ;
2019-03-11 14:59:58 -04:00
2021-02-10 16:13:57 -05:00
bkey_init ( & _old ) ;
old = ( struct bkey_s_c ) { & _old , NULL } ;
2020-12-10 13:13:56 -05:00
ret = bch2_trans_mark_key ( trans , old , bkey_i_to_s_c ( new ) ,
0 , new - > k . size ,
BTREE_TRIGGER_INSERT ) ;
if ( ret )
return ret ;
2021-02-10 16:13:57 -05:00
copy = bch2_trans_copy_iter ( trans , iter ) ;
2020-12-10 13:13:56 -05:00
2021-02-10 16:13:57 -05:00
for_each_btree_key_continue ( copy , 0 , old , ret ) {
unsigned offset = 0 ;
s64 sectors = - ( ( s64 ) old . k - > size ) ;
2020-12-10 13:13:56 -05:00
flags | = BTREE_TRIGGER_OVERWRITE ;
if ( bkey_cmp ( new - > k . p , bkey_start_pos ( old . k ) ) < = 0 )
2021-02-10 16:13:57 -05:00
break ;
2019-03-11 14:59:58 -04:00
2020-12-10 13:13:56 -05:00
switch ( bch2_extent_overlap ( & new - > k , old . k ) ) {
2019-03-11 14:59:58 -04:00
case BCH_EXTENT_OVERLAP_ALL :
2019-08-09 13:01:10 -04:00
offset = 0 ;
2020-12-10 13:13:56 -05:00
sectors = - ( ( s64 ) old . k - > size ) ;
2019-03-11 14:59:58 -04:00
break ;
case BCH_EXTENT_OVERLAP_BACK :
2020-12-10 13:13:56 -05:00
offset = bkey_start_offset ( & new - > k ) -
bkey_start_offset ( old . k ) ;
sectors = bkey_start_offset ( & new - > k ) -
old . k - > p . offset ;
2019-03-11 14:59:58 -04:00
break ;
case BCH_EXTENT_OVERLAP_FRONT :
2019-08-09 13:01:10 -04:00
offset = 0 ;
2020-12-10 13:13:56 -05:00
sectors = bkey_start_offset ( old . k ) -
new - > k . p . offset ;
2019-03-11 14:59:58 -04:00
break ;
case BCH_EXTENT_OVERLAP_MIDDLE :
2020-12-10 13:13:56 -05:00
offset = bkey_start_offset ( & new - > k ) -
bkey_start_offset ( old . k ) ;
sectors = - ( ( s64 ) new - > k . size ) ;
2019-12-31 16:17:42 -05:00
flags | = BTREE_TRIGGER_OVERWRITE_SPLIT ;
2019-03-11 14:59:58 -04:00
break ;
}
BUG_ON ( sectors > = 0 ) ;
2020-12-10 13:13:56 -05:00
ret = bch2_trans_mark_key ( trans , old , bkey_i_to_s_c ( new ) ,
offset , sectors , flags ) ;
if ( ret )
2021-02-10 16:13:57 -05:00
break ;
2020-12-10 13:13:56 -05:00
}
2021-02-10 16:13:57 -05:00
bch2_trans_iter_put ( trans , copy ) ;
2019-03-11 14:59:58 -04:00
}
2020-12-10 13:13:56 -05:00
return ret ;
2019-03-11 14:59:58 -04:00
}
2021-01-22 17:56:34 -05:00
/*
 * Set the alloc key of bucket @b on device @ca to data type @type with
 * @sectors dirty sectors, inside transaction @trans.
 *
 * Reports an fsck error and returns -EIO if the bucket already holds a
 * different data type, or if the bucket's current dirty_sectors plus @sectors
 * exceeds the bucket size.  If the bucket already has exactly this type and
 * sector count, no update is queued.
 *
 * Returns 0 on success, -EIO as above, or the error from
 * bch2_trans_start_alloc_update().
 */
static int __bch2_trans_mark_metadata_bucket(struct btree_trans *trans,
					     struct bch_dev *ca, size_t b,
					     enum bch_data_type type,
					     unsigned sectors)
{
	struct bch_fs *c = trans->c;
	struct bch_extent_ptr bucket_ptr = {
		.dev	= ca->dev_idx,
		.offset	= bucket_to_sector(ca, b),
	};
	struct bkey_alloc_unpacked u;
	struct bkey_alloc_buf *a;
	struct btree_iter *iter;
	int ret = 0;

	a = bch2_trans_start_alloc_update(trans, &iter, &bucket_ptr, &u);
	if (IS_ERR(a))
		return PTR_ERR(a);

	if (u.data_type && u.data_type != type) {
		bch2_fsck_err(c, FSCK_CAN_IGNORE|FSCK_NEED_FSCK,
			" bucket %llu:%llu gen %u different types of data in same bucket: %s, %s \n "
			" while marking %s ",
			iter->pos.inode, iter->pos.offset, u.gen,
			bch2_data_types[u.data_type],
			bch2_data_types[type],
			bch2_data_types[type]);
		ret = -EIO;
		goto put_iter;
	}

	if ((unsigned) (u.dirty_sectors + sectors) > ca->mi.bucket_size) {
		bch2_fsck_err(c, FSCK_CAN_IGNORE|FSCK_NEED_FSCK,
			" bucket %llu:%llu gen %u data type %s sector count overflow: %u + %u > %u \n "
			" while marking %s ",
			iter->pos.inode, iter->pos.offset, u.gen,
			bch2_data_types[u.data_type ?: type],
			u.dirty_sectors, sectors, ca->mi.bucket_size,
			bch2_data_types[type]);
		ret = -EIO;
		goto put_iter;
	}

	/* Only queue an update when something actually changes */
	if (u.data_type != type ||
	    u.dirty_sectors != sectors) {
		u.data_type	= type;
		u.dirty_sectors	= sectors;

		bch2_alloc_pack(c, a, u);
		bch2_trans_update(trans, iter, &a->k, 0);
	}
put_iter:
	bch2_trans_iter_put(trans, iter);
	return ret;
}
/*
 * Mark bucket @b on device @ca as holding @sectors sectors of metadata of
 * type @type, running __bch2_trans_mark_metadata_bucket() through
 * __bch2_trans_do() with disk reservation @res.
 *
 * The caller's @type and @sectors are passed through unchanged.  Previously
 * BCH_DATA_journal and the full bucket size were hard-coded here, so every
 * caller (including the superblock marking path, which passes BCH_DATA_sb and
 * a partial sector count) ended up marking a full journal bucket.
 *
 * Returns 0 on success or a negative error code.
 */
int bch2_trans_mark_metadata_bucket(struct btree_trans *trans,
				    struct disk_reservation *res,
				    struct bch_dev *ca, size_t b,
				    enum bch_data_type type,
				    unsigned sectors)
{
	return __bch2_trans_do(trans, res, NULL, 0,
			__bch2_trans_mark_metadata_bucket(trans, ca, b,
							  type, sectors));
}
/*
 * Account the sector range [@start, @end) on device @ca as metadata of type
 * @type, one bucket at a time.
 *
 * @bucket and @bucket_sectors are an accumulator shared across calls: sectors
 * are summed per bucket, and the running total is only flushed with
 * bch2_trans_mark_metadata_bucket() when the range moves on to a different
 * bucket.  The total for the last bucket is left in the accumulator for the
 * caller to flush.
 *
 * The error code is scoped to the flush itself; the original kept an
 * uninitialised `ret` and tested it in the loop condition, which read an
 * indeterminate value whenever the first iteration did not flush.
 *
 * Returns 0 on success or the error from bch2_trans_mark_metadata_bucket().
 */
static int bch2_trans_mark_metadata_sectors(struct btree_trans *trans,
					    struct disk_reservation *res,
					    struct bch_dev *ca,
					    u64 start, u64 end,
					    enum bch_data_type type,
					    u64 *bucket, unsigned *bucket_sectors)
{
	do {
		u64 b = sector_to_bucket(ca, start);
		/* Sectors of this range that fall inside bucket b */
		unsigned sectors =
			min_t(u64, bucket_to_sector(ca, b + 1), end) - start;

		if (b != *bucket) {
			if (*bucket_sectors) {
				int ret = bch2_trans_mark_metadata_bucket(trans, res, ca,
						*bucket, type, *bucket_sectors);
				if (ret)
					return ret;
			}

			*bucket		= b;
			*bucket_sectors	= 0;
		}

		*bucket_sectors	+= sectors;
		start		+= sectors;
	} while (start < end);

	return 0;
}
static int __bch2_trans_mark_dev_sb ( struct btree_trans * trans ,
struct disk_reservation * res ,
struct bch_dev * ca )
{
struct bch_sb_layout * layout = & ca - > disk_sb . sb - > layout ;
u64 bucket = 0 ;
unsigned i , bucket_sectors = 0 ;
int ret ;
for ( i = 0 ; i < layout - > nr_superblocks ; i + + ) {
u64 offset = le64_to_cpu ( layout - > sb_offset [ i ] ) ;
if ( offset = = BCH_SB_SECTOR ) {
ret = bch2_trans_mark_metadata_sectors ( trans , res , ca ,
0 , BCH_SB_SECTOR ,
BCH_DATA_sb , & bucket , & bucket_sectors ) ;
if ( ret )
return ret ;
}
ret = bch2_trans_mark_metadata_sectors ( trans , res , ca , offset ,
offset + ( 1 < < layout - > sb_max_size_bits ) ,
BCH_DATA_sb , & bucket , & bucket_sectors ) ;
if ( ret )
return ret ;
}
if ( bucket_sectors ) {
ret = bch2_trans_mark_metadata_bucket ( trans , res , ca ,
bucket , BCH_DATA_sb , bucket_sectors ) ;
if ( ret )
return ret ;
}
for ( i = 0 ; i < ca - > journal . nr ; i + + ) {
ret = bch2_trans_mark_metadata_bucket ( trans , res , ca ,
ca - > journal . buckets [ i ] ,
BCH_DATA_journal , ca - > mi . bucket_size ) ;
if ( ret )
return ret ;
}
return 0 ;
}
/*
 * Mark the superblock and journal buckets of @ca by running
 * __bch2_trans_mark_dev_sb() through bch2_trans_do() with disk reservation
 * @res.
 *
 * Returns the result of bch2_trans_do().
 */
int bch2_trans_mark_dev_sb(struct bch_fs *c,
			   struct disk_reservation *res,
			   struct bch_dev *ca)
{
	int ret = bch2_trans_do(c, res, NULL, 0,
			__bch2_trans_mark_dev_sb(&trans, res, ca));

	return ret;
}
2017-03-16 22:18:50 -08:00
/* Disk reservations: */
/*
 * Extra sectors, on top of the request itself, that
 * bch2_disk_reservation_add() tries to move from the filesystem-wide
 * sectors_available counter into the per-cpu sectors_available count when the
 * per-cpu count cannot satisfy a reservation.
 */
# define SECTORS_CACHE 1024
int bch2_disk_reservation_add ( struct bch_fs * c , struct disk_reservation * res ,
2021-01-17 13:19:16 -05:00
u64 sectors , int flags )
2017-03-16 22:18:50 -08:00
{
2018-11-27 08:23:22 -05:00
struct bch_fs_pcpu * pcpu ;
2017-03-16 22:18:50 -08:00
u64 old , v , get ;
s64 sectors_available ;
int ret ;
2018-11-26 00:13:33 -05:00
percpu_down_read ( & c - > mark_lock ) ;
2017-03-16 22:18:50 -08:00
preempt_disable ( ) ;
2018-11-27 08:23:22 -05:00
pcpu = this_cpu_ptr ( c - > pcpu ) ;
2017-03-16 22:18:50 -08:00
2018-11-27 08:23:22 -05:00
if ( sectors < = pcpu - > sectors_available )
2017-03-16 22:18:50 -08:00
goto out ;
v = atomic64_read ( & c - > sectors_available ) ;
do {
old = v ;
get = min ( ( u64 ) sectors + SECTORS_CACHE , old ) ;
if ( get < sectors ) {
preempt_enable ( ) ;
goto recalculate ;
}
} while ( ( v = atomic64_cmpxchg ( & c - > sectors_available ,
old , old - get ) ) ! = old ) ;
2018-11-27 08:23:22 -05:00
pcpu - > sectors_available + = get ;
2017-03-16 22:18:50 -08:00
out :
2018-11-27 08:23:22 -05:00
pcpu - > sectors_available - = sectors ;
2019-02-10 19:34:47 -05:00
this_cpu_add ( * c - > online_reserved , sectors ) ;
2018-11-27 08:23:22 -05:00
res - > sectors + = sectors ;
2017-03-16 22:18:50 -08:00
preempt_enable ( ) ;
2018-11-26 00:13:33 -05:00
percpu_up_read ( & c - > mark_lock ) ;
2017-03-16 22:18:50 -08:00
return 0 ;
recalculate :
2020-12-03 14:17:33 -05:00
mutex_lock ( & c - > sectors_available_lock ) ;
2019-02-11 22:08:09 -05:00
2020-12-03 14:17:33 -05:00
percpu_u64_set ( & c - > pcpu - > sectors_available , 0 ) ;
sectors_available = avail_factor ( __bch2_fs_usage_read_short ( c ) . free ) ;
2017-03-16 22:18:50 -08:00
if ( sectors < = sectors_available | |
( flags & BCH_DISK_RESERVATION_NOFAIL ) ) {
atomic64_set ( & c - > sectors_available ,
max_t ( s64 , 0 , sectors_available - sectors ) ) ;
2019-02-10 19:34:47 -05:00
this_cpu_add ( * c - > online_reserved , sectors ) ;
2018-11-27 08:23:22 -05:00
res - > sectors + = sectors ;
2017-03-16 22:18:50 -08:00
ret = 0 ;
} else {
atomic64_set ( & c - > sectors_available , sectors_available ) ;
ret = - ENOSPC ;
}
2020-12-03 14:17:33 -05:00
mutex_unlock ( & c - > sectors_available_lock ) ;
percpu_up_read ( & c - > mark_lock ) ;
2017-03-16 22:18:50 -08:00
return ret ;
}
/* Startup/shutdown: */
static void buckets_free_rcu ( struct rcu_head * rcu )
{
struct bucket_array * buckets =
container_of ( rcu , struct bucket_array , rcu ) ;
kvpfree ( buckets ,
sizeof ( struct bucket_array ) +
buckets - > nbuckets * sizeof ( struct bucket ) ) ;
}
/*
 * Allocate (or reallocate) the per-device bucket array, buckets_nouse bitmap,
 * free fifos and alloc heap of @ca for @nbuckets buckets.
 *
 * All new structures are allocated up front.  If the device already has a
 * bucket array ("resize"), the contents of the old array and bitmap are
 * copied over under gc_lock, bucket_lock and mark_lock, and entries of the
 * old fifos are moved into the new ones under freelist_lock.  The new
 * structures are then swapped in and the old ones are freed; the old bucket
 * array is freed through call_rcu().
 *
 * Returns 0 on success or -ENOMEM if any allocation fails, in which case the
 * device is left untouched.
 */
int bch2_dev_buckets_resize(struct bch_fs *c, struct bch_dev *ca, u64 nbuckets)
{
	struct bucket_array *buckets = NULL, *old_buckets = NULL;
	unsigned long *buckets_nouse = NULL;
	alloc_fifo	free[RESERVE_NR];
	alloc_fifo	free_inc;
	alloc_heap	alloc_heap;

	size_t btree_reserve	= DIV_ROUND_UP(BTREE_NODE_RESERVE,
			     ca->mi.bucket_size / c->opts.btree_node_size);
	/* XXX: these should be tunable */
	size_t reserve_none	= max_t(size_t, 1, nbuckets >> 9);
	size_t copygc_reserve	= max_t(size_t, 2, nbuckets >> 6);
	size_t free_inc_nr	= max(max_t(size_t, 1, nbuckets >> 12),
				      btree_reserve * 2);
	bool resize = ca->buckets[0] != NULL;
	int ret = -ENOMEM;
	unsigned i;

	/* Zeroed so the cleanup at err: is safe for anything never set up */
	memset(&free,		0, sizeof(free));
	memset(&free_inc,	0, sizeof(free_inc));
	memset(&alloc_heap,	0, sizeof(alloc_heap));

	if (!(buckets		= kvpmalloc(sizeof(struct bucket_array) +
					    nbuckets * sizeof(struct bucket),
					    GFP_KERNEL|__GFP_ZERO)) ||
	    !(buckets_nouse	= kvpmalloc(BITS_TO_LONGS(nbuckets) *
					    sizeof(unsigned long),
					    GFP_KERNEL|__GFP_ZERO)) ||
	    !init_fifo(&free[RESERVE_MOVINGGC],
		       copygc_reserve, GFP_KERNEL) ||
	    !init_fifo(&free[RESERVE_NONE], reserve_none, GFP_KERNEL) ||
	    !init_fifo(&free_inc,	free_inc_nr, GFP_KERNEL) ||
	    !init_heap(&alloc_heap,	ALLOC_SCAN_BATCH(ca) << 1, GFP_KERNEL))
		goto err;

	buckets->first_bucket	= ca->mi.first_bucket;
	buckets->nbuckets	= nbuckets;

	bch2_copygc_stop(c);

	if (resize) {
		down_write(&c->gc_lock);
		down_write(&ca->bucket_lock);
		percpu_down_write(&c->mark_lock);
	}

	old_buckets = bucket_array(ca);

	if (resize) {
		/* Carry over state for the buckets present in both arrays */
		size_t n = min(buckets->nbuckets, old_buckets->nbuckets);

		memcpy(buckets->b,
		       old_buckets->b,
		       n * sizeof(struct bucket));
		memcpy(buckets_nouse,
		       ca->buckets_nouse,
		       BITS_TO_LONGS(n) * sizeof(unsigned long));
	}

	/*
	 * Publish the new array; from here on the locals hold the OLD array
	 * and bitmap, which are what gets freed below.
	 */
	rcu_assign_pointer(ca->buckets[0], buckets);
	buckets = old_buckets;

	swap(ca->buckets_nouse, buckets_nouse);

	if (resize) {
		percpu_up_write(&c->mark_lock);
		up_write(&c->gc_lock);
	}

	spin_lock(&c->freelist_lock);
	for (i = 0; i < RESERVE_NR; i++) {
		fifo_move(&free[i], &ca->free[i]);
		swap(ca->free[i], free[i]);
	}
	fifo_move(&free_inc, &ca->free_inc);
	swap(ca->free_inc, free_inc);
	spin_unlock(&c->freelist_lock);

	/* with gc lock held, alloc_heap can't be in use: */
	swap(ca->alloc_heap, alloc_heap);

	/* The bitmap freed below is now the old one, sized by the old count */
	nbuckets = ca->mi.nbuckets;

	if (resize)
		up_write(&ca->bucket_lock);

	ret = 0;
err:
	free_heap(&alloc_heap);
	free_fifo(&free_inc);
	for (i = 0; i < RESERVE_NR; i++)
		free_fifo(&free[i]);
	kvpfree(buckets_nouse,
		BITS_TO_LONGS(nbuckets) * sizeof(unsigned long));

	if (ret) {
		/*
		 * Failure: @buckets (if allocated) is the new array, which
		 * was never published and whose nbuckets field may not be
		 * set yet, so free it directly with the size it was
		 * allocated with.  old_buckets is still NULL here and must
		 * not be handed to call_rcu().
		 */
		if (buckets)
			kvpfree(buckets,
				sizeof(struct bucket_array) +
				nbuckets * sizeof(struct bucket));
	} else if (old_buckets) {
		/* Success: readers may still hold the old array */
		call_rcu(&old_buckets->rcu, buckets_free_rcu);
	}

	return ret;
}
void bch2_dev_buckets_free ( struct bch_dev * ca )
{
unsigned i ;
free_heap ( & ca - > alloc_heap ) ;
free_fifo ( & ca - > free_inc ) ;
for ( i = 0 ; i < RESERVE_NR ; i + + )
free_fifo ( & ca - > free [ i ] ) ;
2018-11-19 01:16:07 -05:00
kvpfree ( ca - > buckets_nouse ,
2017-03-16 22:18:50 -08:00
BITS_TO_LONGS ( ca - > mi . nbuckets ) * sizeof ( unsigned long ) ) ;
2018-07-23 05:32:01 -04:00
kvpfree ( rcu_dereference_protected ( ca - > buckets [ 0 ] , 1 ) ,
2017-03-16 22:18:50 -08:00
sizeof ( struct bucket_array ) +
ca - > mi . nbuckets * sizeof ( struct bucket ) ) ;
2021-01-21 21:52:06 -05:00
for ( i = 0 ; i < ARRAY_SIZE ( ca - > usage ) ; i + + )
free_percpu ( ca - > usage [ i ] ) ;
kfree ( ca - > usage_base ) ;
2017-03-16 22:18:50 -08:00
}
int bch2_dev_buckets_alloc ( struct bch_fs * c , struct bch_dev * ca )
{
2021-01-21 21:52:06 -05:00
unsigned i ;
ca - > usage_base = kzalloc ( sizeof ( struct bch_dev_usage ) , GFP_KERNEL ) ;
if ( ! ca - > usage_base )
2017-03-16 22:18:50 -08:00
return - ENOMEM ;
2021-01-21 21:52:06 -05:00
for ( i = 0 ; i < ARRAY_SIZE ( ca - > usage ) ; i + + ) {
ca - > usage [ i ] = alloc_percpu ( struct bch_dev_usage ) ;
if ( ! ca - > usage [ i ] )
return - ENOMEM ;
}
2017-03-16 22:18:50 -08:00
return bch2_dev_buckets_resize ( c , ca , ca - > mi . nbuckets ) ; ;
}