2017-03-16 22:18:50 -08:00
// SPDX-License-Identifier: GPL-2.0
/*
* Assorted bcachefs debug code
*
* Copyright 2010 , 2011 Kent Overstreet < kent . overstreet @ gmail . com >
* Copyright 2012 Google , Inc .
*/
# include "bcachefs.h"
# include "bkey_methods.h"
# include "btree_cache.h"
# include "btree_io.h"
# include "btree_iter.h"
2022-08-22 23:12:11 -04:00
# include "btree_locking.h"
2017-03-16 22:18:50 -08:00
# include "btree_update.h"
2024-04-03 19:15:53 -04:00
# include "btree_update_interior.h"
2017-03-16 22:18:50 -08:00
# include "buckets.h"
# include "debug.h"
# include "error.h"
# include "extents.h"
# include "fsck.h"
# include "inode.h"
# include "super.h"
# include <linux/console.h>
# include <linux/debugfs.h>
# include <linux/module.h>
# include <linux/random.h>
# include <linux/seq_file.h>
static struct dentry * bch_debug ;
2021-04-20 20:21:12 -04:00
static bool bch2_btree_verify_replica ( struct bch_fs * c , struct btree * b ,
struct extent_ptr_decoded pick )
2017-03-16 22:18:50 -08:00
{
struct btree * v = c - > verify_data ;
2021-04-20 20:21:12 -04:00
struct btree_node * n_ondisk = c - > verify_ondisk ;
struct btree_node * n_sorted = c - > verify_data - > data ;
struct bset * sorted , * inmemory = & b - > data - > keys ;
2017-03-16 22:18:50 -08:00
struct bio * bio ;
2023-01-03 17:32:16 -05:00
bool failed = false , saw_error = false ;
2017-03-16 22:18:50 -08:00
2024-04-30 15:37:51 -04:00
struct bch_dev * ca = bch2_dev_get_ioref ( c , pick . ptr . dev , READ ) ;
2024-05-03 12:55:55 -04:00
if ( ! ca )
2021-04-20 20:21:12 -04:00
return false ;
2017-03-16 22:18:50 -08:00
bio = bio_alloc_bioset ( ca - > disk_sb . bdev ,
2024-01-16 13:29:59 -05:00
buf_pages ( n_sorted , btree_buf_bytes ( b ) ) ,
2017-03-16 22:18:50 -08:00
REQ_OP_READ | REQ_META ,
2023-05-28 18:02:38 -04:00
GFP_NOFS ,
2017-03-16 22:18:50 -08:00
& c - > btree_bio ) ;
bio - > bi_iter . bi_sector = pick . ptr . offset ;
2024-01-16 13:29:59 -05:00
bch2_bio_map ( bio , n_sorted , btree_buf_bytes ( b ) ) ;
2017-03-16 22:18:50 -08:00
submit_bio_wait ( bio ) ;
bio_put ( bio ) ;
percpu_ref_put ( & ca - > io_ref ) ;
2024-01-16 13:29:59 -05:00
memcpy ( n_ondisk , n_sorted , btree_buf_bytes ( b ) ) ;
2017-03-16 22:18:50 -08:00
2021-04-20 20:21:12 -04:00
v - > written = 0 ;
2023-01-03 17:32:16 -05:00
if ( bch2_btree_node_read_done ( c , ca , v , false , & saw_error ) | | saw_error )
2021-04-20 20:21:12 -04:00
return false ;
2017-03-16 22:18:50 -08:00
n_sorted = c - > verify_data - > data ;
sorted = & n_sorted - > keys ;
if ( inmemory - > u64s ! = sorted - > u64s | |
memcmp ( inmemory - > start ,
sorted - > start ,
vstruct_end ( inmemory ) - ( void * ) inmemory - > start ) ) {
unsigned offset = 0 , sectors ;
struct bset * i ;
unsigned j ;
console_lock ( ) ;
printk ( KERN_ERR " *** in memory: \n " ) ;
2020-06-17 17:33:53 -04:00
bch2_dump_bset ( c , b , inmemory , 0 ) ;
2017-03-16 22:18:50 -08:00
printk ( KERN_ERR " *** read back in: \n " ) ;
2020-06-17 17:33:53 -04:00
bch2_dump_bset ( c , v , sorted , 0 ) ;
2017-03-16 22:18:50 -08:00
2021-04-20 20:21:12 -04:00
while ( offset < v - > written ) {
if ( ! offset ) {
2017-03-16 22:18:50 -08:00
i = & n_ondisk - > keys ;
sectors = vstruct_blocks ( n_ondisk , c - > block_bits ) < <
c - > block_bits ;
} else {
struct btree_node_entry * bne =
( void * ) n_ondisk + ( offset < < 9 ) ;
i = & bne - > keys ;
sectors = vstruct_blocks ( bne , c - > block_bits ) < <
c - > block_bits ;
}
printk ( KERN_ERR " *** on disk block %u: \n " , offset ) ;
2020-06-17 17:33:53 -04:00
bch2_dump_bset ( c , b , i , offset ) ;
2017-03-16 22:18:50 -08:00
offset + = sectors ;
}
for ( j = 0 ; j < le16_to_cpu ( inmemory - > u64s ) ; j + + )
if ( inmemory - > _data [ j ] ! = sorted - > _data [ j ] )
break ;
console_unlock ( ) ;
2021-04-20 20:21:12 -04:00
bch_err ( c , " verify failed at key %u " , j ) ;
failed = true ;
}
if ( v - > written ! = b - > written ) {
bch_err ( c , " written wrong: expected %u, got %u " ,
b - > written , v - > written ) ;
failed = true ;
}
return failed ;
}
void __bch2_btree_verify ( struct bch_fs * c , struct btree * b )
{
struct bkey_ptrs_c ptrs ;
struct extent_ptr_decoded p ;
const union bch_extent_entry * entry ;
struct btree * v ;
struct bset * inmemory = & b - > data - > keys ;
struct bkey_packed * k ;
bool failed = false ;
if ( c - > opts . nochanges )
return ;
2021-07-10 23:03:15 -04:00
bch2_btree_node_io_lock ( b ) ;
2021-04-20 20:21:12 -04:00
mutex_lock ( & c - > verify_lock ) ;
if ( ! c - > verify_ondisk ) {
2024-02-01 06:35:46 -05:00
c - > verify_ondisk = kvmalloc ( btree_buf_bytes ( b ) , GFP_KERNEL ) ;
2021-04-20 20:21:12 -04:00
if ( ! c - > verify_ondisk )
goto out ;
}
if ( ! c - > verify_data ) {
c - > verify_data = __bch2_btree_node_mem_alloc ( c ) ;
if ( ! c - > verify_data )
goto out ;
list_del_init ( & c - > verify_data - > list ) ;
}
BUG_ON ( b - > nsets ! = 1 ) ;
2023-03-04 23:05:55 -05:00
for ( k = inmemory - > start ; k ! = vstruct_last ( inmemory ) ; k = bkey_p_next ( k ) )
2023-09-12 18:41:22 -04:00
if ( k - > type = = KEY_TYPE_btree_ptr_v2 )
( ( struct bch_btree_ptr_v2 * ) bkeyp_val ( & b - > format , k ) ) - > mem_ptr = 0 ;
2021-04-20 20:21:12 -04:00
v = c - > verify_data ;
bkey_copy ( & v - > key , & b - > key ) ;
v - > c . level = b - > c . level ;
v - > c . btree_id = b - > c . btree_id ;
bch2_btree_keys_init ( v ) ;
ptrs = bch2_bkey_ptrs_c ( bkey_i_to_s_c ( & b - > key ) ) ;
bkey_for_each_ptr_decode ( & b - > key . k , ptrs , p , entry )
failed | = bch2_btree_verify_replica ( c , b , p ) ;
if ( failed ) {
2022-02-25 13:18:19 -05:00
struct printbuf buf = PRINTBUF ;
2021-04-20 20:21:12 -04:00
2022-02-25 13:18:19 -05:00
bch2_bkey_val_to_text ( & buf , c , bkey_i_to_s_c ( & b - > key ) ) ;
2024-03-17 21:51:19 -04:00
bch2_fs_fatal_error ( c , " : btree node verify failed for: %s \n " , buf . buf ) ;
2022-02-25 13:18:19 -05:00
printbuf_exit ( & buf ) ;
2017-03-16 22:18:50 -08:00
}
out :
mutex_unlock ( & c - > verify_lock ) ;
2021-07-10 23:03:15 -04:00
bch2_btree_node_io_unlock ( b ) ;
2017-03-16 22:18:50 -08:00
}
2023-03-06 02:53:25 -05:00
void bch2_btree_node_ondisk_to_text ( struct printbuf * out , struct bch_fs * c ,
const struct btree * b )
{
struct btree_node * n_ondisk = NULL ;
struct extent_ptr_decoded pick ;
struct bch_dev * ca ;
struct bio * bio = NULL ;
unsigned offset = 0 ;
int ret ;
if ( bch2_bkey_pick_read_device ( c , bkey_i_to_s_c ( & b - > key ) , NULL , & pick ) < = 0 ) {
prt_printf ( out , " error getting device to read from: invalid device \n " ) ;
return ;
}
2024-04-30 15:37:51 -04:00
ca = bch2_dev_get_ioref ( c , pick . ptr . dev , READ ) ;
2024-05-03 12:55:55 -04:00
if ( ! ca ) {
2023-03-06 02:53:25 -05:00
prt_printf ( out , " error getting device to read from: not online \n " ) ;
return ;
}
2024-02-01 06:35:46 -05:00
n_ondisk = kvmalloc ( btree_buf_bytes ( b ) , GFP_KERNEL ) ;
2023-03-06 02:53:25 -05:00
if ( ! n_ondisk ) {
prt_printf ( out , " memory allocation failure \n " ) ;
goto out ;
}
bio = bio_alloc_bioset ( ca - > disk_sb . bdev ,
2024-01-16 13:29:59 -05:00
buf_pages ( n_ondisk , btree_buf_bytes ( b ) ) ,
2023-03-06 02:53:25 -05:00
REQ_OP_READ | REQ_META ,
2023-05-28 18:02:38 -04:00
GFP_NOFS ,
2023-03-06 02:53:25 -05:00
& c - > btree_bio ) ;
bio - > bi_iter . bi_sector = pick . ptr . offset ;
2024-01-16 13:29:59 -05:00
bch2_bio_map ( bio , n_ondisk , btree_buf_bytes ( b ) ) ;
2023-03-06 02:53:25 -05:00
ret = submit_bio_wait ( bio ) ;
if ( ret ) {
prt_printf ( out , " IO error reading btree node: %s \n " , bch2_err_str ( ret ) ) ;
goto out ;
}
while ( offset < btree_sectors ( c ) ) {
struct bset * i ;
struct nonce nonce ;
struct bch_csum csum ;
struct bkey_packed * k ;
unsigned sectors ;
if ( ! offset ) {
i = & n_ondisk - > keys ;
if ( ! bch2_checksum_type_valid ( c , BSET_CSUM_TYPE ( i ) ) ) {
prt_printf ( out , " unknown checksum type at offset %u: %llu \n " ,
offset , BSET_CSUM_TYPE ( i ) ) ;
goto out ;
}
nonce = btree_nonce ( i , offset < < 9 ) ;
csum = csum_vstruct ( c , BSET_CSUM_TYPE ( i ) , nonce , n_ondisk ) ;
if ( bch2_crc_cmp ( csum , n_ondisk - > csum ) ) {
prt_printf ( out , " invalid checksum \n " ) ;
goto out ;
}
bset_encrypt ( c , i , offset < < 9 ) ;
sectors = vstruct_sectors ( n_ondisk , c - > block_bits ) ;
} else {
struct btree_node_entry * bne = ( void * ) n_ondisk + ( offset < < 9 ) ;
i = & bne - > keys ;
if ( i - > seq ! = n_ondisk - > keys . seq )
break ;
if ( ! bch2_checksum_type_valid ( c , BSET_CSUM_TYPE ( i ) ) ) {
prt_printf ( out , " unknown checksum type at offset %u: %llu \n " ,
offset , BSET_CSUM_TYPE ( i ) ) ;
goto out ;
}
nonce = btree_nonce ( i , offset < < 9 ) ;
csum = csum_vstruct ( c , BSET_CSUM_TYPE ( i ) , nonce , bne ) ;
if ( bch2_crc_cmp ( csum , bne - > csum ) ) {
prt_printf ( out , " invalid checksum " ) ;
goto out ;
}
bset_encrypt ( c , i , offset < < 9 ) ;
sectors = vstruct_sectors ( bne , c - > block_bits ) ;
}
prt_printf ( out , " offset %u version %u, journal seq %llu \n " ,
offset ,
le16_to_cpu ( i - > version ) ,
le64_to_cpu ( i - > journal_seq ) ) ;
offset + = sectors ;
printbuf_indent_add ( out , 4 ) ;
for ( k = i - > start ; k ! = vstruct_last ( i ) ; k = bkey_p_next ( k ) ) {
struct bkey u ;
bch2_bkey_val_to_text ( out , c , bkey_disassemble ( b , k , & u ) ) ;
prt_newline ( out ) ;
}
printbuf_indent_sub ( out , 4 ) ;
}
out :
if ( bio )
bio_put ( bio ) ;
2024-02-01 06:35:46 -05:00
kvfree ( n_ondisk ) ;
2023-03-06 02:53:25 -05:00
percpu_ref_put ( & ca - > io_ref ) ;
}
2017-03-16 22:18:50 -08:00
# ifdef CONFIG_DEBUG_FS
/* XXX: bch_fs refcounting */
struct dump_iter {
2022-02-26 11:48:34 -05:00
struct bch_fs * c ;
2017-03-16 22:18:50 -08:00
enum btree_id id ;
2022-02-26 11:48:34 -05:00
struct bpos from ;
2022-07-20 16:50:26 -04:00
struct bpos prev_node ;
2022-02-26 11:48:34 -05:00
u64 iter ;
2017-03-16 22:18:50 -08:00
2022-02-25 13:18:19 -05:00
struct printbuf buf ;
2017-03-16 22:18:50 -08:00
char __user * ubuf ; /* destination user buffer */
size_t size ; /* size of requested read */
ssize_t ret ; /* bytes read so far */
} ;
2022-08-14 16:11:35 -04:00
static ssize_t flush_buf ( struct dump_iter * i )
2017-03-16 22:18:50 -08:00
{
2022-02-25 13:18:19 -05:00
if ( i - > buf . pos ) {
size_t bytes = min_t ( size_t , i - > buf . pos , i - > size ) ;
2023-09-19 17:09:22 -04:00
int copied = bytes - copy_to_user ( i - > ubuf , i - > buf . buf , bytes ) ;
2017-03-16 22:18:50 -08:00
2023-09-19 17:09:22 -04:00
i - > ret + = copied ;
i - > ubuf + = copied ;
i - > size - = copied ;
i - > buf . pos - = copied ;
memmove ( i - > buf . buf , i - > buf . buf + copied , i - > buf . pos ) ;
2017-03-16 22:18:50 -08:00
2023-09-19 17:09:22 -04:00
if ( copied ! = bytes )
return - EFAULT ;
2017-03-16 22:18:50 -08:00
}
2022-08-14 16:11:35 -04:00
return i - > size ? 0 : i - > ret ;
2017-03-16 22:18:50 -08:00
}
static int bch2_dump_open ( struct inode * inode , struct file * file )
{
struct btree_debug * bd = inode - > i_private ;
struct dump_iter * i ;
i = kzalloc ( sizeof ( struct dump_iter ) , GFP_KERNEL ) ;
if ( ! i )
return - ENOMEM ;
file - > private_data = i ;
i - > from = POS_MIN ;
2022-02-26 11:48:34 -05:00
i - > iter = 0 ;
2017-03-16 22:18:50 -08:00
i - > c = container_of ( bd , struct bch_fs , btree_debug [ bd - > id ] ) ;
i - > id = bd - > id ;
2022-02-25 13:18:19 -05:00
i - > buf = PRINTBUF ;
2017-03-16 22:18:50 -08:00
return 0 ;
}
static int bch2_dump_release ( struct inode * inode , struct file * file )
{
2022-02-25 13:18:19 -05:00
struct dump_iter * i = file - > private_data ;
printbuf_exit ( & i - > buf ) ;
kfree ( i ) ;
2017-03-16 22:18:50 -08:00
return 0 ;
}
static ssize_t bch2_read_btree ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
2023-12-16 22:30:09 -05:00
return flush_buf ( i ) ? :
bch2_trans_run ( i - > c ,
for_each_btree_key ( trans , iter , i - > id , i - > from ,
2024-04-07 18:05:34 -04:00
BTREE_ITER_prefetch |
BTREE_ITER_all_snapshots , k , ( {
2023-12-16 22:30:09 -05:00
bch2_bkey_val_to_text ( & i - > buf , i - > c , k ) ;
prt_newline ( & i - > buf ) ;
bch2_trans_unlock ( trans ) ;
i - > from = bpos_successor ( iter . pos ) ;
flush_buf ( i ) ;
} ) ) ) ? :
i - > ret ;
2017-03-16 22:18:50 -08:00
}
static const struct file_operations btree_debug_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_read_btree ,
} ;
static ssize_t bch2_read_btree_formats ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
2023-09-12 17:16:02 -04:00
struct btree_trans * trans ;
2021-08-30 15:18:31 -04:00
struct btree_iter iter ;
2017-03-16 22:18:50 -08:00
struct btree * b ;
2022-08-14 16:11:35 -04:00
ssize_t ret ;
2017-03-16 22:18:50 -08:00
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
2022-08-14 16:11:35 -04:00
ret = flush_buf ( i ) ;
if ( ret )
return ret ;
2017-03-16 22:18:50 -08:00
2022-11-24 03:12:22 -05:00
if ( bpos_eq ( SPOS_MAX , i - > from ) )
2017-03-16 22:18:50 -08:00
return i - > ret ;
2023-09-12 17:16:02 -04:00
trans = bch2_trans_get ( i - > c ) ;
2023-06-21 06:44:44 -04:00
retry :
2023-09-12 17:16:02 -04:00
bch2_trans_begin ( trans ) ;
2019-03-25 15:10:15 -04:00
2023-09-12 17:16:02 -04:00
for_each_btree_node ( trans , iter , i - > id , i - > from , 0 , b , ret ) {
2022-08-14 16:11:35 -04:00
bch2_btree_node_to_text ( & i - > buf , i - > c , b ) ;
2022-11-24 03:12:22 -05:00
i - > from = ! bpos_eq ( SPOS_MAX , b - > key . k . p )
bcachefs: Start using bpos.snapshot field
This patch starts treating the bpos.snapshot field like part of the key
in the btree code:
* bpos_successor() and bpos_predecessor() now include the snapshot field
* Keys in btrees that will be using snapshots (extents, inodes, dirents
and xattrs) now always have their snapshot field set to U32_MAX
The btree iterator code gets a new flag, BTREE_ITER_ALL_SNAPSHOTS, that
determines whether we're iterating over keys in all snapshots or not -
internally, this controlls whether bkey_(successor|predecessor)
increment/decrement the snapshot field, or only the higher bits of the
key.
We add a new member to struct btree_iter, iter->snapshot: when
BTREE_ITER_ALL_SNAPSHOTS is not set, iter->pos.snapshot should always
equal iter->snapshot, which will be 0 for btrees that don't use
snapshots, and alsways U32_MAX for btrees that will use snapshots
(until we enable snapshot creation).
This patch also introduces a new metadata version number, and compat
code for reading from/writing to older versions - this isn't a forced
upgrade (yet).
Signed-off-by: Kent Overstreet <kent.overstreet@gmail.com>
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2021-03-24 18:02:16 -04:00
? bpos_successor ( b - > key . k . p )
2017-03-16 22:18:50 -08:00
: b - > key . k . p ;
2023-06-21 06:44:44 -04:00
2023-09-12 17:16:02 -04:00
ret = drop_locks_do ( trans , flush_buf ( i ) ) ;
2023-06-21 06:44:44 -04:00
if ( ret )
break ;
2017-03-16 22:18:50 -08:00
}
2023-09-12 17:16:02 -04:00
bch2_trans_iter_exit ( trans , & iter ) ;
2021-03-19 20:29:11 -04:00
2023-06-21 06:44:44 -04:00
if ( bch2_err_matches ( ret , BCH_ERR_transaction_restart ) )
goto retry ;
2023-09-12 17:16:02 -04:00
bch2_trans_put ( trans ) ;
2017-03-16 22:18:50 -08:00
2022-08-14 16:11:35 -04:00
if ( ! ret )
ret = flush_buf ( i ) ;
return ret ? : i - > ret ;
2017-03-16 22:18:50 -08:00
}
static const struct file_operations btree_format_debug_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_read_btree_formats ,
} ;
static ssize_t bch2_read_bfloat_failed ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
2023-12-16 22:30:09 -05:00
return flush_buf ( i ) ? :
bch2_trans_run ( i - > c ,
for_each_btree_key ( trans , iter , i - > id , i - > from ,
2024-04-07 18:05:34 -04:00
BTREE_ITER_prefetch |
BTREE_ITER_all_snapshots , k , ( {
2023-12-04 00:39:38 -05:00
struct btree_path_level * l =
& btree_iter_path ( trans , & iter ) - > l [ 0 ] ;
2023-12-16 22:30:09 -05:00
struct bkey_packed * _k =
bch2_btree_node_iter_peek ( & l - > iter , l - > b ) ;
if ( bpos_gt ( l - > b - > key . k . p , i - > prev_node ) ) {
bch2_btree_node_to_text ( & i - > buf , i - > c , l - > b ) ;
i - > prev_node = l - > b - > key . k . p ;
}
bch2_bfloat_to_text ( & i - > buf , l - > b , _k ) ;
bch2_trans_unlock ( trans ) ;
i - > from = bpos_successor ( iter . pos ) ;
flush_buf ( i ) ;
} ) ) ) ? :
i - > ret ;
2017-03-16 22:18:50 -08:00
}
static const struct file_operations bfloat_failed_debug_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_read_bfloat_failed ,
} ;
2022-02-26 11:48:34 -05:00
static void bch2_cached_btree_node_to_text ( struct printbuf * out , struct bch_fs * c ,
struct btree * b )
{
2023-02-03 21:01:40 -05:00
if ( ! out - > nr_tabstops )
printbuf_tabstop_push ( out , 32 ) ;
2022-02-26 11:48:34 -05:00
2024-04-10 16:08:24 -04:00
prt_printf ( out , " %px btree=%s l=%u \n " , b , bch2_btree_id_str ( b - > c . btree_id ) , b - > c . level ) ;
2022-02-26 11:48:34 -05:00
2023-02-03 21:01:40 -05:00
printbuf_indent_add ( out , 2 ) ;
2022-02-26 11:48:34 -05:00
bch2_bkey_val_to_text ( out , c , bkey_i_to_s_c ( & b - > key ) ) ;
2023-02-03 21:01:40 -05:00
prt_newline ( out ) ;
2024-04-10 16:08:24 -04:00
prt_printf ( out , " flags: \t " ) ;
2023-02-03 21:01:40 -05:00
prt_bitflags ( out , bch2_btree_node_flags , b - > flags ) ;
prt_newline ( out ) ;
2024-04-10 16:08:24 -04:00
prt_printf ( out , " pcpu read locks: \t %u \n " , b - > c . lock . readers ! = NULL ) ;
prt_printf ( out , " written: \t %u \n " , b - > written ) ;
prt_printf ( out , " writes blocked: \t %u \n " , ! list_empty_careful ( & b - > write_blocked ) ) ;
prt_printf ( out , " will make reachable: \t %lx \n " , b - > will_make_reachable ) ;
2023-02-03 21:01:40 -05:00
2024-04-10 16:08:24 -04:00
prt_printf ( out , " journal pin %px: \t %llu \n " ,
& b - > writes [ 0 ] . journal , b - > writes [ 0 ] . journal . seq ) ;
prt_printf ( out , " journal pin %px: \t %llu \n " ,
& b - > writes [ 1 ] . journal , b - > writes [ 1 ] . journal . seq ) ;
2023-02-03 21:01:40 -05:00
printbuf_indent_sub ( out , 2 ) ;
2022-02-26 11:48:34 -05:00
}
static ssize_t bch2_cached_btree_nodes_read ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
struct bch_fs * c = i - > c ;
bool done = false ;
2022-08-14 16:11:35 -04:00
ssize_t ret = 0 ;
2022-02-26 11:48:34 -05:00
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
do {
struct bucket_table * tbl ;
struct rhash_head * pos ;
struct btree * b ;
2022-08-14 16:11:35 -04:00
ret = flush_buf ( i ) ;
if ( ret )
return ret ;
2022-02-26 11:48:34 -05:00
rcu_read_lock ( ) ;
i - > buf . atomic + + ;
tbl = rht_dereference_rcu ( c - > btree_cache . table . tbl ,
& c - > btree_cache . table ) ;
if ( i - > iter < tbl - > size ) {
rht_for_each_entry_rcu ( b , pos , tbl , i - > iter , hash )
bch2_cached_btree_node_to_text ( & i - > buf , c , b ) ;
2022-10-19 18:31:33 -04:00
i - > iter + + ;
2022-02-26 11:48:34 -05:00
} else {
done = true ;
}
- - i - > buf . atomic ;
rcu_read_unlock ( ) ;
} while ( ! done ) ;
if ( i - > buf . allocation_failure )
2022-08-14 16:11:35 -04:00
ret = - ENOMEM ;
if ( ! ret )
ret = flush_buf ( i ) ;
2022-02-26 11:48:34 -05:00
2022-08-14 16:11:35 -04:00
return ret ? : i - > ret ;
2022-02-26 11:48:34 -05:00
}
static const struct file_operations cached_btree_nodes_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_cached_btree_nodes_read ,
} ;
2024-06-22 22:11:01 -04:00
typedef int ( * list_cmp_fn ) ( const struct list_head * l , const struct list_head * r ) ;
static void list_sort ( struct list_head * head , list_cmp_fn cmp )
{
struct list_head * pos ;
list_for_each ( pos , head )
while ( ! list_is_last ( pos , head ) & &
cmp ( pos , pos - > next ) > 0 ) {
struct list_head * pos2 , * next = pos - > next ;
list_del ( next ) ;
list_for_each ( pos2 , head )
if ( cmp ( next , pos2 ) < 0 )
goto pos_found ;
BUG ( ) ;
pos_found :
list_add_tail ( next , pos2 ) ;
}
}
static int list_ptr_order_cmp ( const struct list_head * l , const struct list_head * r )
{
return cmp_int ( l , r ) ;
}
2022-06-17 20:12:02 -04:00
static ssize_t bch2_btree_transactions_read ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
struct bch_fs * c = i - > c ;
struct btree_trans * trans ;
2022-08-14 16:11:35 -04:00
ssize_t ret = 0 ;
2022-06-17 20:12:02 -04:00
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
2023-06-19 21:01:13 -04:00
restart :
seqmutex_lock ( & c - > btree_trans_lock ) ;
2024-06-22 22:11:01 -04:00
list_sort ( & c - > btree_trans_list , list_ptr_order_cmp ) ;
2023-12-11 11:11:22 -05:00
2024-06-22 22:11:01 -04:00
list_for_each_entry ( trans , & c - > btree_trans_list , list ) {
2024-06-28 21:08:01 -04:00
if ( ( ulong ) trans < = i - > iter )
2022-06-17 20:12:02 -04:00
continue ;
2024-06-22 22:11:01 -04:00
i - > iter = ( ulong ) trans ;
2024-06-22 22:02:09 -04:00
if ( ! closure_get_not_zero ( & trans - > ref ) )
continue ;
2023-06-19 21:01:13 -04:00
2024-06-22 22:02:09 -04:00
u32 seq = seqmutex_unlock ( & c - > btree_trans_lock ) ;
2022-06-17 20:12:02 -04:00
bch2_btree_trans_to_text ( & i - > buf , trans ) ;
2024-04-10 16:08:24 -04:00
prt_printf ( & i - > buf , " backtrace: \n " ) ;
2022-06-17 20:12:02 -04:00
printbuf_indent_add ( & i - > buf , 2 ) ;
2024-06-22 22:11:01 -04:00
bch2_prt_task_backtrace ( & i - > buf , trans - > locking_wait . task , 0 , GFP_KERNEL ) ;
2022-06-17 20:12:02 -04:00
printbuf_indent_sub ( & i - > buf , 2 ) ;
prt_newline ( & i - > buf ) ;
2023-06-19 21:01:13 -04:00
closure_put ( & trans - > ref ) ;
2024-06-22 22:02:09 -04:00
ret = flush_buf ( i ) ;
if ( ret )
goto unlocked ;
2023-06-19 21:01:13 -04:00
if ( ! seqmutex_relock ( & c - > btree_trans_lock , seq ) )
goto restart ;
}
seqmutex_unlock ( & c - > btree_trans_lock ) ;
unlocked :
2022-06-17 20:12:02 -04:00
if ( i - > buf . allocation_failure )
2022-08-14 16:11:35 -04:00
ret = - ENOMEM ;
if ( ! ret )
ret = flush_buf ( i ) ;
2022-06-17 20:12:02 -04:00
2022-08-14 16:11:35 -04:00
return ret ? : i - > ret ;
2022-06-17 20:12:02 -04:00
}
static const struct file_operations btree_transactions_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_btree_transactions_read ,
} ;
2022-02-26 11:48:34 -05:00
static ssize_t bch2_journal_pins_read ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
struct bch_fs * c = i - > c ;
bool done = false ;
int err ;
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
2024-04-03 19:15:53 -04:00
while ( 1 ) {
2022-02-26 11:48:34 -05:00
err = flush_buf ( i ) ;
if ( err )
return err ;
if ( ! i - > size )
break ;
2024-04-03 19:15:53 -04:00
if ( done )
break ;
2022-02-26 11:48:34 -05:00
done = bch2_journal_seq_pins_to_text ( & i - > buf , & c - > journal , & i - > iter ) ;
i - > iter + + ;
2024-04-03 19:15:53 -04:00
}
2022-02-26 11:48:34 -05:00
if ( i - > buf . allocation_failure )
return - ENOMEM ;
return i - > ret ;
}
static const struct file_operations journal_pins_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_journal_pins_read ,
} ;
2024-04-03 19:15:53 -04:00
static ssize_t bch2_btree_updates_read ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
struct bch_fs * c = i - > c ;
int err ;
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
if ( ! i - > iter ) {
bch2_btree_updates_to_text ( & i - > buf , c ) ;
i - > iter + + ;
}
err = flush_buf ( i ) ;
if ( err )
return err ;
if ( i - > buf . allocation_failure )
return - ENOMEM ;
return i - > ret ;
}
static const struct file_operations btree_updates_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_btree_updates_read ,
} ;
2023-12-23 22:43:33 -05:00
static int btree_transaction_stats_open ( struct inode * inode , struct file * file )
2022-07-14 20:33:09 +12:00
{
struct bch_fs * c = inode - > i_private ;
struct dump_iter * i ;
i = kzalloc ( sizeof ( struct dump_iter ) , GFP_KERNEL ) ;
if ( ! i )
return - ENOMEM ;
2023-12-23 22:43:33 -05:00
i - > iter = 1 ;
2022-07-14 20:33:09 +12:00
i - > c = c ;
i - > buf = PRINTBUF ;
file - > private_data = i ;
return 0 ;
}
2023-12-23 22:43:33 -05:00
static int btree_transaction_stats_release ( struct inode * inode , struct file * file )
2022-07-14 20:33:09 +12:00
{
struct dump_iter * i = file - > private_data ;
printbuf_exit ( & i - > buf ) ;
kfree ( i ) ;
return 0 ;
}
2023-12-23 22:43:33 -05:00
static ssize_t btree_transaction_stats_read ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
2022-07-14 20:33:09 +12:00
{
struct dump_iter * i = file - > private_data ;
2022-08-11 19:36:24 -04:00
struct bch_fs * c = i - > c ;
2022-07-14 20:33:09 +12:00
int err ;
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
2022-08-11 21:06:02 -04:00
while ( 1 ) {
2022-08-11 19:36:24 -04:00
struct btree_transaction_stats * s = & c - > btree_transaction_stats [ i - > iter ] ;
2022-07-14 20:33:09 +12:00
err = flush_buf ( i ) ;
if ( err )
return err ;
if ( ! i - > size )
break ;
2022-10-17 07:03:11 -04:00
if ( i - > iter = = ARRAY_SIZE ( bch2_btree_transaction_fns ) | |
! bch2_btree_transaction_fns [ i - > iter ] )
2022-08-11 21:06:02 -04:00
break ;
2024-04-10 16:08:24 -04:00
prt_printf ( & i - > buf , " %s: \n " , bch2_btree_transaction_fns [ i - > iter ] ) ;
2022-08-11 19:36:24 -04:00
printbuf_indent_add ( & i - > buf , 2 ) ;
2022-08-11 20:14:54 -04:00
mutex_lock ( & s - > lock ) ;
2024-04-10 16:08:24 -04:00
prt_printf ( & i - > buf , " Max mem used: %u \n " , s - > max_mem ) ;
prt_printf ( & i - > buf , " Transaction duration: \n " ) ;
2023-12-23 22:43:33 -05:00
printbuf_indent_add ( & i - > buf , 2 ) ;
bch2_time_stats_to_text ( & i - > buf , & s - > duration ) ;
printbuf_indent_sub ( & i - > buf , 2 ) ;
2022-08-11 20:14:54 -04:00
if ( IS_ENABLED ( CONFIG_BCACHEFS_LOCK_TIME_STATS ) ) {
2024-04-10 16:08:24 -04:00
prt_printf ( & i - > buf , " Lock hold times: \n " ) ;
2022-08-11 20:14:54 -04:00
printbuf_indent_add ( & i - > buf , 2 ) ;
bch2_time_stats_to_text ( & i - > buf , & s - > lock_hold_times ) ;
printbuf_indent_sub ( & i - > buf , 2 ) ;
}
if ( s - > max_paths_text ) {
2024-04-10 16:08:24 -04:00
prt_printf ( & i - > buf , " Maximum allocated btree paths (%u): \n " , s - > nr_max_paths ) ;
2022-08-11 20:14:54 -04:00
printbuf_indent_add ( & i - > buf , 2 ) ;
prt_str_indented ( & i - > buf , s - > max_paths_text ) ;
printbuf_indent_sub ( & i - > buf , 2 ) ;
}
mutex_unlock ( & s - > lock ) ;
2022-08-11 19:36:24 -04:00
printbuf_indent_sub ( & i - > buf , 2 ) ;
2022-07-14 20:33:09 +12:00
prt_newline ( & i - > buf ) ;
i - > iter + + ;
}
if ( i - > buf . allocation_failure )
return - ENOMEM ;
return i - > ret ;
}
2023-12-23 22:43:33 -05:00
static const struct file_operations btree_transaction_stats_op = {
. owner = THIS_MODULE ,
. open = btree_transaction_stats_open ,
. release = btree_transaction_stats_release ,
. read = btree_transaction_stats_read ,
2022-07-14 20:33:09 +12:00
} ;
2024-06-22 20:59:09 -04:00
/* walk btree transactions until we find a deadlock and print it */
static void btree_deadlock_to_text ( struct printbuf * out , struct bch_fs * c )
2022-08-22 23:12:11 -04:00
{
struct btree_trans * trans ;
2024-06-28 21:08:01 -04:00
ulong iter = 0 ;
2023-06-19 21:01:13 -04:00
restart :
seqmutex_lock ( & c - > btree_trans_lock ) ;
2024-06-28 21:08:01 -04:00
list_sort ( & c - > btree_trans_list , list_ptr_order_cmp ) ;
2023-12-11 11:11:22 -05:00
2024-06-28 21:08:01 -04:00
list_for_each_entry ( trans , & c - > btree_trans_list , list ) {
if ( ( ulong ) trans < = iter )
2022-10-02 01:41:08 -04:00
continue ;
2024-06-28 21:08:01 -04:00
iter = ( ulong ) trans ;
2024-06-22 20:59:09 -04:00
2024-06-22 22:02:09 -04:00
if ( ! closure_get_not_zero ( & trans - > ref ) )
continue ;
2023-06-19 21:01:13 -04:00
2024-06-22 20:59:09 -04:00
u32 seq = seqmutex_unlock ( & c - > btree_trans_lock ) ;
2022-10-02 01:41:08 -04:00
2024-06-22 20:59:09 -04:00
bool found = bch2_check_for_deadlock ( trans , out ) ! = 0 ;
2023-06-19 21:01:13 -04:00
closure_put ( & trans - > ref ) ;
2024-06-22 20:59:09 -04:00
if ( found )
return ;
2023-06-19 21:01:13 -04:00
if ( ! seqmutex_relock ( & c - > btree_trans_lock , seq ) )
goto restart ;
2022-10-02 01:41:08 -04:00
}
2023-06-19 21:01:13 -04:00
seqmutex_unlock ( & c - > btree_trans_lock ) ;
2024-06-22 20:59:09 -04:00
}
static ssize_t bch2_btree_deadlock_read ( struct file * file , char __user * buf ,
size_t size , loff_t * ppos )
{
struct dump_iter * i = file - > private_data ;
struct bch_fs * c = i - > c ;
ssize_t ret = 0 ;
i - > ubuf = buf ;
i - > size = size ;
i - > ret = 0 ;
if ( ! i - > iter ) {
btree_deadlock_to_text ( & i - > buf , c ) ;
i - > iter + + ;
}
2022-08-22 23:12:11 -04:00
if ( i - > buf . allocation_failure )
ret = - ENOMEM ;
if ( ! ret )
ret = flush_buf ( i ) ;
return ret ? : i - > ret ;
}
static const struct file_operations btree_deadlock_ops = {
. owner = THIS_MODULE ,
. open = bch2_dump_open ,
. release = bch2_dump_release ,
. read = bch2_btree_deadlock_read ,
} ;
2017-03-16 22:18:50 -08:00
void bch2_fs_debug_exit ( struct bch_fs * c )
{
2022-02-26 11:48:34 -05:00
if ( ! IS_ERR_OR_NULL ( c - > fs_debug_dir ) )
debugfs_remove_recursive ( c - > fs_debug_dir ) ;
2017-03-16 22:18:50 -08:00
}
2024-03-14 10:02:18 -06:00
static void bch2_fs_debug_btree_init ( struct bch_fs * c , struct btree_debug * bd )
{
struct dentry * d ;
d = debugfs_create_dir ( bch2_btree_id_str ( bd - > id ) , c - > btree_debug_dir ) ;
debugfs_create_file ( " keys " , 0400 , d , bd , & btree_debug_ops ) ;
debugfs_create_file ( " formats " , 0400 , d , bd , & btree_format_debug_ops ) ;
debugfs_create_file ( " bfloat-failed " , 0400 , d , bd ,
& bfloat_failed_debug_ops ) ;
}
2017-03-16 22:18:50 -08:00
void bch2_fs_debug_init ( struct bch_fs * c )
{
struct btree_debug * bd ;
char name [ 100 ] ;
if ( IS_ERR_OR_NULL ( bch_debug ) )
return ;
snprintf ( name , sizeof ( name ) , " %pU " , c - > sb . user_uuid . b ) ;
2022-02-26 11:48:34 -05:00
c - > fs_debug_dir = debugfs_create_dir ( name , bch_debug ) ;
if ( IS_ERR_OR_NULL ( c - > fs_debug_dir ) )
return ;
debugfs_create_file ( " cached_btree_nodes " , 0400 , c - > fs_debug_dir ,
c - > btree_debug , & cached_btree_nodes_ops ) ;
2022-06-17 20:12:02 -04:00
debugfs_create_file ( " btree_transactions " , 0400 , c - > fs_debug_dir ,
c - > btree_debug , & btree_transactions_ops ) ;
2022-02-26 11:48:34 -05:00
debugfs_create_file ( " journal_pins " , 0400 , c - > fs_debug_dir ,
c - > btree_debug , & journal_pins_ops ) ;
2024-04-03 19:15:53 -04:00
debugfs_create_file ( " btree_updates " , 0400 , c - > fs_debug_dir ,
c - > btree_debug , & btree_updates_ops ) ;
2022-08-11 20:14:54 -04:00
debugfs_create_file ( " btree_transaction_stats " , 0400 , c - > fs_debug_dir ,
2023-12-23 22:43:33 -05:00
c , & btree_transaction_stats_op ) ;
2022-07-14 20:33:09 +12:00
2022-08-22 23:12:11 -04:00
debugfs_create_file ( " btree_deadlock " , 0400 , c - > fs_debug_dir ,
c - > btree_debug , & btree_deadlock_ops ) ;
2022-02-26 11:48:34 -05:00
c - > btree_debug_dir = debugfs_create_dir ( " btrees " , c - > fs_debug_dir ) ;
if ( IS_ERR_OR_NULL ( c - > btree_debug_dir ) )
2017-03-16 22:18:50 -08:00
return ;
for ( bd = c - > btree_debug ;
bd < c - > btree_debug + ARRAY_SIZE ( c - > btree_debug ) ;
bd + + ) {
bd - > id = bd - c - > btree_debug ;
2024-03-14 10:02:18 -06:00
bch2_fs_debug_btree_init ( c , bd ) ;
2017-03-16 22:18:50 -08:00
}
}
# endif
void bch2_debug_exit ( void )
{
if ( ! IS_ERR_OR_NULL ( bch_debug ) )
debugfs_remove_recursive ( bch_debug ) ;
}
int __init bch2_debug_init ( void )
{
bch_debug = debugfs_create_dir ( " bcachefs " , NULL ) ;
2024-01-03 13:44:43 -05:00
return 0 ;
2017-03-16 22:18:50 -08:00
}