2001-12-11 14:42:30 +03:00
/*
2004-03-30 23:35:44 +04:00
* Copyright ( C ) 2002 - 2004 Sistina Software , Inc . All rights reserved .
2018-04-20 18:43:50 +03:00
* Copyright ( C ) 2004 - 2007 Red Hat , Inc . All rights reserved .
2001-12-11 14:42:30 +03:00
*
2004-03-30 23:35:44 +04:00
* This file is part of LVM2 .
*
* This copyrighted material is made available to anyone wishing to use ,
* modify , copy , or redistribute it subject to the terms and conditions
2007-08-21 00:55:30 +04:00
* of the GNU Lesser General Public License v .2 .1 .
2004-03-30 23:35:44 +04:00
*
2007-08-21 00:55:30 +04:00
* You should have received a copy of the GNU Lesser General Public License
2004-03-30 23:35:44 +04:00
* along with this program ; if not , write to the Free Software Foundation ,
2016-01-21 13:49:46 +03:00
* Inc . , 51 Franklin Street , Fifth Floor , Boston , MA 02110 - 1301 USA
2001-12-11 14:42:30 +03:00
*/
2018-06-08 15:40:53 +03:00
# include "base/memory/zalloc.h"
2018-05-14 12:30:20 +03:00
# include "lib/misc/lib.h"
# include "lib/label/label.h"
# include "lib/misc/crc.h"
# include "lib/mm/xlate.h"
# include "lib/cache/lvmcache.h"
# include "lib/device/bcache.h"
# include "lib/commands/toolcontext.h"
# include "lib/activate/activate.h"
2018-12-07 23:35:22 +03:00
# include "lib/label/hints.h"
2019-03-04 21:13:09 +03:00
# include "lib/metadata/metadata.h"
2002-11-18 17:04:08 +03:00
# include <sys/stat.h>
# include <fcntl.h>
# include <unistd.h>
2018-06-08 15:40:53 +03:00
# include <sys/types.h>
2002-11-18 17:04:08 +03:00
/* FIXME Allow for larger labels? Restricted to single sector currently */
2001-12-11 14:42:30 +03:00
2019-03-04 21:13:09 +03:00
/*
 * Size in bytes of the bcache as computed by _setup_bcache()
 * (number of cache blocks * block size in sectors * 512).
 */
static uint64_t _current_bcache_size_bytes ;
2002-01-10 18:01:58 +03:00
/*
* Internal labeller struct .
*/
struct labeller_i {
2008-11-04 01:14:30 +03:00
struct dm_list list ;
2001-12-11 14:42:30 +03:00
2002-01-10 18:01:58 +03:00
struct labeller * l ;
char name [ 0 ] ;
} ;
2001-12-13 11:40:47 +03:00
2008-11-04 01:14:30 +03:00
/*
 * Registry of label handlers: a list of struct labeller_i entries.
 * Initialised by label_init(), filled by label_register_handler(),
 * and emptied again by label_exit().
 */
static struct dm_list _labellers ;
2001-12-11 14:42:30 +03:00
2002-01-10 18:01:58 +03:00
static struct labeller_i * _alloc_li ( const char * name , struct labeller * l )
2001-12-11 14:42:30 +03:00
{
2002-01-10 18:01:58 +03:00
struct labeller_i * li ;
size_t len ;
2001-12-11 14:42:30 +03:00
2002-01-10 18:01:58 +03:00
len = sizeof ( * li ) + strlen ( name ) + 1 ;
2001-12-11 14:42:30 +03:00
2018-06-08 15:40:53 +03:00
if ( ! ( li = malloc ( len ) ) ) {
2002-01-16 03:01:36 +03:00
log_error ( " Couldn't allocate memory for labeller list object. " ) ;
2002-01-10 18:01:58 +03:00
return NULL ;
}
li - > l = l ;
strcpy ( li - > name , name ) ;
return li ;
2001-12-12 12:05:44 +03:00
}
2001-12-11 14:42:30 +03:00
2002-01-10 18:01:58 +03:00
int label_init ( void )
{
2008-11-04 01:14:30 +03:00
dm_list_init ( & _labellers ) ;
2002-01-10 19:48:28 +03:00
return 1 ;
2001-12-11 14:42:30 +03:00
}
2002-01-10 18:01:58 +03:00
void label_exit ( void )
2001-12-14 16:15:15 +03:00
{
2012-02-08 15:12:18 +04:00
struct labeller_i * li , * tli ;
2002-01-10 18:01:58 +03:00
2012-02-08 15:12:18 +04:00
dm_list_iterate_items_safe ( li , tli , & _labellers ) {
dm_list_del ( & li - > list ) ;
2002-11-18 17:04:08 +03:00
li - > l - > ops - > destroy ( li - > l ) ;
2018-06-08 15:40:53 +03:00
free ( li ) ;
2002-01-10 18:01:58 +03:00
}
2004-05-05 01:25:57 +04:00
2008-11-04 01:14:30 +03:00
dm_list_init ( & _labellers ) ;
2001-12-14 16:15:15 +03:00
}
2013-07-29 17:58:18 +04:00
int label_register_handler ( struct labeller * handler )
2001-12-11 14:42:30 +03:00
{
2002-01-10 18:01:58 +03:00
struct labeller_i * li ;
2013-07-29 17:58:18 +04:00
if ( ! ( li = _alloc_li ( handler - > fmt - > name , handler ) ) )
2008-01-30 16:19:47 +03:00
return_0 ;
2001-12-11 14:42:30 +03:00
2008-11-04 01:14:30 +03:00
dm_list_add ( & _labellers , & li - > list ) ;
2002-01-10 18:01:58 +03:00
return 1 ;
2001-12-11 14:42:30 +03:00
}
2002-01-10 18:01:58 +03:00
struct labeller * label_get_handler ( const char * name )
2001-12-11 14:42:30 +03:00
{
2002-01-10 18:01:58 +03:00
struct labeller_i * li ;
2001-12-11 14:42:30 +03:00
2008-11-04 01:14:30 +03:00
dm_list_iterate_items ( li , & _labellers )
2002-01-10 18:01:58 +03:00
if ( ! strcmp ( li - > name , name ) )
return li - > l ;
2001-12-11 14:42:30 +03:00
2002-01-10 18:01:58 +03:00
return NULL ;
}
2001-12-11 14:42:30 +03:00
2002-11-18 17:04:08 +03:00
/* FIXME Also wipe associated metadata area headers? */
2002-01-11 13:43:32 +03:00
int label_remove ( struct device * dev )
2001-12-11 14:42:30 +03:00
{
2018-02-20 00:40:44 +03:00
char readbuf [ LABEL_SIZE ] __attribute__ ( ( aligned ( 8 ) ) ) ;
2002-11-18 17:04:08 +03:00
int r = 1 ;
uint64_t sector ;
int wipe ;
struct labeller_i * li ;
struct label_header * lh ;
2017-08-11 22:32:04 +03:00
struct lvmcache_info * info ;
2002-11-18 17:04:08 +03:00
log_very_verbose ( " Scanning for labels to wipe from %s " , dev_name ( dev ) ) ;
2018-05-16 21:24:00 +03:00
if ( ! label_scan_open_excl ( dev ) ) {
2018-02-20 00:40:44 +03:00
log_error ( " Failed to open device %s " , dev_name ( dev ) ) ;
return 0 ;
2002-11-18 17:04:08 +03:00
}
/* Scan first few sectors for anything looking like a label */
for ( sector = 0 ; sector < LABEL_SCAN_SECTORS ;
sector + = LABEL_SIZE > > SECTOR_SHIFT ) {
2018-02-20 00:40:44 +03:00
memset ( readbuf , 0 , sizeof ( readbuf ) ) ;
2018-02-27 20:26:04 +03:00
if ( ! dev_read_bytes ( dev , sector < < SECTOR_SHIFT , LABEL_SIZE , readbuf ) ) {
2018-02-20 00:40:44 +03:00
log_error ( " Failed to read label from %s sector %llu " ,
dev_name ( dev ) , ( unsigned long long ) sector ) ;
continue ;
}
lh = ( struct label_header * ) readbuf ;
2002-11-18 17:04:08 +03:00
wipe = 0 ;
2006-05-10 01:23:51 +04:00
if ( ! strncmp ( ( char * ) lh - > id , LABEL_ID , sizeof ( lh - > id ) ) ) {
2002-11-18 17:04:08 +03:00
if ( xlate64 ( lh - > sector_xl ) = = sector )
wipe = 1 ;
} else {
2008-11-04 01:14:30 +03:00
dm_list_iterate_items ( li , & _labellers ) {
2018-02-20 00:40:44 +03:00
if ( li - > l - > ops - > can_handle ( li - > l , ( char * ) lh , sector ) ) {
2002-11-18 17:04:08 +03:00
wipe = 1 ;
break ;
}
}
}
if ( wipe ) {
2018-02-20 00:40:44 +03:00
log_very_verbose ( " %s: Wiping label at sector %llu " ,
dev_name ( dev ) , ( unsigned long long ) sector ) ;
2018-02-27 20:26:04 +03:00
if ( ! dev_write_zeros ( dev , sector < < SECTOR_SHIFT , LABEL_SIZE ) ) {
2018-02-20 00:40:44 +03:00
log_error ( " Failed to remove label from %s at sector %llu " ,
dev_name ( dev ) , ( unsigned long long ) sector ) ;
r = 0 ;
} else {
2017-08-11 22:32:04 +03:00
/* Also remove the PV record from cache. */
info = lvmcache_info_from_pvid ( dev - > pvid , dev , 0 ) ;
if ( info )
lvmcache_del ( info ) ;
2002-11-18 17:04:08 +03:00
}
}
}
return r ;
2001-12-11 14:42:30 +03:00
}
2002-11-18 17:04:08 +03:00
/* Caller may need to use label_get_handler to create label struct! */
int label_write ( struct device * dev , struct label * label )
{
2010-07-09 19:34:40 +04:00
char buf [ LABEL_SIZE ] __attribute__ ( ( aligned ( 8 ) ) ) ;
2002-11-18 17:04:08 +03:00
struct label_header * lh = ( struct label_header * ) buf ;
2018-10-30 00:53:17 +03:00
uint64_t offset ;
2002-11-18 17:04:08 +03:00
int r = 1 ;
2003-08-27 01:12:06 +04:00
if ( ! label - > labeller - > ops - > write ) {
2009-07-16 00:02:46 +04:00
log_error ( " Label handler does not support label writes " ) ;
2003-08-27 01:12:06 +04:00
return 0 ;
}
2002-11-18 17:04:08 +03:00
if ( ( LABEL_SIZE + ( label - > sector < < SECTOR_SHIFT ) ) > LABEL_SCAN_SIZE ) {
log_error ( " Label sector % " PRIu64 " beyond range (%ld) " ,
label - > sector , LABEL_SCAN_SECTORS ) ;
return 0 ;
}
memset ( buf , 0 , LABEL_SIZE ) ;
2006-05-10 01:23:51 +04:00
strncpy ( ( char * ) lh - > id , LABEL_ID , sizeof ( lh - > id ) ) ;
2002-11-18 17:04:08 +03:00
lh - > sector_xl = xlate64 ( label - > sector ) ;
lh - > offset_xl = xlate32 ( sizeof ( * lh ) ) ;
2008-01-30 16:19:47 +03:00
if ( ! ( label - > labeller - > ops - > write ) ( label , buf ) )
return_0 ;
2002-11-18 17:04:08 +03:00
2010-09-27 23:09:34 +04:00
lh - > crc_xl = xlate32 ( calc_crc ( INITIAL_CRC , ( uint8_t * ) & lh - > offset_xl , LABEL_SIZE -
( ( uint8_t * ) & lh - > offset_xl - ( uint8_t * ) lh ) ) ) ;
2002-11-18 17:04:08 +03:00
2016-11-01 13:02:01 +03:00
log_very_verbose ( " %s: Writing label to sector % " PRIu64 " with stored offset % "
PRIu32 " . " , dev_name ( dev ) , label - > sector ,
xlate32 ( lh - > offset_xl ) ) ;
2018-02-20 00:40:44 +03:00
if ( ! label_scan_open ( dev ) ) {
log_error ( " Failed to open device %s " , dev_name ( dev ) ) ;
return 0 ;
}
2018-10-30 00:53:17 +03:00
offset = label - > sector < < SECTOR_SHIFT ;
dev_set_last_byte ( dev , offset + LABEL_SIZE ) ;
if ( ! dev_write_bytes ( dev , offset , LABEL_SIZE , buf ) ) {
2013-01-08 02:30:29 +04:00
log_debug_devs ( " Failed to write label to %s " , dev_name ( dev ) ) ;
2002-11-18 17:04:08 +03:00
r = 0 ;
}
2018-10-30 00:53:17 +03:00
dev_unset_last_byte ( dev ) ;
2002-11-18 17:04:08 +03:00
return r ;
2001-12-11 14:42:30 +03:00
}
2002-11-18 17:04:08 +03:00
void label_destroy ( struct label * label )
2001-12-11 19:49:40 +03:00
{
2002-11-18 17:04:08 +03:00
label - > labeller - > ops - > destroy_label ( label - > labeller , label ) ;
2018-06-08 15:40:53 +03:00
free ( label ) ;
2002-11-18 17:04:08 +03:00
}
struct label * label_create ( struct labeller * labeller )
{
struct label * label ;
2018-06-08 15:40:53 +03:00
if ( ! ( label = zalloc ( sizeof ( * label ) ) ) ) {
2002-11-18 17:04:08 +03:00
log_error ( " label allocaction failed " ) ;
return NULL ;
}
label - > labeller = labeller ;
labeller - > ops - > initialise_label ( labeller , label ) ;
return label ;
2001-12-11 19:49:40 +03:00
}
2018-02-07 00:18:11 +03:00
/*
 * Global variable for accessing the bcache populated by label scan.
 * It is created by _setup_bcache() and used by the scanning code in this
 * file to prefetch, read and invalidate device blocks.
 * NOTE(review): not static, so presumably also referenced from other
 * files - confirm against the header.
 */
struct bcache * scan_bcache ;
2018-02-15 19:27:43 +03:00
/*
 * Size of one bcache block in 512-byte sectors.  Passed to bcache_create()
 * and used as the scan buffer size when searching a block for a label.
 */
# define BCACHE_BLOCK_SIZE_IN_SECTORS 256 /* 256*512 = 128K */
2018-02-07 00:18:11 +03:00
static bool _in_bcache ( struct device * dev )
{
2018-02-14 01:17:02 +03:00
if ( ! dev )
return NULL ;
2018-02-07 00:18:11 +03:00
return ( dev - > flags & DEV_IN_BCACHE ) ? true : false ;
}
static struct labeller * _find_lvm_header ( struct device * dev ,
char * scan_buf ,
2018-05-11 00:27:34 +03:00
uint32_t scan_buf_sectors ,
2018-02-07 00:18:11 +03:00
char * label_buf ,
uint64_t * label_sector ,
2018-05-11 00:27:34 +03:00
uint64_t block_sector ,
uint64_t start_sector )
2018-02-07 00:18:11 +03:00
{
struct labeller_i * li ;
struct labeller * labeller_ret = NULL ;
struct label_header * lh ;
uint64_t sector ;
int found = 0 ;
/*
* Find which sector in scan_buf starts with a valid label ,
* and copy it into label_buf .
*/
2018-05-11 00:27:34 +03:00
for ( sector = start_sector ; sector < start_sector + LABEL_SCAN_SECTORS ;
2018-02-07 00:18:11 +03:00
sector + = LABEL_SIZE > > SECTOR_SHIFT ) {
2018-05-11 00:27:34 +03:00
/*
* The scan_buf passed in is a bcache block , which is
* BCACHE_BLOCK_SIZE_IN_SECTORS large . So if start_sector is
* one of the last couple sectors in that buffer , we need to
* break early .
*/
if ( sector > = scan_buf_sectors )
break ;
2018-02-07 00:18:11 +03:00
lh = ( struct label_header * ) ( scan_buf + ( sector < < SECTOR_SHIFT ) ) ;
if ( ! strncmp ( ( char * ) lh - > id , LABEL_ID , sizeof ( lh - > id ) ) ) {
if ( found ) {
log_error ( " Ignoring additional label on %s at sector %llu " ,
2018-05-11 00:27:34 +03:00
dev_name ( dev ) , ( unsigned long long ) ( block_sector + sector ) ) ;
2018-02-07 00:18:11 +03:00
}
2018-05-11 00:27:34 +03:00
if ( xlate64 ( lh - > sector_xl ) ! = sector ) {
log_warn ( " %s: Label for sector %llu found at sector %llu - ignoring. " ,
dev_name ( dev ) ,
( unsigned long long ) xlate64 ( lh - > sector_xl ) ,
( unsigned long long ) ( block_sector + sector ) ) ;
2018-02-07 00:18:11 +03:00
continue ;
}
2018-05-11 00:27:34 +03:00
if ( calc_crc ( INITIAL_CRC , ( uint8_t * ) & lh - > offset_xl ,
LABEL_SIZE - ( ( uint8_t * ) & lh - > offset_xl - ( uint8_t * ) lh ) ) ! = xlate32 ( lh - > crc_xl ) ) {
2018-02-07 00:18:11 +03:00
log_very_verbose ( " Label checksum incorrect on %s - ignoring " , dev_name ( dev ) ) ;
continue ;
}
if ( found )
continue ;
}
dm_list_iterate_items ( li , & _labellers ) {
2018-05-11 00:27:34 +03:00
if ( li - > l - > ops - > can_handle ( li - > l , ( char * ) lh , block_sector + sector ) ) {
2018-02-07 00:18:11 +03:00
log_very_verbose ( " %s: %s label detected at sector %llu " ,
dev_name ( dev ) , li - > name ,
2018-05-11 00:27:34 +03:00
( unsigned long long ) ( block_sector + sector ) ) ;
2018-02-07 00:18:11 +03:00
if ( found ) {
log_error ( " Ignoring additional label on %s at sector %llu " ,
dev_name ( dev ) ,
2018-05-11 00:27:34 +03:00
( unsigned long long ) ( block_sector + sector ) ) ;
2018-02-07 00:18:11 +03:00
continue ;
}
labeller_ret = li - > l ;
found = 1 ;
memcpy ( label_buf , lh , LABEL_SIZE ) ;
if ( label_sector )
2018-05-11 00:27:34 +03:00
* label_sector = block_sector + sector ;
2018-02-07 00:18:11 +03:00
break ;
}
}
}
return labeller_ret ;
}
/*
* Process / parse the headers from the data read from a device .
* Populates lvmcache with device / mda locations / vgname
* so that vg_read ( vgname ) will know which devices / locations
* to read metadata from .
*
* If during processing , headers / metadata are found to be needed
* beyond the range of the scanned block , then additional reads
* are performed in the processing functions to get that data .
*/
2018-05-04 01:12:07 +03:00
static int _process_block ( struct cmd_context * cmd , struct dev_filter * f ,
2018-05-11 00:27:34 +03:00
struct device * dev , struct block * bb ,
uint64_t block_sector , uint64_t start_sector ,
int * is_lvm_device )
2018-02-07 00:18:11 +03:00
{
char label_buf [ LABEL_SIZE ] __attribute__ ( ( aligned ( 8 ) ) ) ;
struct label * label = NULL ;
struct labeller * labeller ;
2018-12-01 00:26:26 +03:00
uint64_t sector = 0 ;
2018-02-07 00:18:11 +03:00
int ret = 0 ;
2018-05-04 01:12:07 +03:00
int pass ;
2018-12-07 23:35:22 +03:00
dev - > flags & = ~ DEV_SCAN_FOUND_LABEL ;
2018-05-04 01:12:07 +03:00
/*
* The device may have signatures that exclude it from being processed .
* If filters were applied before bcache data was available , some
* filters may have deferred their check until the point where bcache
* data had been read ( here ) . They set this flag to indicate that the
* filters should be retested now that data from the device is ready .
*/
2018-05-11 00:27:34 +03:00
if ( f & & ( dev - > flags & DEV_FILTER_AFTER_SCAN ) ) {
2018-05-04 01:12:07 +03:00
dev - > flags & = ~ DEV_FILTER_AFTER_SCAN ;
log_debug_devs ( " Scan filtering %s " , dev_name ( dev ) ) ;
2018-12-07 23:35:22 +03:00
pass = f - > passes_filter ( cmd , f , dev , NULL ) ;
2018-05-04 01:12:07 +03:00
if ( ( pass = = - EAGAIN ) | | ( dev - > flags & DEV_FILTER_AFTER_SCAN ) ) {
/* Shouldn't happen */
dev - > flags & = ~ DEV_FILTER_OUT_SCAN ;
log_debug_devs ( " Scan filter should not be deferred %s " , dev_name ( dev ) ) ;
pass = 1 ;
}
if ( ! pass ) {
log_very_verbose ( " %s: Not processing filtered " , dev_name ( dev ) ) ;
dev - > flags | = DEV_FILTER_OUT_SCAN ;
* is_lvm_device = 0 ;
goto_out ;
}
}
2018-02-07 00:18:11 +03:00
/*
* Finds the data sector containing the label and copies into label_buf .
* label_buf : struct label_header + struct pv_header + struct pv_header_extension
*
* FIXME : we don ' t need to copy one sector from bb - > data into label_buf ,
* we can just point label_buf at one sector in ld - > buf .
*/
2018-05-11 00:27:34 +03:00
if ( ! ( labeller = _find_lvm_header ( dev , bb - > data , BCACHE_BLOCK_SIZE_IN_SECTORS , label_buf , & sector , block_sector , start_sector ) ) ) {
2018-02-07 00:18:11 +03:00
/*
* Non - PVs exit here
*
* FIXME : check for PVs with errors that also exit here !
* i . e . this code cannot distinguish between a non - lvm
* device an an lvm device with errors .
*/
log_very_verbose ( " %s: No lvm label detected " , dev_name ( dev ) ) ;
2018-03-01 21:40:37 +03:00
lvmcache_del_dev ( dev ) ; /* FIXME: if this is needed, fix it. */
2018-02-07 00:18:11 +03:00
* is_lvm_device = 0 ;
goto_out ;
}
2018-12-07 23:35:22 +03:00
dev - > flags | = DEV_SCAN_FOUND_LABEL ;
2018-02-07 00:18:11 +03:00
* is_lvm_device = 1 ;
/*
* This is the point where the scanning code dives into the rest of
* lvm . ops - > read ( ) is usually _text_read ( ) which reads the pv_header ,
* mda locations , mda contents . As these bits of data are read , they
* are saved into lvmcache as info / vginfo structs .
*/
if ( ( ret = ( labeller - > ops - > read ) ( labeller , dev , label_buf , & label ) ) & & label ) {
label - > dev = dev ;
label - > sector = sector ;
} else {
/* FIXME: handle errors */
2018-03-01 21:40:37 +03:00
lvmcache_del_dev ( dev ) ;
2018-02-07 00:18:11 +03:00
}
out :
return ret ;
}
2018-02-13 17:58:35 +03:00
static int _scan_dev_open ( struct device * dev )
{
2018-05-25 19:14:12 +03:00
struct dm_list * name_list ;
struct dm_str_list * name_sl ;
2018-02-13 17:58:35 +03:00
const char * name ;
2018-05-25 19:14:12 +03:00
struct stat sbuf ;
int retried = 0 ;
2018-02-13 17:58:35 +03:00
int flags = 0 ;
int fd ;
2018-02-14 01:17:02 +03:00
if ( ! dev )
return 0 ;
2018-02-13 17:58:35 +03:00
if ( dev - > flags & DEV_IN_BCACHE ) {
2018-05-25 19:14:12 +03:00
/* Shouldn't happen */
log_error ( " Device open %s has DEV_IN_BCACHE already set " , dev_name ( dev ) ) ;
2018-02-13 17:58:35 +03:00
dev - > flags & = ~ DEV_IN_BCACHE ;
}
if ( dev - > bcache_fd > 0 ) {
2018-05-25 19:14:12 +03:00
/* Shouldn't happen */
log_error ( " Device open %s already open with fd %d " ,
2018-02-13 17:58:35 +03:00
dev_name ( dev ) , dev - > bcache_fd ) ;
return 0 ;
}
2018-05-25 19:14:12 +03:00
/*
* All the names for this device ( major : minor ) are kept on
* dev - > aliases , the first one is the primary / preferred name .
*/
if ( ! ( name_list = dm_list_first ( & dev - > aliases ) ) ) {
/* Shouldn't happen */
log_error ( " Device open %s %d:%d has no path names. " ,
dev_name ( dev ) , ( int ) MAJOR ( dev - > dev ) , ( int ) MINOR ( dev - > dev ) ) ;
2018-02-13 17:58:35 +03:00
return 0 ;
}
2018-05-25 19:14:12 +03:00
name_sl = dm_list_item ( name_list , struct dm_str_list ) ;
name = name_sl - > str ;
2018-02-13 17:58:35 +03:00
flags | = O_DIRECT ;
flags | = O_NOATIME ;
2018-06-20 19:32:45 +03:00
/*
* FIXME : udev is a train wreck when we open RDWR and close , so we
* need to only use RDWR when we actually need to write , and use
* RDONLY otherwise . Fix , disable or scrap udev nonsense so we can
* just open with RDWR by default .
*/
if ( dev - > flags & DEV_BCACHE_EXCL ) {
2018-02-13 17:58:35 +03:00
flags | = O_EXCL ;
2018-06-20 19:32:45 +03:00
flags | = O_RDWR ;
} else if ( dev - > flags & DEV_BCACHE_WRITE ) {
flags | = O_RDWR ;
} else {
flags | = O_RDONLY ;
}
2018-02-13 17:58:35 +03:00
2018-05-25 19:14:12 +03:00
retry_open :
2018-02-13 17:58:35 +03:00
fd = open ( name , flags , 0777 ) ;
if ( fd < 0 ) {
if ( ( errno = = EBUSY ) & & ( flags & O_EXCL ) ) {
log_error ( " Can't open %s exclusively. Mounted filesystem? " ,
dev_name ( dev ) ) ;
} else {
2018-05-25 19:14:12 +03:00
int major , minor ;
/*
* Shouldn ' t happen , if it does , print stat info to help figure
* out what ' s wrong .
*/
major = ( int ) MAJOR ( dev - > dev ) ;
minor = ( int ) MINOR ( dev - > dev ) ;
log_error ( " Device open %s %d:%d failed errno %d " , name , major , minor , errno ) ;
if ( stat ( name , & sbuf ) ) {
log_debug_devs ( " Device open %s %d:%d stat failed errno %d " ,
name , major , minor , errno ) ;
} else if ( sbuf . st_rdev ! = dev - > dev ) {
log_debug_devs ( " Device open %s %d:%d stat %d:%d does not match. " ,
name , major , minor ,
( int ) MAJOR ( sbuf . st_rdev ) , ( int ) MINOR ( sbuf . st_rdev ) ) ;
}
if ( ! retried ) {
/*
* FIXME : remove this , the theory for this retry is that
* there may be a udev race that we can sometimes mask by
* retrying . This is here until we can figure out if it ' s
* needed and if so fix the real problem .
*/
usleep ( 5000 ) ;
log_debug_devs ( " Device open %s retry " , dev_name ( dev ) ) ;
retried = 1 ;
goto retry_open ;
}
2018-02-13 17:58:35 +03:00
}
return 0 ;
}
dev - > flags | = DEV_IN_BCACHE ;
dev - > bcache_fd = fd ;
return 1 ;
}
static int _scan_dev_close ( struct device * dev )
{
if ( ! ( dev - > flags & DEV_IN_BCACHE ) )
log_error ( " scan_dev_close %s no DEV_IN_BCACHE set " , dev_name ( dev ) ) ;
dev - > flags & = ~ DEV_IN_BCACHE ;
dev - > flags & = ~ DEV_BCACHE_EXCL ;
if ( dev - > bcache_fd < 0 ) {
log_error ( " scan_dev_close %s already closed " , dev_name ( dev ) ) ;
return 0 ;
}
if ( close ( dev - > bcache_fd ) )
log_warn ( " close %s errno %d " , dev_name ( dev ) , errno ) ;
dev - > bcache_fd = - 1 ;
return 1 ;
}
2018-05-30 01:02:27 +03:00
static void _drop_bad_aliases ( struct device * dev )
{
struct dm_str_list * strl , * strl2 ;
const char * name ;
struct stat sbuf ;
int major = ( int ) MAJOR ( dev - > dev ) ;
int minor = ( int ) MINOR ( dev - > dev ) ;
int bad ;
dm_list_iterate_items_safe ( strl , strl2 , & dev - > aliases ) {
name = strl - > str ;
bad = 0 ;
if ( stat ( name , & sbuf ) ) {
bad = 1 ;
log_debug_devs ( " Device path check %d:%d %s stat failed errno %d " ,
major , minor , name , errno ) ;
} else if ( sbuf . st_rdev ! = dev - > dev ) {
bad = 1 ;
log_debug_devs ( " Device path check %d:%d %s stat %d:%d does not match. " ,
major , minor , name ,
( int ) MAJOR ( sbuf . st_rdev ) , ( int ) MINOR ( sbuf . st_rdev ) ) ;
}
if ( bad ) {
log_debug_devs ( " Device path check %d:%d dropping path %s. " , major , minor , name ) ;
dev_cache_failed_path ( dev , name ) ;
}
}
}
2018-02-07 00:18:11 +03:00
/*
* Read or reread label / metadata from selected devs .
*
* Reads and looks at label_header , pv_header , pv_header_extension ,
* mda_header , raw_locns , vg metadata from each device .
*
* Effect is populating lvmcache with latest info / vginfo ( PV / VG ) data
* from the devs . If a scanned device does not have a label_header ,
* its info is removed from lvmcache .
*/
2018-05-04 01:12:07 +03:00
static int _scan_list ( struct cmd_context * cmd , struct dev_filter * f ,
struct dm_list * devs , int * failed )
2018-02-07 00:18:11 +03:00
{
struct dm_list wait_devs ;
struct dm_list done_devs ;
2018-05-25 19:14:12 +03:00
struct dm_list reopen_devs ;
2018-02-07 00:18:11 +03:00
struct device_list * devl , * devl2 ;
struct block * bb ;
2018-05-25 19:14:12 +03:00
int retried_open = 0 ;
2018-04-06 21:12:26 +03:00
int scan_read_errors = 0 ;
int scan_process_errors = 0 ;
2018-02-07 00:18:11 +03:00
int scan_failed_count = 0 ;
int rem_prefetches ;
2018-05-04 01:12:07 +03:00
int submit_count ;
2018-02-07 00:18:11 +03:00
int scan_failed ;
int is_lvm_device ;
2018-04-06 21:12:26 +03:00
int error ;
2018-03-01 21:40:37 +03:00
int ret ;
2018-02-07 00:18:11 +03:00
dm_list_init ( & wait_devs ) ;
dm_list_init ( & done_devs ) ;
2018-05-25 19:14:12 +03:00
dm_list_init ( & reopen_devs ) ;
2018-02-07 00:18:11 +03:00
2018-04-06 21:12:26 +03:00
log_debug_devs ( " Scanning %d devices for VG info " , dm_list_size ( devs ) ) ;
2018-02-07 00:18:11 +03:00
scan_more :
rem_prefetches = bcache_max_prefetches ( scan_bcache ) ;
2018-05-04 01:12:07 +03:00
submit_count = 0 ;
2018-02-07 00:18:11 +03:00
dm_list_iterate_items_safe ( devl , devl2 , devs ) {
/*
* If we prefetch more devs than blocks in the cache , then the
* cache will wait for earlier reads to complete , toss the
* results , and reuse those blocks before we ' ve had a chance to
* use them . So , prefetch as many as are available , wait for
* and process them , then repeat .
*/
if ( ! rem_prefetches )
break ;
if ( ! _in_bcache ( devl - > dev ) ) {
2018-02-13 17:58:35 +03:00
if ( ! _scan_dev_open ( devl - > dev ) ) {
2018-03-01 21:40:37 +03:00
log_debug_devs ( " Scan failed to open %s. " , dev_name ( devl - > dev ) ) ;
2018-02-13 17:58:35 +03:00
dm_list_del ( & devl - > list ) ;
2018-05-25 19:14:12 +03:00
dm_list_add ( & reopen_devs , & devl - > list ) ;
2018-02-07 00:18:11 +03:00
continue ;
}
}
2018-02-13 17:58:35 +03:00
bcache_prefetch ( scan_bcache , devl - > dev - > bcache_fd , 0 ) ;
2018-02-07 00:18:11 +03:00
rem_prefetches - - ;
2018-05-04 01:12:07 +03:00
submit_count + + ;
2018-02-07 00:18:11 +03:00
dm_list_del ( & devl - > list ) ;
dm_list_add ( & wait_devs , & devl - > list ) ;
}
2018-05-04 01:12:07 +03:00
log_debug_devs ( " Scanning submitted %d reads " , submit_count ) ;
2018-02-07 00:18:11 +03:00
dm_list_iterate_items_safe ( devl , devl2 , & wait_devs ) {
bb = NULL ;
2018-04-06 21:12:26 +03:00
error = 0 ;
scan_failed = 0 ;
is_lvm_device = 0 ;
2018-02-07 00:18:11 +03:00
2018-05-10 15:26:08 +03:00
if ( ! bcache_get ( scan_bcache , devl - > dev - > bcache_fd , 0 , 0 , & bb ) ) {
2018-04-06 21:12:26 +03:00
log_debug_devs ( " Scan failed to read %s error %d. " , dev_name ( devl - > dev ) , error ) ;
2018-02-07 00:18:11 +03:00
scan_failed = 1 ;
2018-04-06 21:12:26 +03:00
scan_read_errors + + ;
scan_failed_count + + ;
2018-03-01 21:40:37 +03:00
lvmcache_del_dev ( devl - > dev ) ;
2018-02-07 00:18:11 +03:00
} else {
2018-05-30 01:02:27 +03:00
log_debug_devs ( " Processing data from device %s %d:%d fd %d block %p " ,
dev_name ( devl - > dev ) ,
( int ) MAJOR ( devl - > dev - > dev ) ,
( int ) MINOR ( devl - > dev - > dev ) ,
devl - > dev - > bcache_fd , bb ) ;
2018-03-01 21:40:37 +03:00
2018-05-11 00:27:34 +03:00
ret = _process_block ( cmd , f , devl - > dev , bb , 0 , 0 , & is_lvm_device ) ;
2018-03-01 21:40:37 +03:00
if ( ! ret & & is_lvm_device ) {
2018-03-09 20:39:12 +03:00
log_debug_devs ( " Scan failed to process %s " , dev_name ( devl - > dev ) ) ;
2018-03-01 21:40:37 +03:00
scan_failed = 1 ;
2018-04-06 21:12:26 +03:00
scan_process_errors + + ;
scan_failed_count + + ;
2018-03-01 21:40:37 +03:00
lvmcache_del_dev ( devl - > dev ) ;
}
2018-02-07 00:18:11 +03:00
}
if ( bb )
bcache_put ( bb ) ;
/*
* Keep the bcache block of lvm devices we have processed so
* that the vg_read phase can reuse it . If bcache failed to
* read the block , or the device does not belong to lvm , then
* drop it from bcache .
*/
if ( scan_failed | | ! is_lvm_device ) {
2018-02-13 17:58:35 +03:00
bcache_invalidate_fd ( scan_bcache , devl - > dev - > bcache_fd ) ;
_scan_dev_close ( devl - > dev ) ;
2018-02-07 00:18:11 +03:00
}
dm_list_del ( & devl - > list ) ;
dm_list_add ( & done_devs , & devl - > list ) ;
}
if ( ! dm_list_empty ( devs ) )
goto scan_more ;
2018-05-25 19:14:12 +03:00
/*
* We ' re done scanning all the devs . If we failed to open any of them
* the first time through , refresh device paths and retry . We failed
* to open the devs on the reopen_devs list .
*
* FIXME : it ' s not clear if or why this helps .
*/
if ( ! dm_list_empty ( & reopen_devs ) ) {
if ( retried_open ) {
/* Don't try again. */
scan_failed_count + = dm_list_size ( & reopen_devs ) ;
dm_list_splice ( & done_devs , & reopen_devs ) ;
goto out ;
}
retried_open = 1 ;
2018-05-30 01:02:27 +03:00
dm_list_iterate_items_safe ( devl , devl2 , & reopen_devs ) {
_drop_bad_aliases ( devl - > dev ) ;
if ( dm_list_empty ( & devl - > dev - > aliases ) ) {
log_warn ( " WARNING: Scan ignoring device %d:%d with no paths. " ,
( int ) MAJOR ( devl - > dev - > dev ) ,
( int ) MINOR ( devl - > dev - > dev ) ) ;
dm_list_del ( & devl - > list ) ;
lvmcache_del_dev ( devl - > dev ) ;
scan_failed_count + + ;
}
}
2018-05-25 19:14:12 +03:00
/*
* This will search the system ' s / dev for new path names and
* could help us reopen the device if it finds a new preferred
* path name for this dev ' s major : minor . It does that by
* inserting a new preferred path name on dev - > aliases . open
* uses the first name from that list .
*/
log_debug_devs ( " Scanning refreshing device paths. " ) ;
dev_cache_scan ( ) ;
/* Put devs that failed to open back on the original list to retry. */
dm_list_splice ( devs , & reopen_devs ) ;
goto scan_more ;
}
out :
log_debug_devs ( " Scanned devices: read errors %d process errors %d failed %d " ,
scan_read_errors , scan_process_errors , scan_failed_count ) ;
2018-02-07 00:18:11 +03:00
2018-02-13 17:58:35 +03:00
if ( failed )
* failed = scan_failed_count ;
2018-02-15 01:15:30 +03:00
dm_list_splice ( devs , & done_devs ) ;
2018-02-13 17:58:35 +03:00
return 1 ;
2018-02-07 00:18:11 +03:00
}
2018-05-15 20:16:58 +03:00
/*
2019-03-01 22:55:59 +03:00
* num_devs is the number of devices the caller is going to scan .
* When 0 the caller doesn ' t know , and we use the default cache size .
* When non - zero , allocate at least num_devs bcache blocks .
* num_devs doesn ' t really tell us how many bcache blocks we ' ll use
* because it includes lvm devs and non - lvm devs , and each lvm dev
* will often use a number of bcache blocks .
2018-05-15 20:16:58 +03:00
*
2019-03-01 22:55:59 +03:00
* We don ' t know ahead of time if we will find some VG metadata
* that is larger than the total size of the bcache , which would
* prevent us from reading / writing the VG since we do not dynamically
* increase the bcache size when we find it ' s too small . In these
* cases the user would need to set io_memory_size to be larger
* than the max VG metadata size ( lvm does not impose any limit on
* the metadata size . )
2018-05-15 20:16:58 +03:00
*/
2019-03-04 20:18:34 +03:00
# define MIN_BCACHE_BLOCKS 32 /* 4MB */
2018-05-15 20:16:58 +03:00
# define MAX_BCACHE_BLOCKS 1024
2018-02-27 21:35:45 +03:00
2019-03-01 22:55:59 +03:00
static int _setup_bcache ( int num_devs )
2018-02-15 00:45:31 +03:00
{
2018-11-16 21:21:20 +03:00
struct io_engine * ioe = NULL ;
2019-03-01 22:55:59 +03:00
int iomem_kb = io_memory_size ( ) ;
int block_size_kb = ( BCACHE_BLOCK_SIZE_IN_SECTORS * 512 ) / 1024 ;
int cache_blocks ;
cache_blocks = iomem_kb / block_size_kb ;
2018-02-15 00:45:31 +03:00
2018-02-27 21:35:45 +03:00
if ( cache_blocks < MIN_BCACHE_BLOCKS )
cache_blocks = MIN_BCACHE_BLOCKS ;
2018-02-15 00:45:31 +03:00
2018-05-15 20:16:58 +03:00
if ( cache_blocks > MAX_BCACHE_BLOCKS )
cache_blocks = MAX_BCACHE_BLOCKS ;
2019-03-04 21:13:09 +03:00
_current_bcache_size_bytes = cache_blocks * BCACHE_BLOCK_SIZE_IN_SECTORS * 512 ;
2018-11-16 21:21:20 +03:00
if ( use_aio ( ) ) {
if ( ! ( ioe = create_async_io_engine ( ) ) ) {
log_warn ( " Failed to set up async io, using sync io. " ) ;
init_use_aio ( 0 ) ;
}
}
if ( ! ioe ) {
if ( ! ( ioe = create_sync_io_engine ( ) ) ) {
log_error ( " Failed to set up sync io. " ) ;
return 0 ;
}
2018-02-15 00:45:31 +03:00
}
if ( ! ( scan_bcache = bcache_create ( BCACHE_BLOCK_SIZE_IN_SECTORS , cache_blocks , ioe ) ) ) {
log_error ( " Failed to create bcache with %d cache blocks. " , cache_blocks ) ;
return 0 ;
}
return 1 ;
}
2018-12-07 23:35:22 +03:00
/*
 * Empty a list of struct hint entries, unlinking and freeing each one.
 * The list head itself is left for the caller.
 */
static void _free_hints(struct dm_list *hints)
{
	struct hint *cur, *next;

	/* Safe iteration because each entry is removed as it is visited. */
	dm_list_iterate_items_safe(cur, next, hints) {
		dm_list_del(&cur->list);
		free(cur);
	}
}
2018-02-07 00:18:11 +03:00
/*
* Scan and cache lvm data from all devices on the system .
* The cache should be empty / reset before calling this .
*/
int label_scan ( struct cmd_context * cmd )
{
struct dm_list all_devs ;
2018-12-07 23:35:22 +03:00
struct dm_list scan_devs ;
2019-04-11 19:49:18 +03:00
struct dm_list hints_list ;
2018-02-07 00:18:11 +03:00
struct dev_iter * iter ;
2018-05-14 21:38:16 +03:00
struct device_list * devl , * devl2 ;
2018-02-07 00:18:11 +03:00
struct device * dev ;
2019-03-04 21:13:09 +03:00
uint64_t max_metadata_size_bytes ;
2018-12-07 23:35:22 +03:00
int newhints = 0 ;
2018-02-07 00:18:11 +03:00
log_debug_devs ( " Finding devices to scan " ) ;
dm_list_init ( & all_devs ) ;
2018-12-07 23:35:22 +03:00
dm_list_init ( & scan_devs ) ;
2019-04-11 19:49:18 +03:00
dm_list_init ( & hints_list ) ;
2018-02-07 00:18:11 +03:00
/*
* Iterate through all the devices in dev - cache ( block devs that appear
* under / dev that could possibly hold a PV and are not excluded by
* filters ) . Read each to see if it ' s an lvm device , and if so
* populate lvmcache with some basic info about the device and the VG
* on it . This info will be used by the vg_read ( ) phase of the
* command .
*/
2018-04-09 19:13:43 +03:00
dev_cache_scan ( ) ;
2018-02-07 00:18:11 +03:00
2018-12-04 23:06:46 +03:00
if ( ! ( iter = dev_iter_create ( cmd - > filter , 0 ) ) ) {
2018-02-07 00:18:11 +03:00
log_error ( " Scanning failed to get devices. " ) ;
return 0 ;
}
2018-06-15 19:03:55 +03:00
while ( ( dev = dev_iter_get ( cmd , iter ) ) ) {
2018-06-08 15:40:53 +03:00
if ( ! ( devl = zalloc ( sizeof ( * devl ) ) ) )
2018-06-01 18:40:28 +03:00
continue ;
2018-02-07 00:18:11 +03:00
devl - > dev = dev ;
dm_list_add ( & all_devs , & devl - > list ) ;
/*
* label_scan should not generally be called a second time ,
* so this will usually not be true .
*/
2018-02-13 17:58:35 +03:00
if ( _in_bcache ( dev ) ) {
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
}
2018-06-15 19:42:10 +03:00
/*
* When md devices exist that use the old superblock at the
* end of the device , then in order to detect and filter out
* the component devices of those md devs , we need to enable
* the full md filter which scans both the start and the end
* of every device . This doubles the amount of scanning i / o ,
* which we want to avoid . FIXME : it may not be worth the
* cost of double i / o just to avoid displaying md component
* devs in ' pvs ' , which is a pretty harmless effect from a
* pretty uncommon situation .
*/
if ( dev_is_md_with_end_superblock ( cmd - > dev_types , dev ) )
cmd - > use_full_md_check = 1 ;
2018-02-07 00:18:11 +03:00
} ;
dev_iter_destroy ( iter ) ;
if ( ! scan_bcache ) {
2018-02-15 00:45:31 +03:00
if ( ! _setup_bcache ( dm_list_size ( & all_devs ) ) )
2018-02-07 00:18:11 +03:00
return 0 ;
}
2018-12-07 23:35:22 +03:00
/*
* In some common cases we can avoid scanning all devices .
*
* TODO : if the command is using hints and a single vgname
* arg , we can also take the vg lock here , prior to scanning .
* This means we would not need to rescan the PVs in the VG
* in vg_read ( skip lvmcache_label_rescan_vg ) after the
* vg lock is usually taken . ( Some commands are already
* able to avoid rescan in vg_read , but locking early would
* apply to more cases . )
*/
2019-04-11 19:49:18 +03:00
if ( ! get_hints ( cmd , & hints_list , & newhints , & all_devs , & scan_devs ) ) {
2018-12-07 23:35:22 +03:00
dm_list_splice ( & scan_devs , & all_devs ) ;
2019-04-11 19:49:18 +03:00
dm_list_init ( & hints_list ) ;
}
2018-12-07 23:35:22 +03:00
log_debug ( " Will scan %d devices skip %d " , dm_list_size ( & scan_devs ) , dm_list_size ( & all_devs ) ) ;
/*
* Do the main scan .
*/
_scan_list ( cmd , cmd - > filter , & scan_devs , NULL ) ;
2019-03-04 21:13:09 +03:00
/*
* Metadata could be larger than total size of bcache , and bcache
* cannot currently be resized during the command . If this is the
* case ( or within reach ) , warn that io_memory_size needs to be
* set larger .
*
* Even if bcache out of space did not cause a failure during scan , it
* may cause a failure during the next vg_read phase or during vg_write .
*
* If there was an error during scan , we could recreate bcache here
* with a larger size and then restart label_scan . But , this does not
* address the problem of writing new metadata that excedes the bcache
* size and failing , which would often be hit first , i . e . we ' ll fail
* to write new metadata exceding the max size before we have a chance
* to read any metadata with that size , unless we find an existing vg
* that has been previously created with the larger size .
*
* If the largest metadata is within 1 MB of the bcache size , then start
* warning .
*/
max_metadata_size_bytes = lvmcache_max_metadata_size ( ) ;
if ( max_metadata_size_bytes + ( 1024 * 1024 ) > _current_bcache_size_bytes ) {
/* we want bcache to be 1MB larger than the max metadata seen */
uint64_t want_size_kb = ( max_metadata_size_bytes / 1024 ) + 1024 ;
uint64_t remainder ;
if ( ( remainder = ( want_size_kb % 1024 ) ) )
want_size_kb = want_size_kb + 1024 - remainder ;
log_warn ( " WARNING: metadata may not be usable with current io_memory_size %d KiB " ,
io_memory_size ( ) ) ;
log_warn ( " WARNING: increase lvm.conf io_memory_size to at least %llu KiB " ,
( unsigned long long ) want_size_kb ) ;
}
2018-12-07 23:35:22 +03:00
dm_list_init ( & cmd - > hints ) ;
2019-04-11 19:49:18 +03:00
if ( ! dm_list_empty ( & hints_list ) ) {
if ( ! validate_hints ( cmd , & hints_list ) ) {
2018-12-07 23:35:22 +03:00
/*
* We scanned a subset of all devices based on hints .
* With the results from the scan we may decide that
* the hints are not valid , so scan all others .
*/
log_debug ( " Will scan %d remaining devices " , dm_list_size ( & all_devs ) ) ;
_scan_list ( cmd , cmd - > filter , & all_devs , NULL ) ;
2019-04-11 19:49:18 +03:00
_free_hints ( & hints_list ) ;
2018-12-07 23:35:22 +03:00
newhints = 0 ;
} else {
/* The hints may be used by another device iteration. */
2019-04-11 19:49:18 +03:00
dm_list_splice ( & cmd - > hints , & hints_list ) ;
2018-12-07 23:35:22 +03:00
}
}
2018-02-13 17:58:35 +03:00
2018-05-14 21:38:16 +03:00
dm_list_iterate_items_safe ( devl , devl2 , & all_devs ) {
dm_list_del ( & devl - > list ) ;
2018-06-08 15:40:53 +03:00
free ( devl ) ;
2018-05-14 21:38:16 +03:00
}
2018-12-07 23:35:22 +03:00
dm_list_iterate_items_safe ( devl , devl2 , & scan_devs ) {
dm_list_del ( & devl - > list ) ;
free ( devl ) ;
}
if ( newhints )
write_hint_file ( cmd , newhints ) ;
2018-02-13 17:58:35 +03:00
return 1 ;
2018-02-07 00:18:11 +03:00
}
/*
* Scan and cache lvm data from the listed devices . If a device is already
* scanned and cached , this replaces the previously cached lvm data for the
* device . This is called when vg_read ( ) wants to guarantee that it is using
* the latest data from the devices in the VG ( since the scan populated bcache
* without a lock . )
*/
2018-05-04 01:12:07 +03:00
int label_scan_devs ( struct cmd_context * cmd , struct dev_filter * f , struct dm_list * devs )
2018-02-07 00:18:11 +03:00
{
struct device_list * devl ;
2018-03-07 00:05:27 +03:00
/* FIXME: get rid of this, it's only needed for lvmetad in which
case we should be setting up bcache in one place . */
if ( ! scan_bcache ) {
if ( ! _setup_bcache ( 0 ) )
return 0 ;
}
2018-02-07 00:18:11 +03:00
dm_list_iterate_items ( devl , devs ) {
2018-02-13 17:58:35 +03:00
if ( _in_bcache ( devl - > dev ) ) {
bcache_invalidate_fd ( scan_bcache , devl - > dev - > bcache_fd ) ;
_scan_dev_close ( devl - > dev ) ;
}
}
2018-05-04 01:12:07 +03:00
_scan_list ( cmd , f , devs , NULL ) ;
2018-02-13 17:58:35 +03:00
/* FIXME: this function should probably fail if any devs couldn't be scanned */
return 1 ;
}
/*
 * Rescan the listed devices after flagging each one with DEV_BCACHE_EXCL.
 * Any device currently in bcache is invalidated and closed first.
 *
 * Returns 1 if _scan_list() reported no failure, otherwise 0.
 */
int label_scan_devs_excl(struct dm_list *devs)
{
	struct device_list *entry;
	int failed = 0;

	dm_list_iterate_items(entry, devs) {
		struct device *d = entry->dev;

		if (_in_bcache(d)) {
			bcache_invalidate_fd(scan_bcache, d->bcache_fd);
			_scan_dev_close(d);
		}

		/*
		 * With this flag set, _scan_dev_open() done by
		 * _scan_list() will do open EXCL
		 */
		d->flags |= DEV_BCACHE_EXCL;
	}

	_scan_list(NULL, NULL, devs, &failed);

	return !failed;
}
void label_scan_invalidate ( struct device * dev )
{
if ( _in_bcache ( dev ) ) {
2018-02-13 17:58:35 +03:00
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
2018-02-07 00:18:11 +03:00
}
}
2018-02-16 23:18:55 +03:00
/*
* If a PV is stacked on an LV , then the LV is kept open
* in bcache , and needs to be closed so the open fd doesn ' t
* interfere with processing the LV .
*/
void label_scan_invalidate_lv ( struct cmd_context * cmd , struct logical_volume * lv )
{
struct lvinfo lvinfo ;
struct device * dev ;
dev_t devt ;
2018-10-15 17:29:09 +03:00
if ( ! lv_info ( cmd , lv , 0 , & lvinfo , 0 , 0 ) )
return ;
2018-02-16 23:18:55 +03:00
devt = MKDEV ( lvinfo . major , lvinfo . minor ) ;
2019-04-05 22:03:38 +03:00
if ( ( dev = dev_cache_get_by_devt ( cmd , devt , NULL , NULL ) ) )
2018-02-16 23:18:55 +03:00
label_scan_invalidate ( dev ) ;
}
2018-02-07 00:18:11 +03:00
/*
2018-02-28 01:35:47 +03:00
* Empty the bcache of all blocks and close all open fds ,
* but keep the bcache set up .
2018-02-07 00:18:11 +03:00
*/
2018-02-28 01:35:47 +03:00
void label_scan_drop ( struct cmd_context * cmd )
2018-02-07 00:18:11 +03:00
{
struct dev_iter * iter ;
struct device * dev ;
2018-05-04 01:12:07 +03:00
if ( ! ( iter = dev_iter_create ( NULL , 0 ) ) )
2018-02-07 00:18:11 +03:00
return ;
2018-06-15 19:03:55 +03:00
while ( ( dev = dev_iter_get ( cmd , iter ) ) ) {
2018-02-20 00:40:44 +03:00
if ( _in_bcache ( dev ) )
_scan_dev_close ( dev ) ;
}
2018-02-07 00:18:11 +03:00
dev_iter_destroy ( iter ) ;
2018-02-28 01:35:47 +03:00
}
/*
* Close devices that are open because bcache is holding blocks for them .
* Destroy the bcache .
*/
void label_scan_destroy(struct cmd_context *cmd)
{
	/* Nothing to tear down if bcache was never set up. */
	if (scan_bcache) {
		label_scan_drop(cmd);

		bcache_destroy(scan_bcache);
		scan_bcache = NULL;
	}
}
/*
* Read ( or re - read ) and process ( or re - process ) the data for a device . This
* will reset ( clear and repopulate ) the bcache and lvmcache info for this
* device . There are only a couple odd places that want to reread a specific
* device , this is not a commonly used function .
*/
2018-05-11 22:16:49 +03:00
int label_read ( struct device * dev )
2018-02-07 00:18:11 +03:00
{
struct dm_list one_dev ;
struct device_list * devl ;
2018-02-13 17:58:35 +03:00
int failed = 0 ;
2018-02-07 00:18:11 +03:00
/* scanning is done by list, so make a single item list for this dev */
2018-06-08 15:40:53 +03:00
if ( ! ( devl = zalloc ( sizeof ( * devl ) ) ) )
2018-02-07 00:18:11 +03:00
return 0 ;
devl - > dev = dev ;
dm_list_init ( & one_dev ) ;
dm_list_add ( & one_dev , & devl - > list ) ;
2018-02-13 17:58:35 +03:00
if ( _in_bcache ( dev ) ) {
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
}
2018-02-07 00:18:11 +03:00
2018-05-04 01:12:07 +03:00
_scan_list ( NULL , NULL , & one_dev , & failed ) ;
2018-02-07 00:18:11 +03:00
2018-06-08 15:40:53 +03:00
free ( devl ) ;
2018-02-07 00:18:11 +03:00
2018-02-13 17:58:35 +03:00
if ( failed )
return 0 ;
return 1 ;
2018-02-07 00:18:11 +03:00
}
/*
 * Read a label from a specific, non-zero sector.  This is used in only
2018-05-11 00:27:34 +03:00
* one place : pvck / pv_analyze .
2018-02-07 00:18:11 +03:00
*/
2018-05-11 00:27:34 +03:00
int label_read_sector ( struct device * dev , uint64_t read_sector )
2018-02-07 00:18:11 +03:00
{
2018-05-11 00:27:34 +03:00
struct block * bb = NULL ;
uint64_t block_num ;
uint64_t block_sector ;
uint64_t start_sector ;
int is_lvm_device = 0 ;
int result ;
int ret ;
block_num = read_sector / BCACHE_BLOCK_SIZE_IN_SECTORS ;
block_sector = block_num * BCACHE_BLOCK_SIZE_IN_SECTORS ;
start_sector = read_sector % BCACHE_BLOCK_SIZE_IN_SECTORS ;
2018-10-15 17:39:28 +03:00
if ( ! label_scan_open ( dev ) ) {
log_error ( " Error opening device %s for prefetch %llu sector. " ,
dev_name ( dev ) , ( unsigned long long ) block_num ) ;
return false ;
}
2018-05-11 00:27:34 +03:00
bcache_prefetch ( scan_bcache , dev - > bcache_fd , block_num ) ;
if ( ! bcache_get ( scan_bcache , dev - > bcache_fd , block_num , 0 , & bb ) ) {
log_error ( " Scan failed to read %s at %llu " ,
dev_name ( dev ) , ( unsigned long long ) block_num ) ;
ret = 0 ;
goto out ;
2018-02-07 00:18:11 +03:00
}
2018-05-11 00:27:34 +03:00
/*
* TODO : check if scan_sector is larger than the bcache block size .
* If it is , we need to fetch a later block from bcache .
*/
result = _process_block ( NULL , NULL , dev , bb , block_sector , start_sector , & is_lvm_device ) ;
if ( ! result & & is_lvm_device ) {
log_error ( " Scan failed to process %s " , dev_name ( dev ) ) ;
ret = 0 ;
goto out ;
2018-02-07 00:18:11 +03:00
}
2018-05-11 00:27:34 +03:00
if ( ! result | | ! is_lvm_device ) {
log_error ( " Could not find LVM label on %s " , dev_name ( dev ) ) ;
ret = 0 ;
goto out ;
}
ret = 1 ;
out :
if ( bb )
bcache_put ( bb ) ;
return ret ;
2018-02-07 00:18:11 +03:00
}
2018-02-15 01:21:27 +03:00
/*
* This is only needed when commands are using lvmetad , in which case they
* don ' t do an initial label_scan , but may later need to rescan certain devs
* from disk and call this function . FIXME : is there some better number to
2018-05-15 20:16:58 +03:00
* choose here ? How should we predict the number of devices that might need
* scanning when using lvmetad ?
2018-02-15 01:21:27 +03:00
*/
int label_scan_setup_bcache(void)
{
	/* An existing bcache is reused as is. */
	if (scan_bcache)
		return 1;

	return _setup_bcache(0) ? 1 : 0;
}
2018-02-20 00:40:44 +03:00
/*
* This is needed to write to a new non - lvm device .
* Scanning that dev would not keep it open or in
* bcache , but to use bcache_write we need the dev
* to be open so we can use dev - > bcache_fd to write .
*/
int label_scan_open(struct device *dev)
{
	/* Nothing to do when _in_bcache() already reports the device. */
	if (_in_bcache(dev))
		return 1;

	return _scan_dev_open(dev);
}
2018-05-16 21:24:00 +03:00
int label_scan_open_excl ( struct device * dev )
{
2018-06-20 19:32:45 +03:00
if ( _in_bcache ( dev ) & & ! ( dev - > flags & DEV_BCACHE_EXCL ) ) {
/* FIXME: avoid tossing out bcache blocks just to replace fd. */
log_debug ( " Close and reopen excl %s " , dev_name ( dev ) ) ;
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
}
2018-05-16 21:24:00 +03:00
dev - > flags | = DEV_BCACHE_EXCL ;
2018-06-20 19:32:45 +03:00
dev - > flags | = DEV_BCACHE_WRITE ;
2018-05-16 21:24:00 +03:00
return label_scan_open ( dev ) ;
}
2019-04-26 22:49:27 +03:00
int label_scan_open_rw ( struct device * dev )
{
if ( _in_bcache ( dev ) & & ! ( dev - > flags & DEV_BCACHE_WRITE ) ) {
/* FIXME: avoid tossing out bcache blocks just to replace fd. */
log_debug ( " Close and reopen rw %s " , dev_name ( dev ) ) ;
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
}
dev - > flags | = DEV_BCACHE_WRITE ;
return label_scan_open ( dev ) ;
}
2018-05-09 18:34:28 +03:00
bool dev_read_bytes ( struct device * dev , uint64_t start , size_t len , void * data )
2018-02-27 20:26:04 +03:00
{
if ( ! scan_bcache ) {
2018-05-11 17:50:25 +03:00
/* Should not happen */
log_error ( " dev_read bcache not set up %s " , dev_name ( dev ) ) ;
return false ;
2018-02-27 20:26:04 +03:00
}
if ( dev - > bcache_fd < = 0 ) {
2018-03-09 20:39:12 +03:00
/* This is not often needed, perhaps only with lvmetad. */
if ( ! label_scan_open ( dev ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error opening device %s for reading at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-03-09 20:39:12 +03:00
return false ;
}
2018-02-27 20:26:04 +03:00
}
2018-02-28 00:03:56 +03:00
if ( ! bcache_read_bytes ( scan_bcache , dev - > bcache_fd , start , len , data ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error reading device %s at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-02-28 00:03:56 +03:00
label_scan_invalidate ( dev ) ;
return false ;
}
return true ;
2018-02-27 20:26:04 +03:00
}
2018-05-09 18:34:28 +03:00
bool dev_write_bytes ( struct device * dev , uint64_t start , size_t len , void * data )
2018-02-27 20:26:04 +03:00
{
2018-04-09 21:57:44 +03:00
if ( test_mode ( ) )
return true ;
2018-02-27 20:26:04 +03:00
if ( ! scan_bcache ) {
2018-05-11 17:50:25 +03:00
/* Should not happen */
log_error ( " dev_write bcache not set up %s " , dev_name ( dev ) ) ;
return false ;
2018-02-27 20:26:04 +03:00
}
2018-08-01 18:26:28 +03:00
if ( _in_bcache ( dev ) & & ! ( dev - > flags & DEV_BCACHE_WRITE ) ) {
2018-06-20 19:32:45 +03:00
/* FIXME: avoid tossing out bcache blocks just to replace fd. */
log_debug ( " Close and reopen to write %s " , dev_name ( dev ) ) ;
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
dev - > flags | = DEV_BCACHE_WRITE ;
label_scan_open ( dev ) ;
}
2018-02-27 20:26:04 +03:00
if ( dev - > bcache_fd < = 0 ) {
2018-03-09 20:39:12 +03:00
/* This is not often needed, perhaps only with lvmetad. */
2018-06-20 19:32:45 +03:00
dev - > flags | = DEV_BCACHE_WRITE ;
2018-03-09 20:39:12 +03:00
if ( ! label_scan_open ( dev ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error opening device %s for writing at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-03-09 20:39:12 +03:00
return false ;
}
2018-02-27 20:26:04 +03:00
}
2018-02-28 00:03:56 +03:00
if ( ! bcache_write_bytes ( scan_bcache , dev - > bcache_fd , start , len , data ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error writing device %s at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-05-01 17:33:55 +03:00
label_scan_invalidate ( dev ) ;
return false ;
}
if ( ! bcache_flush ( scan_bcache ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error writing device %s at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-02-28 00:03:56 +03:00
label_scan_invalidate ( dev ) ;
return false ;
}
return true ;
2018-02-27 20:26:04 +03:00
}
2018-05-09 18:34:28 +03:00
bool dev_write_zeros ( struct device * dev , uint64_t start , size_t len )
2018-02-27 20:26:04 +03:00
{
2018-04-09 21:57:44 +03:00
if ( test_mode ( ) )
return true ;
2018-02-27 20:26:04 +03:00
if ( ! scan_bcache ) {
2018-05-11 17:50:25 +03:00
log_error ( " dev_write_zeros bcache not set up %s " , dev_name ( dev ) ) ;
2018-05-09 18:34:28 +03:00
return false ;
2018-02-27 20:26:04 +03:00
}
2018-08-01 18:26:28 +03:00
if ( _in_bcache ( dev ) & & ! ( dev - > flags & DEV_BCACHE_WRITE ) ) {
2018-06-20 19:32:45 +03:00
/* FIXME: avoid tossing out bcache blocks just to replace fd. */
log_debug ( " Close and reopen to write %s " , dev_name ( dev ) ) ;
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
dev - > flags | = DEV_BCACHE_WRITE ;
label_scan_open ( dev ) ;
}
2018-02-27 20:26:04 +03:00
if ( dev - > bcache_fd < = 0 ) {
2018-03-09 20:39:12 +03:00
/* This is not often needed, perhaps only with lvmetad. */
2018-06-20 19:32:45 +03:00
dev - > flags | = DEV_BCACHE_WRITE ;
2018-03-09 20:39:12 +03:00
if ( ! label_scan_open ( dev ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error opening device %s for writing at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-03-09 20:39:12 +03:00
return false ;
}
2018-02-27 20:26:04 +03:00
}
2018-10-30 00:53:17 +03:00
dev_set_last_byte ( dev , start + len ) ;
2018-05-03 12:21:14 +03:00
if ( ! bcache_zero_bytes ( scan_bcache , dev - > bcache_fd , start , len ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error writing device %s at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-10-30 00:53:17 +03:00
dev_unset_last_byte ( dev ) ;
2018-05-01 17:33:55 +03:00
label_scan_invalidate ( dev ) ;
return false ;
}
if ( ! bcache_flush ( scan_bcache ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error writing device %s at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-10-30 00:53:17 +03:00
dev_unset_last_byte ( dev ) ;
2018-02-28 00:03:56 +03:00
label_scan_invalidate ( dev ) ;
return false ;
}
2018-10-30 00:53:17 +03:00
dev_unset_last_byte ( dev ) ;
2018-02-28 00:03:56 +03:00
return true ;
2018-02-27 20:26:04 +03:00
}
2018-05-09 18:34:28 +03:00
bool dev_set_bytes ( struct device * dev , uint64_t start , size_t len , uint8_t val )
{
if ( test_mode ( ) )
return true ;
if ( ! scan_bcache ) {
2018-05-11 17:50:25 +03:00
log_error ( " dev_set_bytes bcache not set up %s " , dev_name ( dev ) ) ;
2018-05-09 18:34:28 +03:00
return false ;
}
2018-08-01 18:26:28 +03:00
if ( _in_bcache ( dev ) & & ! ( dev - > flags & DEV_BCACHE_WRITE ) ) {
2018-06-20 19:32:45 +03:00
/* FIXME: avoid tossing out bcache blocks just to replace fd. */
log_debug ( " Close and reopen to write %s " , dev_name ( dev ) ) ;
bcache_invalidate_fd ( scan_bcache , dev - > bcache_fd ) ;
_scan_dev_close ( dev ) ;
2018-11-03 19:19:33 +03:00
/* goes to label_scan_open() since bcache_fd < 0 */
2018-06-20 19:32:45 +03:00
}
2018-05-09 18:34:28 +03:00
if ( dev - > bcache_fd < = 0 ) {
/* This is not often needed, perhaps only with lvmetad. */
2018-06-20 19:32:45 +03:00
dev - > flags | = DEV_BCACHE_WRITE ;
2018-05-09 18:34:28 +03:00
if ( ! label_scan_open ( dev ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error opening device %s for writing at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-05-09 18:34:28 +03:00
return false ;
}
}
2018-10-30 00:53:17 +03:00
dev_set_last_byte ( dev , start + len ) ;
2018-05-09 18:34:28 +03:00
if ( ! bcache_set_bytes ( scan_bcache , dev - > bcache_fd , start , len , val ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error writing device %s at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-10-30 00:53:17 +03:00
dev_unset_last_byte ( dev ) ;
2018-05-09 18:34:28 +03:00
label_scan_invalidate ( dev ) ;
return false ;
}
if ( ! bcache_flush ( scan_bcache ) ) {
2018-06-06 18:05:08 +03:00
log_error ( " Error writing device %s at %llu length %u. " ,
dev_name ( dev ) , ( unsigned long long ) start , ( uint32_t ) len ) ;
2018-10-30 00:53:17 +03:00
dev_unset_last_byte ( dev ) ;
2018-05-09 18:34:28 +03:00
label_scan_invalidate ( dev ) ;
return false ;
}
2018-10-30 00:53:17 +03:00
dev_unset_last_byte ( dev ) ;
2018-05-09 18:34:28 +03:00
return true ;
}
2018-10-30 00:53:17 +03:00
void dev_set_last_byte ( struct device * dev , uint64_t offset )
{
unsigned int phys_block_size = 0 ;
unsigned int block_size = 0 ;
2018-11-03 00:19:47 +03:00
if ( ! dev_get_block_size ( dev , & phys_block_size , & block_size ) ) {
stack ;
/* FIXME ASSERT or regular error testing is missing */
return ;
}
2018-10-30 00:53:17 +03:00
bcache_set_last_byte ( scan_bcache , dev - > bcache_fd , offset , phys_block_size ) ;
}
void dev_unset_last_byte ( struct device * dev )
{
bcache_unset_last_byte ( scan_bcache , dev - > bcache_fd ) ;
}