2011-08-11 09:00:20 +04:00
/*
2017-03-16 23:03:51 +03:00
* Copyright ( C ) 2005 - 2017 Red Hat , Inc . All rights reserved .
2011-08-11 09:00:20 +04:00
*
* This file is part of LVM2 .
*
* This copyrighted material is made available to anyone wishing to use ,
* modify , copy , or redistribute it subject to the terms and conditions
* of the GNU Lesser General Public License v .2 .1 .
*
* You should have received a copy of the GNU Lesser General Public License
* along with this program ; if not , write to the Free Software Foundation ,
2016-01-21 13:49:46 +03:00
* Inc . , 51 Franklin Street , Fifth Floor , Boston , MA 02110 - 1301 USA
2011-08-11 09:00:20 +04:00
*/
2018-05-14 12:30:20 +03:00
# include "lib/misc/lib.h"
2018-12-03 20:15:44 +03:00
# include "daemons/dmeventd/plugins/lvm2/dmeventd_lvm.h"
2018-05-14 12:30:20 +03:00
# include "daemons/dmeventd/libdevmapper-event.h"
2018-12-03 20:15:44 +03:00
# include "lib/config/defaults.h"
2015-10-10 17:58:31 +03:00
2016-09-21 01:38:38 +03:00
/* Hold enough elements for the mximum number of RAID images */
# define RAID_DEVS_ELEMS ((DEFAULT_RAID_MAX_IMAGES + 63) / 64)
2015-10-13 12:28:57 +03:00
struct dso_state {
struct dm_pool * mem ;
char cmd_lvconvert [ 512 ] ;
2016-09-21 01:38:38 +03:00
uint64_t raid_devs [ RAID_DEVS_ELEMS ] ;
2015-10-13 12:28:57 +03:00
int failed ;
2016-09-21 01:38:38 +03:00
int warned ;
2015-10-13 12:28:57 +03:00
} ;
2015-10-10 17:58:31 +03:00
DM_EVENT_LOG_FN ( " raid " )
2011-08-11 09:00:20 +04:00
/* FIXME Reformat to 80 char lines. */
2015-10-13 12:37:14 +03:00
static int _process_raid_event ( struct dso_state * state , char * params , const char * device )
2011-12-06 23:30:15 +04:00
{
2015-10-13 12:37:14 +03:00
struct dm_status_raid * status ;
const char * d ;
2016-09-21 01:38:38 +03:00
int dead = 0 , r = 1 ;
2016-12-09 15:58:19 +03:00
uint32_t dev ;
2014-07-21 06:33:21 +04:00
2015-10-13 12:37:14 +03:00
if ( ! dm_get_status_raid ( state - > mem , params , & status ) ) {
2015-10-09 22:57:48 +03:00
log_error ( " Failed to process status line for %s. " , device ) ;
2015-10-13 12:37:14 +03:00
return 0 ;
2011-08-11 09:00:20 +04:00
}
2016-09-21 01:38:38 +03:00
d = status - > dev_health ;
while ( ( d = strchr ( d , ' D ' ) ) ) {
2016-12-09 15:58:19 +03:00
dev = ( uint32_t ) ( d - status - > dev_health ) ;
2016-09-21 01:38:38 +03:00
2016-12-09 15:58:19 +03:00
if ( ! ( state - > raid_devs [ dev / 64 ] & ( UINT64_C ( 1 ) < < ( dev % 64 ) ) ) ) {
state - > raid_devs [ dev / 64 ] | = ( UINT64_C ( 1 ) < < ( dev % 64 ) ) ;
log_warn ( " WARNING: Device #%u of %s array, %s, has failed. " ,
dev , status - > raid_type , device ) ;
}
2016-09-21 01:38:38 +03:00
d + + ;
dead = 1 ;
}
2017-06-14 16:39:50 +03:00
/*
* if we are converting from non - RAID to RAID ( e . g . linear - > raid1 )
* and too many original devices die , such that we cannot continue
* the " recover " operation , the sync action will go to " idle " , the
* unsynced devs will remain at ' a ' , and the original devices will
* NOT SWITCH TO ' D ' , but will remain at ' A ' - hoping to be revived .
*
* This is simply the way the kernel works . . .
*/
if ( ! strcmp ( status - > sync_action , " idle " ) & &
2017-06-24 01:06:12 +03:00
( status - > dev_health [ 0 ] = = ' a ' ) & &
( status - > insync_regions < status - > total_regions ) ) {
2017-06-14 16:39:50 +03:00
log_error ( " Primary sources for new RAID, %s, have failed. " ,
device ) ;
dead = 1 ; /* run it through LVM repair */
}
2016-09-21 01:38:38 +03:00
if ( dead ) {
2019-09-20 18:35:35 +03:00
/*
2020-10-03 14:52:37 +03:00
* Use the first event to run a repair ignoring any additional ones .
2019-09-20 18:35:35 +03:00
*
* We presume lvconvert to do pre - repair
* checks to avoid bloat in this plugin .
*/
if ( ! state - > warned & & status - > insync_regions < status - > total_regions ) {
state - > warned = 1 ;
log_warn ( " WARNING: waiting for resynchronization to finish "
" before initiating repair on RAID device %s. " , device ) ;
/* Fall through to allow lvconvert to run. */
2019-09-20 18:26:36 +03:00
}
2015-10-22 11:38:40 +03:00
if ( state - > failed )
goto out ; /* already reported */
2015-10-13 12:37:14 +03:00
state - > failed = 1 ;
/* if repair goes OK, report success even if lvscan has failed */
if ( ! dmeventd_lvm2_run_with_lock ( state - > cmd_lvconvert ) ) {
2016-10-31 20:03:06 +03:00
log_error ( " Repair of RAID device %s failed. " , device ) ;
2016-09-21 01:38:38 +03:00
r = 0 ;
2011-08-11 09:00:20 +04:00
}
2015-10-13 12:37:14 +03:00
} else {
state - > failed = 0 ;
2017-06-24 01:06:12 +03:00
if ( status - > insync_regions = = status - > total_regions )
memset ( & state - > raid_devs , 0 , sizeof ( state - > raid_devs ) ) ;
2015-10-13 12:37:14 +03:00
log_info ( " %s array, %s, is %s in-sync. " ,
status - > raid_type , device ,
( status - > insync_regions = = status - > total_regions ) ? " now " : " not " ) ;
2011-08-11 09:00:20 +04:00
}
2015-10-22 11:38:40 +03:00
out :
2015-10-13 12:37:14 +03:00
dm_pool_free ( state - > mem , status ) ;
2011-08-11 09:00:20 +04:00
2016-09-21 01:38:38 +03:00
return r ;
2011-08-11 09:00:20 +04:00
}
void process_event ( struct dm_task * dmt ,
enum dm_event_mask event __attribute__ ( ( unused ) ) ,
2015-10-12 12:40:51 +03:00
void * * user )
2011-08-11 09:00:20 +04:00
{
2015-10-13 12:37:14 +03:00
struct dso_state * state = * user ;
2011-08-11 09:00:20 +04:00
void * next = NULL ;
uint64_t start , length ;
char * target_type = NULL ;
char * params ;
const char * device = dm_task_get_name ( dmt ) ;
do {
next = dm_get_next_target ( dmt , next , & start , & length ,
& target_type , & params ) ;
if ( ! target_type ) {
2015-10-09 22:57:48 +03:00
log_info ( " %s mapping lost. " , device ) ;
2011-08-11 09:00:20 +04:00
continue ;
}
if ( strcmp ( target_type , " raid " ) ) {
2015-10-09 22:57:48 +03:00
log_info ( " %s has non-raid portion. " , device ) ;
2011-08-11 09:00:20 +04:00
continue ;
}
2015-10-13 12:37:14 +03:00
if ( ! _process_raid_event ( state , params , device ) )
2015-10-09 22:57:48 +03:00
log_error ( " Failed to process event for %s. " ,
device ) ;
2011-08-11 09:00:20 +04:00
} while ( next ) ;
}
int register_device ( const char * device ,
const char * uuid __attribute__ ( ( unused ) ) ,
int major __attribute__ ( ( unused ) ) ,
int minor __attribute__ ( ( unused ) ) ,
2015-10-12 12:40:51 +03:00
void * * user )
2011-08-11 09:00:20 +04:00
{
2015-10-13 12:28:57 +03:00
struct dso_state * state ;
if ( ! dmeventd_lvm2_init_with_pool ( " raid_state " , state ) )
goto_bad ;
2017-03-16 23:03:51 +03:00
if ( ! dmeventd_lvm2_command ( state - > mem , state - > cmd_lvconvert , sizeof ( state - > cmd_lvconvert ) ,
2017-06-23 22:15:37 +03:00
" lvconvert --repair --use-policies " , device ) )
2015-10-13 12:28:57 +03:00
goto_bad ;
* user = state ;
2011-12-22 20:37:01 +04:00
2015-10-09 22:57:48 +03:00
log_info ( " Monitoring RAID device %s for events. " , device ) ;
2011-12-22 20:37:01 +04:00
return 1 ;
2015-10-13 12:28:57 +03:00
bad :
log_error ( " Failed to monitor RAID %s. " , device ) ;
2017-02-13 21:00:59 +03:00
if ( state )
dmeventd_lvm2_exit_with_pool ( state ) ;
2015-10-13 12:28:57 +03:00
return 0 ;
2011-08-11 09:00:20 +04:00
}
int unregister_device ( const char * device ,
const char * uuid __attribute__ ( ( unused ) ) ,
int major __attribute__ ( ( unused ) ) ,
int minor __attribute__ ( ( unused ) ) ,
2015-10-12 12:40:51 +03:00
void * * user )
2011-08-11 09:00:20 +04:00
{
2015-10-13 12:28:57 +03:00
struct dso_state * state = * user ;
dmeventd_lvm2_exit_with_pool ( state ) ;
2015-10-09 22:57:48 +03:00
log_info ( " No longer monitoring RAID device %s for events. " ,
device ) ;
2011-12-22 20:37:01 +04:00
2011-08-11 09:00:20 +04:00
return 1 ;
}