1999-08-14 07:10:03 +04:00
/* $NetBSD: rf_disks.c,v 1.13 1999/08/14 03:10:03 oster Exp $ */
1999-02-24 03:00:03 +03:00
/*-
* Copyright ( c ) 1999 The NetBSD Foundation , Inc .
* All rights reserved .
*
* This code is derived from software contributed to The NetBSD Foundation
* by Greg Oster
*
* Redistribution and use in source and binary forms , with or without
* modification , are permitted provided that the following conditions
* are met :
* 1. Redistributions of source code must retain the above copyright
* notice , this list of conditions and the following disclaimer .
* 2. Redistributions in binary form must reproduce the above copyright
* notice , this list of conditions and the following disclaimer in the
* documentation and / or other materials provided with the distribution .
* 3. All advertising materials mentioning features or use of this software
* must display the following acknowledgement :
* This product includes software developed by the NetBSD
* Foundation , Inc . and its contributors .
* 4. Neither the name of The NetBSD Foundation nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission .
*
* THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION , INC . AND CONTRIBUTORS
* ` ` AS IS ' ' AND ANY EXPRESS OR IMPLIED WARRANTIES , INCLUDING , BUT NOT LIMITED
* TO , THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED . IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
* BE LIABLE FOR ANY DIRECT , INDIRECT , INCIDENTAL , SPECIAL , EXEMPLARY , OR
* CONSEQUENTIAL DAMAGES ( INCLUDING , BUT NOT LIMITED TO , PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES ; LOSS OF USE , DATA , OR PROFITS ; OR BUSINESS
* INTERRUPTION ) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY , WHETHER IN
* CONTRACT , STRICT LIABILITY , OR TORT ( INCLUDING NEGLIGENCE OR OTHERWISE )
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE , EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE .
*/
1998-11-13 07:20:26 +03:00
/*
* Copyright ( c ) 1995 Carnegie - Mellon University .
* All rights reserved .
*
* Author : Mark Holland
*
* Permission to use , copy , modify and distribute this software and
* its documentation is hereby granted , provided that both the copyright
* notice and this permission notice appear in all copies of the
* software , derivative works or modified versions , and any portions
* thereof , and that both notices appear in supporting documentation .
*
* CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS " AS IS "
* CONDITION . CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
* FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE .
*
* Carnegie Mellon requests users of this software to return to
*
* Software Distribution Coordinator or Software . Distribution @ CS . CMU . EDU
* School of Computer Science
* Carnegie Mellon University
* Pittsburgh PA 15213 - 3890
*
* any improvements or extensions that they make and grant Carnegie the
* rights to redistribute these changes .
*/
/***************************************************************
* rf_disks . c - - code to perform operations on the actual disks
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
# include "rf_types.h"
# include "rf_raid.h"
# include "rf_alloclist.h"
# include "rf_utils.h"
# include "rf_configure.h"
# include "rf_general.h"
# include "rf_options.h"
# include <sys/types.h>
# include <sys/param.h>
# include <sys/systm.h>
# include <sys/proc.h>
# include <sys/ioctl.h>
# include <sys/fcntl.h>
# include <sys/vnode.h>
1999-02-24 03:00:03 +03:00
/* XXX these should be in a header file somewhere */
1999-02-05 03:06:06 +03:00
int raidlookup __P ( ( char * , struct proc * p , struct vnode * * ) ) ;
1999-02-24 03:00:03 +03:00
int raidwrite_component_label ( dev_t , struct vnode * , RF_ComponentLabel_t * ) ;
int raidread_component_label ( dev_t , struct vnode * , RF_ComponentLabel_t * ) ;
void rf_UnconfigureVnodes ( RF_Raid_t * ) ;
int rf_CheckLabels ( RF_Raid_t * , RF_Config_t * ) ;
1998-11-13 07:20:26 +03:00
# define DPRINTF6(a,b,c,d,e,f) if (rf_diskDebug) printf(a,b,c,d,e,f)
# define DPRINTF7(a,b,c,d,e,f,g) if (rf_diskDebug) printf(a,b,c,d,e,f,g)
1999-02-24 03:00:03 +03:00
/**************************************************************************
1998-11-13 07:20:26 +03:00
*
* initialize the disks comprising the array
*
1999-02-24 03:00:03 +03:00
* We want the spare disks to have regular row , col numbers so that we can
* easily substitue a spare for a failed disk . But , the driver code assumes
* throughout that the array contains numRow by numCol _non - spare_ disks , so
* it ' s not clear how to fit in the spares . This is an unfortunate holdover
* from raidSim . The quick and dirty fix is to make row zero bigger than the
* rest , and put all the spares in it . This probably needs to get changed
* eventually .
1998-11-13 07:20:26 +03:00
*
1999-02-24 03:00:03 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-05 03:06:06 +03:00
int
1999-02-24 03:00:03 +03:00
rf_ConfigureDisks ( listp , raidPtr , cfgPtr )
RF_ShutdownList_t * * listp ;
RF_Raid_t * raidPtr ;
RF_Config_t * cfgPtr ;
1998-11-13 07:20:26 +03:00
{
1999-02-05 03:06:06 +03:00
RF_RaidDisk_t * * disks ;
RF_SectorCount_t min_numblks = ( RF_SectorCount_t ) 0x7FFFFFFFFFFFLL ;
RF_RowCol_t r , c ;
1999-02-24 03:00:03 +03:00
int bs , ret ;
1999-02-05 03:06:06 +03:00
unsigned i , count , foundone = 0 , numFailuresThisRow ;
1999-02-24 03:00:03 +03:00
int num_rows_done , num_cols_done ;
1999-03-02 06:18:48 +03:00
int force ;
1999-02-05 03:06:06 +03:00
num_rows_done = 0 ;
num_cols_done = 0 ;
1999-03-02 06:18:48 +03:00
force = cfgPtr - > force ;
1999-02-05 03:06:06 +03:00
1999-02-24 03:00:03 +03:00
RF_CallocAndAdd ( disks , raidPtr - > numRow , sizeof ( RF_RaidDisk_t * ) ,
( RF_RaidDisk_t * * ) , raidPtr - > cleanupList ) ;
1999-02-05 03:06:06 +03:00
if ( disks = = NULL ) {
ret = ENOMEM ;
goto fail ;
}
raidPtr - > Disks = disks ;
/* get space for the device-specific stuff... */
RF_CallocAndAdd ( raidPtr - > raid_cinfo , raidPtr - > numRow ,
sizeof ( struct raidcinfo * ) , ( struct raidcinfo * * ) ,
raidPtr - > cleanupList ) ;
if ( raidPtr - > raid_cinfo = = NULL ) {
ret = ENOMEM ;
goto fail ;
}
for ( r = 0 ; r < raidPtr - > numRow ; r + + ) {
numFailuresThisRow = 0 ;
1999-02-24 03:00:03 +03:00
/* We allocate RF_MAXSPARE on the first row so that we
have room to do hot - swapping of spares */
RF_CallocAndAdd ( disks [ r ] , raidPtr - > numCol
+ ( ( r = = 0 ) ? RF_MAXSPARE : 0 ) ,
sizeof ( RF_RaidDisk_t ) , ( RF_RaidDisk_t * ) ,
raidPtr - > cleanupList ) ;
1999-02-05 03:06:06 +03:00
if ( disks [ r ] = = NULL ) {
ret = ENOMEM ;
goto fail ;
}
/* get more space for device specific stuff.. */
RF_CallocAndAdd ( raidPtr - > raid_cinfo [ r ] ,
raidPtr - > numCol + ( ( r = = 0 ) ? raidPtr - > numSpare : 0 ) ,
sizeof ( struct raidcinfo ) , ( struct raidcinfo * ) ,
1998-11-13 07:20:26 +03:00
raidPtr - > cleanupList ) ;
1999-02-05 03:06:06 +03:00
if ( raidPtr - > raid_cinfo [ r ] = = NULL ) {
ret = ENOMEM ;
goto fail ;
}
for ( c = 0 ; c < raidPtr - > numCol ; c + + ) {
1999-02-24 03:00:03 +03:00
ret = rf_ConfigureDisk ( raidPtr ,
& cfgPtr - > devnames [ r ] [ c ] [ 0 ] ,
& disks [ r ] [ c ] , r , c ) ;
1999-02-05 03:06:06 +03:00
if ( ret )
goto fail ;
1999-03-02 06:18:48 +03:00
1999-02-24 03:00:03 +03:00
if ( disks [ r ] [ c ] . status = = rf_ds_optimal ) {
raidread_component_label (
raidPtr - > raid_cinfo [ r ] [ c ] . ci_dev ,
raidPtr - > raid_cinfo [ r ] [ c ] . ci_vp ,
& raidPtr - > raid_cinfo [ r ] [ c ] . ci_label ) ;
}
1999-03-02 06:18:48 +03:00
1999-02-05 03:06:06 +03:00
if ( disks [ r ] [ c ] . status ! = rf_ds_optimal ) {
numFailuresThisRow + + ;
} else {
if ( disks [ r ] [ c ] . numBlocks < min_numblks )
min_numblks = disks [ r ] [ c ] . numBlocks ;
DPRINTF7 ( " Disk at row %d col %d: dev %s numBlocks %ld blockSize %d (%ld MB) \n " ,
r , c , disks [ r ] [ c ] . devname ,
( long int ) disks [ r ] [ c ] . numBlocks ,
disks [ r ] [ c ] . blockSize ,
1999-02-24 03:00:03 +03:00
( long int ) disks [ r ] [ c ] . numBlocks *
disks [ r ] [ c ] . blockSize / 1024 / 1024 ) ;
1999-02-05 03:06:06 +03:00
}
num_cols_done + + ;
}
/* XXX fix for n-fault tolerant */
1999-02-24 03:00:03 +03:00
/* XXX this should probably check to see how many failures
we can handle for this configuration ! */
1999-02-05 03:06:06 +03:00
if ( numFailuresThisRow > 0 )
raidPtr - > status [ r ] = rf_rs_degraded ;
num_rows_done + + ;
}
1999-02-24 03:00:03 +03:00
1999-02-05 03:06:06 +03:00
/* all disks must be the same size & have the same block size, bs must
* be a power of 2 */
bs = 0 ;
for ( foundone = r = 0 ; ! foundone & & r < raidPtr - > numRow ; r + + ) {
for ( c = 0 ; ! foundone & & c < raidPtr - > numCol ; c + + ) {
if ( disks [ r ] [ c ] . status = = rf_ds_optimal ) {
bs = disks [ r ] [ c ] . blockSize ;
foundone = 1 ;
}
}
}
if ( ! foundone ) {
RF_ERRORMSG ( " RAIDFRAME: Did not find any live disks in the array. \n " ) ;
ret = EINVAL ;
goto fail ;
}
for ( count = 0 , i = 1 ; i ; i < < = 1 )
if ( bs & i )
count + + ;
if ( count ! = 1 ) {
RF_ERRORMSG1 ( " Error: block size on disks (%d) must be a power of 2 \n " , bs ) ;
ret = EINVAL ;
goto fail ;
1998-11-13 07:20:26 +03:00
}
1999-02-24 03:00:03 +03:00
if ( rf_CheckLabels ( raidPtr , cfgPtr ) ) {
1999-03-02 06:18:48 +03:00
printf ( " raid%d: There were fatal errors \n " , raidPtr - > raidid ) ;
if ( force ! = 0 ) {
printf ( " raid%d: Fatal errors being ignored. \n " ,
raidPtr - > raidid ) ;
} else {
ret = EINVAL ;
goto fail ;
}
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
1999-02-05 03:06:06 +03:00
for ( r = 0 ; r < raidPtr - > numRow ; r + + ) {
for ( c = 0 ; c < raidPtr - > numCol ; c + + ) {
if ( disks [ r ] [ c ] . status = = rf_ds_optimal ) {
if ( disks [ r ] [ c ] . blockSize ! = bs ) {
RF_ERRORMSG2 ( " Error: block size of disk at r %d c %d different from disk at r 0 c 0 \n " , r , c ) ;
ret = EINVAL ;
goto fail ;
}
if ( disks [ r ] [ c ] . numBlocks ! = min_numblks ) {
RF_ERRORMSG3 ( " WARNING: truncating disk at r %d c %d to %d blocks \n " ,
r , c , ( int ) min_numblks ) ;
disks [ r ] [ c ] . numBlocks = min_numblks ;
}
}
}
1998-11-13 07:20:26 +03:00
}
1999-02-05 03:06:06 +03:00
raidPtr - > sectorsPerDisk = min_numblks ;
raidPtr - > logBytesPerSector = ffs ( bs ) - 1 ;
raidPtr - > bytesPerSector = bs ;
raidPtr - > sectorMask = bs - 1 ;
return ( 0 ) ;
1998-11-13 07:20:26 +03:00
fail :
1999-02-24 03:00:03 +03:00
rf_UnconfigureVnodes ( raidPtr ) ;
1998-11-13 07:20:26 +03:00
1999-02-05 03:06:06 +03:00
return ( ret ) ;
1998-11-13 07:20:26 +03:00
}
1999-02-24 03:00:03 +03:00
/****************************************************************************
1998-11-13 07:20:26 +03:00
* set up the data structures describing the spare disks in the array
* recall from the above comment that the spare disk descriptors are stored
* in row zero , which is specially expanded to hold them .
1999-02-24 03:00:03 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-05 03:06:06 +03:00
int
1999-02-24 03:00:03 +03:00
rf_ConfigureSpareDisks ( listp , raidPtr , cfgPtr )
RF_ShutdownList_t * * listp ;
RF_Raid_t * raidPtr ;
RF_Config_t * cfgPtr ;
1998-11-13 07:20:26 +03:00
{
1999-02-24 03:00:03 +03:00
int i , ret ;
unsigned int bs ;
1999-02-05 03:06:06 +03:00
RF_RaidDisk_t * disks ;
int num_spares_done ;
1998-11-13 07:20:26 +03:00
1999-02-05 03:06:06 +03:00
num_spares_done = 0 ;
/* The space for the spares should have already been allocated by
* ConfigureDisks ( ) */
disks = & raidPtr - > Disks [ 0 ] [ raidPtr - > numCol ] ;
for ( i = 0 ; i < raidPtr - > numSpare ; i + + ) {
ret = rf_ConfigureDisk ( raidPtr , & cfgPtr - > spare_names [ i ] [ 0 ] ,
1999-02-24 03:00:03 +03:00
& disks [ i ] , 0 , raidPtr - > numCol + i ) ;
1999-02-05 03:06:06 +03:00
if ( ret )
goto fail ;
if ( disks [ i ] . status ! = rf_ds_optimal ) {
1999-02-24 03:00:03 +03:00
RF_ERRORMSG1 ( " Warning: spare disk %s failed TUR \n " ,
& cfgPtr - > spare_names [ i ] [ 0 ] ) ;
1999-02-05 03:06:06 +03:00
} else {
disks [ i ] . status = rf_ds_spare ; /* change status to
* spare */
DPRINTF6 ( " Spare Disk %d: dev %s numBlocks %ld blockSize %d (%ld MB) \n " , i ,
disks [ i ] . devname ,
( long int ) disks [ i ] . numBlocks , disks [ i ] . blockSize ,
1999-02-24 03:00:03 +03:00
( long int ) disks [ i ] . numBlocks *
disks [ i ] . blockSize / 1024 / 1024 ) ;
1999-02-05 03:06:06 +03:00
}
num_spares_done + + ;
}
1998-11-13 07:20:26 +03:00
1999-02-05 03:06:06 +03:00
/* check sizes and block sizes on spare disks */
bs = 1 < < raidPtr - > logBytesPerSector ;
for ( i = 0 ; i < raidPtr - > numSpare ; i + + ) {
if ( disks [ i ] . blockSize ! = bs ) {
RF_ERRORMSG3 ( " Block size of %d on spare disk %s is not the same as on other disks (%d) \n " , disks [ i ] . blockSize , disks [ i ] . devname , bs ) ;
ret = EINVAL ;
goto fail ;
}
if ( disks [ i ] . numBlocks < raidPtr - > sectorsPerDisk ) {
RF_ERRORMSG3 ( " Spare disk %s (%d blocks) is too small to serve as a spare (need %ld blocks) \n " ,
1999-02-24 03:00:03 +03:00
disks [ i ] . devname , disks [ i ] . blockSize ,
( long int ) raidPtr - > sectorsPerDisk ) ;
1999-02-05 03:06:06 +03:00
ret = EINVAL ;
goto fail ;
} else
if ( disks [ i ] . numBlocks > raidPtr - > sectorsPerDisk ) {
RF_ERRORMSG2 ( " Warning: truncating spare disk %s to %ld blocks \n " , disks [ i ] . devname , ( long int ) raidPtr - > sectorsPerDisk ) ;
disks [ i ] . numBlocks = raidPtr - > sectorsPerDisk ;
}
}
return ( 0 ) ;
1998-11-13 07:20:26 +03:00
fail :
1999-02-05 03:06:06 +03:00
/* Release the hold on the main components. We've failed to allocate
1999-02-24 03:00:03 +03:00
* a spare , and since we ' re failing , we need to free things . .
XXX failing to allocate a spare is * not * that big of a deal . . .
We * can * survive without it , if need be , esp . if we get hot
adding working .
1998-11-13 07:20:26 +03:00
1999-02-24 03:00:03 +03:00
If we don ' t fail out here , then we need a way to remove this spare . . .
that should be easier to do here than if we are " live " . . .
1998-11-13 07:20:26 +03:00
1999-02-24 03:00:03 +03:00
*/
1998-11-13 07:20:26 +03:00
1999-02-24 03:00:03 +03:00
rf_UnconfigureVnodes ( raidPtr ) ;
1998-11-13 07:20:26 +03:00
1999-02-05 03:06:06 +03:00
return ( ret ) ;
1998-11-13 07:20:26 +03:00
}
/* configure a single disk in the array */
1999-02-05 03:06:06 +03:00
int
1999-02-24 03:00:03 +03:00
rf_ConfigureDisk ( raidPtr , buf , diskPtr , row , col )
RF_Raid_t * raidPtr ;
1999-02-05 03:06:06 +03:00
char * buf ;
RF_RaidDisk_t * diskPtr ;
RF_RowCol_t row ;
RF_RowCol_t col ;
1998-11-13 07:20:26 +03:00
{
1999-02-05 03:06:06 +03:00
char * p ;
int retcode ;
1998-11-13 07:20:26 +03:00
struct partinfo dpart ;
struct vnode * vp ;
struct vattr va ;
struct proc * proc ;
1999-02-05 03:06:06 +03:00
int error ;
1998-11-13 07:20:26 +03:00
1999-02-05 03:06:06 +03:00
retcode = 0 ;
p = rf_find_non_white ( buf ) ;
if ( p [ strlen ( p ) - 1 ] = = ' \n ' ) {
/* strip off the newline */
p [ strlen ( p ) - 1 ] = ' \0 ' ;
}
( void ) strcpy ( diskPtr - > devname , p ) ;
1998-11-13 07:20:26 +03:00
1999-08-14 07:10:03 +04:00
proc = raidPtr - > engine_thread ;
1999-02-05 03:06:06 +03:00
/* Let's start by claiming the component is fine and well... */
diskPtr - > status = rf_ds_optimal ;
raidPtr - > raid_cinfo [ row ] [ col ] . ci_vp = NULL ;
raidPtr - > raid_cinfo [ row ] [ col ] . ci_dev = NULL ;
error = raidlookup ( diskPtr - > devname , proc , & vp ) ;
if ( error ) {
printf ( " raidlookup on device: %s failed! \n " , diskPtr - > devname ) ;
if ( error = = ENXIO ) {
1999-02-24 03:00:03 +03:00
/* the component isn't there... must be dead :-( */
1999-02-05 03:06:06 +03:00
diskPtr - > status = rf_ds_failed ;
} else {
return ( error ) ;
}
}
if ( diskPtr - > status = = rf_ds_optimal ) {
if ( ( error = VOP_GETATTR ( vp , & va , proc - > p_ucred , proc ) ) ! = 0 ) {
return ( error ) ;
}
error = VOP_IOCTL ( vp , DIOCGPART , ( caddr_t ) & dpart ,
1999-02-24 03:00:03 +03:00
FREAD , proc - > p_ucred , proc ) ;
1999-02-05 03:06:06 +03:00
if ( error ) {
return ( error ) ;
}
1999-02-24 03:00:03 +03:00
1999-02-05 03:06:06 +03:00
diskPtr - > blockSize = dpart . disklab - > d_secsize ;
1999-02-24 03:00:03 +03:00
1999-02-05 03:06:06 +03:00
diskPtr - > numBlocks = dpart . part - > p_size - rf_protectedSectors ;
1999-02-24 03:00:03 +03:00
1999-02-05 03:06:06 +03:00
raidPtr - > raid_cinfo [ row ] [ col ] . ci_vp = vp ;
raidPtr - > raid_cinfo [ row ] [ col ] . ci_dev = va . va_rdev ;
1999-02-24 03:00:03 +03:00
diskPtr - > dev = va . va_rdev ;
1999-02-05 03:06:06 +03:00
/* we allow the user to specify that only a fraction of the
* disks should be used this is just for debug : it speeds up
* the parity scan */
1999-02-24 03:00:03 +03:00
diskPtr - > numBlocks = diskPtr - > numBlocks *
rf_sizePercentage / 100 ;
}
return ( 0 ) ;
}
1999-03-02 06:18:48 +03:00
static void rf_print_label_status ( RF_Raid_t * , int , int , char * ,
RF_ComponentLabel_t * ) ;
static void
rf_print_label_status ( raidPtr , row , column , dev_name , ci_label )
RF_Raid_t * raidPtr ;
int row ;
int column ;
char * dev_name ;
RF_ComponentLabel_t * ci_label ;
{
printf ( " raid%d: Component %s being configured at row: %d col: %d \n " ,
raidPtr - > raidid , dev_name , row , column ) ;
printf ( " Row: %d Column: %d Num Rows: %d Num Columns: %d \n " ,
ci_label - > row , ci_label - > column ,
ci_label - > num_rows , ci_label - > num_columns ) ;
printf ( " Version: %d Serial Number: %d Mod Counter: %d \n " ,
ci_label - > version , ci_label - > serial_number ,
ci_label - > mod_counter ) ;
1999-08-11 02:56:20 +04:00
printf ( " Clean: %s Status: %d \n " ,
ci_label - > clean ? " Yes " : " No " , ci_label - > status ) ;
1999-03-02 06:18:48 +03:00
}
static int rf_check_label_vitals ( RF_Raid_t * , int , int , char * ,
RF_ComponentLabel_t * , int , int ) ;
static int rf_check_label_vitals ( raidPtr , row , column , dev_name , ci_label ,
serial_number , mod_counter )
RF_Raid_t * raidPtr ;
int row ;
int column ;
char * dev_name ;
RF_ComponentLabel_t * ci_label ;
int serial_number ;
int mod_counter ;
{
int fatal_error = 0 ;
if ( serial_number ! = ci_label - > serial_number ) {
printf ( " %s has a different serial number: %d %d \n " ,
dev_name , serial_number , ci_label - > serial_number ) ;
fatal_error = 1 ;
}
if ( mod_counter ! = ci_label - > mod_counter ) {
printf ( " %s has a different modfication count: %d %d \n " ,
dev_name , mod_counter , ci_label - > mod_counter ) ;
}
if ( row ! = ci_label - > row ) {
printf ( " Row out of alignment for: %s \n " , dev_name ) ;
fatal_error = 1 ;
}
if ( column ! = ci_label - > column ) {
printf ( " Column out of alignment for: %s \n " , dev_name ) ;
fatal_error = 1 ;
}
if ( raidPtr - > numRow ! = ci_label - > num_rows ) {
printf ( " Number of rows do not match for: %s \n " , dev_name ) ;
fatal_error = 1 ;
}
if ( raidPtr - > numCol ! = ci_label - > num_columns ) {
printf ( " Number of columns do not match for: %s \n " , dev_name ) ;
fatal_error = 1 ;
}
if ( ci_label - > clean = = 0 ) {
/* it's not clean, but that's not fatal */
printf ( " %s is not clean! \n " , dev_name ) ;
}
return ( fatal_error ) ;
}
1999-02-24 03:00:03 +03:00
/*
1998-11-13 07:20:26 +03:00
1999-02-24 03:00:03 +03:00
rf_CheckLabels ( ) - check all the component labels for consistency .
Return an error if there is anything major amiss .
*/
int
rf_CheckLabels ( raidPtr , cfgPtr )
RF_Raid_t * raidPtr ;
RF_Config_t * cfgPtr ;
{
int r , c ;
char * dev_name ;
RF_ComponentLabel_t * ci_label ;
int serial_number = 0 ;
1999-03-02 06:18:48 +03:00
int mod_number = 0 ;
1999-02-24 03:00:03 +03:00
int fatal_error = 0 ;
1999-03-02 06:18:48 +03:00
int mod_values [ 4 ] ;
int mod_count [ 4 ] ;
int ser_values [ 4 ] ;
int ser_count [ 4 ] ;
int num_ser ;
int num_mod ;
int i ;
int found ;
int hosed_row ;
int hosed_column ;
int too_fatal ;
int parity_good ;
int force ;
hosed_row = - 1 ;
hosed_column = - 1 ;
too_fatal = 0 ;
force = cfgPtr - > force ;
/*
We ' re going to try to be a little intelligent here . If one
component ' s label is bogus , and we can identify that it ' s the
* only * one that ' s gone , we ' ll mark it as " failed " and allow
the configuration to proceed . This will be the * only * case
that we ' ll proceed if there would be ( otherwise ) fatal errors .
Basically we simply keep a count of how many components had
what serial number . If all but one agree , we simply mark
the disagreeing component as being failed , and allow
things to come up " normally " .
We do this first for serial numbers , and then for " mod_counter " .
1999-02-24 03:00:03 +03:00
1999-03-02 06:18:48 +03:00
*/
num_ser = 0 ;
num_mod = 0 ;
for ( r = 0 ; r < raidPtr - > numRow & & ! fatal_error ; r + + ) {
1999-02-24 03:00:03 +03:00
for ( c = 0 ; c < raidPtr - > numCol ; c + + ) {
ci_label = & raidPtr - > raid_cinfo [ r ] [ c ] . ci_label ;
1999-03-02 06:18:48 +03:00
found = 0 ;
for ( i = 0 ; i < num_ser ; i + + ) {
if ( ser_values [ i ] = = ci_label - > serial_number ) {
ser_count [ i ] + + ;
found = 1 ;
break ;
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
}
if ( ! found ) {
ser_values [ num_ser ] = ci_label - > serial_number ;
ser_count [ num_ser ] = 1 ;
num_ser + + ;
if ( num_ser > 2 ) {
1999-02-24 03:00:03 +03:00
fatal_error = 1 ;
1999-03-02 06:18:48 +03:00
break ;
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
}
found = 0 ;
for ( i = 0 ; i < num_mod ; i + + ) {
if ( mod_values [ i ] = = ci_label - > mod_counter ) {
mod_count [ i ] + + ;
found = 1 ;
break ;
1999-02-24 03:00:03 +03:00
}
}
1999-03-02 06:18:48 +03:00
if ( ! found ) {
mod_values [ num_mod ] = ci_label - > mod_counter ;
mod_count [ num_mod ] = 1 ;
num_mod + + ;
if ( num_mod > 2 ) {
fatal_error = 1 ;
break ;
}
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
}
}
# if DEBUG
printf ( " raid%d: Summary of serial numbers: \n " , raidPtr - > raidid ) ;
for ( i = 0 ; i < num_ser ; i + + ) {
printf ( " %d %d \n " , ser_values [ i ] , ser_count [ i ] ) ;
}
printf ( " raid%d: Summary of mod counters: \n " , raidPtr - > raidid ) ;
for ( i = 0 ; i < num_mod ; i + + ) {
printf ( " %d %d \n " , mod_values [ i ] , mod_count [ i ] ) ;
}
# endif
serial_number = ser_values [ 0 ] ;
if ( num_ser = = 2 ) {
if ( ( ser_count [ 0 ] = = 1 ) | | ( ser_count [ 1 ] = = 1 ) ) {
/* Locate the maverick component */
if ( ser_count [ 1 ] > ser_count [ 0 ] ) {
serial_number = ser_values [ 1 ] ;
}
for ( r = 0 ; r < raidPtr - > numRow ; r + + ) {
for ( c = 0 ; c < raidPtr - > numCol ; c + + ) {
ci_label = & raidPtr - > raid_cinfo [ r ] [ c ] . ci_label ;
if ( serial_number ! =
ci_label - > serial_number ) {
hosed_row = r ;
hosed_column = c ;
break ;
}
}
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
printf ( " Hosed component: %s \n " ,
& cfgPtr - > devnames [ hosed_row ] [ hosed_column ] [ 0 ] ) ;
if ( ! force ) {
/* we'll fail this component, as if there are
other major errors , we arn ' t forcing things
and we ' ll abort the config anyways */
raidPtr - > Disks [ hosed_row ] [ hosed_column ] . status
= rf_ds_failed ;
raidPtr - > numFailures + + ;
raidPtr - > status [ hosed_row ] = rf_rs_degraded ;
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
} else {
too_fatal = 1 ;
}
if ( cfgPtr - > parityConfig = = ' 0 ' ) {
/* We've identified two different serial numbers.
RAID 0 can ' t cope with that , so we ' ll punt */
too_fatal = 1 ;
}
}
/* record the serial number for later. If we bail later, setting
this doesn ' t matter , otherwise we ' ve got the best guess at the
correct serial number */
raidPtr - > serial_number = serial_number ;
mod_number = mod_values [ 0 ] ;
if ( num_mod = = 2 ) {
if ( ( mod_count [ 0 ] = = 1 ) | | ( mod_count [ 1 ] = = 1 ) ) {
/* Locate the maverick component */
if ( mod_count [ 1 ] > mod_count [ 0 ] ) {
mod_number = mod_values [ 1 ] ;
1999-03-18 06:02:38 +03:00
} else if ( mod_count [ 1 ] < mod_count [ 0 ] ) {
mod_number = mod_values [ 0 ] ;
} else {
/* counts of different modification values
are the same . Assume greater value is
the correct one , all other things
considered */
if ( mod_values [ 0 ] > mod_values [ 1 ] ) {
mod_number = mod_values [ 0 ] ;
} else {
mod_number = mod_values [ 1 ] ;
}
}
1999-03-02 06:18:48 +03:00
for ( r = 0 ; r < raidPtr - > numRow & & ! too_fatal ; r + + ) {
for ( c = 0 ; c < raidPtr - > numCol ; c + + ) {
ci_label = & raidPtr - > raid_cinfo [ r ] [ c ] . ci_label ;
if ( mod_number ! =
ci_label - > mod_counter ) {
if ( ( hosed_row = = r ) & &
( hosed_column = = c ) ) {
/* same one. Can
deal with it . */
} else {
hosed_row = r ;
hosed_column = c ;
if ( num_ser ! = 1 ) {
too_fatal = 1 ;
break ;
}
}
}
}
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
printf ( " Hosed component: %s \n " ,
& cfgPtr - > devnames [ hosed_row ] [ hosed_column ] [ 0 ] ) ;
if ( ! force ) {
/* we'll fail this component, as if there are
other major errors , we arn ' t forcing things
and we ' ll abort the config anyways */
1999-06-04 05:50:01 +04:00
if ( raidPtr - > Disks [ hosed_row ] [ hosed_column ] . status ! = rf_ds_failed ) {
raidPtr - > Disks [ hosed_row ] [ hosed_column ] . status
= rf_ds_failed ;
raidPtr - > numFailures + + ;
raidPtr - > status [ hosed_row ] = rf_rs_degraded ;
}
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
} else {
too_fatal = 1 ;
}
if ( cfgPtr - > parityConfig = = ' 0 ' ) {
/* We've identified two different mod counters.
RAID 0 can ' t cope with that , so we ' ll punt */
too_fatal = 1 ;
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
}
raidPtr - > mod_counter = mod_number ;
if ( too_fatal ) {
/* we've had both a serial number mismatch, and a mod_counter
mismatch - - and they involved two different components ! !
Bail - - make things fail so that the user must force
the issue . . . */
hosed_row = - 1 ;
hosed_column = - 1 ;
1999-02-24 03:00:03 +03:00
}
1999-03-02 06:18:48 +03:00
if ( num_ser > 2 ) {
printf ( " raid%d: Too many different serial numbers! \n " ,
raidPtr - > raidid ) ;
}
if ( num_mod > 2 ) {
printf ( " raid%d: Too many different mod counters! \n " ,
raidPtr - > raidid ) ;
}
/* we start by assuming the parity will be good, and flee from
that notion at the slightest sign of trouble */
parity_good = RF_RAID_CLEAN ;
for ( r = 0 ; r < raidPtr - > numRow ; r + + ) {
for ( c = 0 ; c < raidPtr - > numCol ; c + + ) {
dev_name = & cfgPtr - > devnames [ r ] [ c ] [ 0 ] ;
ci_label = & raidPtr - > raid_cinfo [ r ] [ c ] . ci_label ;
if ( ( r = = hosed_row ) & & ( c = = hosed_column ) ) {
printf ( " raid%d: Ignoring %s \n " ,
raidPtr - > raidid , dev_name ) ;
} else {
rf_print_label_status ( raidPtr , r , c ,
dev_name , ci_label ) ;
if ( rf_check_label_vitals ( raidPtr , r , c ,
dev_name , ci_label ,
serial_number ,
mod_number ) ) {
fatal_error = 1 ;
}
if ( ci_label - > clean ! = RF_RAID_CLEAN ) {
parity_good = RF_RAID_DIRTY ;
}
}
}
}
if ( fatal_error ) {
parity_good = RF_RAID_DIRTY ;
}
/* we note the state of the parity */
raidPtr - > parity_good = parity_good ;
1999-02-24 03:00:03 +03:00
return ( fatal_error ) ;
}
1999-06-04 05:50:01 +04:00
int config_disk_queue ( RF_Raid_t * , RF_DiskQueue_t * , RF_RowCol_t ,
RF_RowCol_t , RF_DiskQueueSW_t * ,
RF_SectorCount_t , dev_t , int ,
RF_ShutdownList_t * * ,
RF_AllocListElem_t * ) ;
1999-03-02 06:18:48 +03:00
int rf_add_hot_spare ( RF_Raid_t * , RF_SingleComponent_t * ) ;
1999-02-24 03:00:03 +03:00
int
rf_add_hot_spare ( raidPtr , sparePtr )
RF_Raid_t * raidPtr ;
1999-03-02 06:18:48 +03:00
RF_SingleComponent_t * sparePtr ;
1999-02-24 03:00:03 +03:00
{
RF_RaidDisk_t * disks ;
1999-06-04 05:50:01 +04:00
RF_DiskQueue_t * spareQueues ;
1999-02-24 03:00:03 +03:00
int ret ;
unsigned int bs ;
int spare_number ;
printf ( " Just in rf_add_hot_spare: %d \n " , raidPtr - > numSpare ) ;
printf ( " Num col: %d \n " , raidPtr - > numCol ) ;
if ( raidPtr - > numSpare > = RF_MAXSPARE ) {
RF_ERRORMSG1 ( " Too many spares: %d \n " , raidPtr - > numSpare ) ;
return ( EINVAL ) ;
1999-02-05 03:06:06 +03:00
}
1999-06-04 05:50:01 +04:00
1999-06-04 06:02:39 +04:00
RF_LOCK_MUTEX ( raidPtr - > mutex ) ;
1999-02-24 03:00:03 +03:00
/* the beginning of the spares... */
disks = & raidPtr - > Disks [ 0 ] [ raidPtr - > numCol ] ;
spare_number = raidPtr - > numSpare ;
1999-03-02 06:18:48 +03:00
ret = rf_ConfigureDisk ( raidPtr , sparePtr - > component_name ,
1999-02-24 03:00:03 +03:00
& disks [ spare_number ] , 0 ,
raidPtr - > numCol + spare_number ) ;
if ( ret )
goto fail ;
if ( disks [ spare_number ] . status ! = rf_ds_optimal ) {
RF_ERRORMSG1 ( " Warning: spare disk %s failed TUR \n " ,
1999-03-02 06:18:48 +03:00
sparePtr - > component_name ) ;
1999-02-24 03:00:03 +03:00
ret = EINVAL ;
goto fail ;
} else {
disks [ spare_number ] . status = rf_ds_spare ;
DPRINTF6 ( " Spare Disk %d: dev %s numBlocks %ld blockSize %d (%ld MB) \n " , spare_number ,
disks [ spare_number ] . devname ,
( long int ) disks [ spare_number ] . numBlocks ,
disks [ spare_number ] . blockSize ,
( long int ) disks [ spare_number ] . numBlocks *
disks [ spare_number ] . blockSize / 1024 / 1024 ) ;
}
/* check sizes and block sizes on the spare disk */
bs = 1 < < raidPtr - > logBytesPerSector ;
if ( disks [ spare_number ] . blockSize ! = bs ) {
RF_ERRORMSG3 ( " Block size of %d on spare disk %s is not the same as on other disks (%d) \n " , disks [ spare_number ] . blockSize , disks [ spare_number ] . devname , bs ) ;
ret = EINVAL ;
goto fail ;
}
if ( disks [ spare_number ] . numBlocks < raidPtr - > sectorsPerDisk ) {
RF_ERRORMSG3 ( " Spare disk %s (%d blocks) is too small to serve as a spare (need %ld blocks) \n " ,
disks [ spare_number ] . devname ,
disks [ spare_number ] . blockSize ,
( long int ) raidPtr - > sectorsPerDisk ) ;
ret = EINVAL ;
goto fail ;
} else {
if ( disks [ spare_number ] . numBlocks >
raidPtr - > sectorsPerDisk ) {
RF_ERRORMSG2 ( " Warning: truncating spare disk %s to %ld blocks \n " , disks [ spare_number ] . devname ,
( long int ) raidPtr - > sectorsPerDisk ) ;
disks [ spare_number ] . numBlocks = raidPtr - > sectorsPerDisk ;
}
}
1999-06-04 05:50:01 +04:00
spareQueues = & raidPtr - > Queues [ 0 ] [ raidPtr - > numCol ] ;
ret = config_disk_queue ( raidPtr , & spareQueues [ spare_number ] ,
0 , raidPtr - > numCol + spare_number ,
raidPtr - > Queues [ 0 ] [ 0 ] . qPtr , /* XXX */
raidPtr - > sectorsPerDisk ,
raidPtr - > Disks [ 0 ] [ raidPtr - > numCol + spare_number ] . dev ,
raidPtr - > Queues [ 0 ] [ 0 ] . maxOutstanding , /* XXX */
& raidPtr - > shutdownList ,
raidPtr - > cleanupList ) ;
1999-02-24 03:00:03 +03:00
1999-06-04 05:50:01 +04:00
raidPtr - > numSpare + + ;
1999-06-04 06:02:39 +04:00
RF_UNLOCK_MUTEX ( raidPtr - > mutex ) ;
1999-02-05 03:06:06 +03:00
return ( 0 ) ;
1999-02-24 03:00:03 +03:00
fail :
1999-06-04 06:02:39 +04:00
RF_UNLOCK_MUTEX ( raidPtr - > mutex ) ;
1999-02-24 03:00:03 +03:00
return ( ret ) ;
}
int
rf_remove_hot_spare ( raidPtr , sparePtr )
RF_Raid_t * raidPtr ;
1999-03-02 06:18:48 +03:00
RF_SingleComponent_t * sparePtr ;
1999-02-24 03:00:03 +03:00
{
int spare_number ;
if ( raidPtr - > numSpare = = 0 ) {
printf ( " No spares to remove! \n " ) ;
return ( EINVAL ) ;
}
1999-03-02 06:18:48 +03:00
spare_number = sparePtr - > column ;
1999-02-24 03:00:03 +03:00
return ( EINVAL ) ; /* XXX not implemented yet */
#if 0
if ( spare_number < 0 | | spare_number > raidPtr - > numSpare ) {
return ( EINVAL ) ;
}
/* verify that this spare isn't in use... */
/* it's gone.. */
raidPtr - > numSpare - - ;
return ( 0 ) ;
# endif
1998-11-13 07:20:26 +03:00
}
1999-02-24 03:00:03 +03:00