raid5-cache: IO error handling
There are 3 places the raid5-cache dispatches IO. The discard IO error doesn't matter, so we ignore it. The superblock write IO error can be handled in MD core. The remaining are log write and flush. When the IO error happens, we mark log disk faulty and fail all write IO. Read IO is still allowed to run. Userspace will get a notification too and corresponding daemon can choose setting raid array readonly for example. Signed-off-by: Shaohua Li <shli@fb.com> Signed-off-by: NeilBrown <neilb@suse.com>
This commit is contained in:
parent
c2bb6242ec
commit
6e74a9cfb5
|
@ -190,7 +190,6 @@ static void r5l_io_run_stripes(struct r5l_io_unit *io)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/* XXX: totally ignores I/O errors */
|
|
||||||
static void r5l_log_run_stripes(struct r5l_log *log)
|
static void r5l_log_run_stripes(struct r5l_log *log)
|
||||||
{
|
{
|
||||||
struct r5l_io_unit *io, *next;
|
struct r5l_io_unit *io, *next;
|
||||||
|
@ -213,6 +212,9 @@ static void r5l_log_endio(struct bio *bio)
|
||||||
struct r5l_log *log = io->log;
|
struct r5l_log *log = io->log;
|
||||||
unsigned long flags;
|
unsigned long flags;
|
||||||
|
|
||||||
|
if (bio->bi_error)
|
||||||
|
md_error(log->rdev->mddev, log->rdev);
|
||||||
|
|
||||||
bio_put(bio);
|
bio_put(bio);
|
||||||
|
|
||||||
spin_lock_irqsave(&log->io_list_lock, flags);
|
spin_lock_irqsave(&log->io_list_lock, flags);
|
||||||
|
@ -598,6 +600,9 @@ static void r5l_log_flush_endio(struct bio *bio)
|
||||||
unsigned long flags;
|
unsigned long flags;
|
||||||
struct r5l_io_unit *io;
|
struct r5l_io_unit *io;
|
||||||
|
|
||||||
|
if (bio->bi_error)
|
||||||
|
md_error(log->rdev->mddev, log->rdev);
|
||||||
|
|
||||||
spin_lock_irqsave(&log->io_list_lock, flags);
|
spin_lock_irqsave(&log->io_list_lock, flags);
|
||||||
list_for_each_entry(io, &log->flushing_ios, log_sibling)
|
list_for_each_entry(io, &log->flushing_ios, log_sibling)
|
||||||
r5l_io_run_stripes(io);
|
r5l_io_run_stripes(io);
|
||||||
|
@ -684,6 +689,7 @@ static void r5l_write_super_and_discard_space(struct r5l_log *log,
|
||||||
md_update_sb(mddev, 1);
|
md_update_sb(mddev, 1);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* discard IO error really doesn't matter, ignore it */
|
||||||
if (log->last_checkpoint < end) {
|
if (log->last_checkpoint < end) {
|
||||||
blkdev_issue_discard(bdev,
|
blkdev_issue_discard(bdev,
|
||||||
log->last_checkpoint + log->rdev->data_offset,
|
log->last_checkpoint + log->rdev->data_offset,
|
||||||
|
@ -798,6 +804,13 @@ void r5l_quiesce(struct r5l_log *log, int state)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool r5l_log_disk_error(struct r5conf *conf)
|
||||||
|
{
|
||||||
|
if (!conf->log)
|
||||||
|
return false;
|
||||||
|
return test_bit(Faulty, &conf->log->rdev->flags);
|
||||||
|
}
|
||||||
|
|
||||||
struct r5l_recovery_ctx {
|
struct r5l_recovery_ctx {
|
||||||
struct page *meta_page; /* current meta */
|
struct page *meta_page; /* current meta */
|
||||||
sector_t meta_total_blocks; /* total size of current meta and data */
|
sector_t meta_total_blocks; /* total size of current meta and data */
|
||||||
|
|
|
@ -3147,6 +3147,7 @@ handle_failed_stripe(struct r5conf *conf, struct stripe_head *sh,
|
||||||
* the data has not reached the cache yet.
|
* the data has not reached the cache yet.
|
||||||
*/
|
*/
|
||||||
if (!test_bit(R5_Wantfill, &sh->dev[i].flags) &&
|
if (!test_bit(R5_Wantfill, &sh->dev[i].flags) &&
|
||||||
|
s->failed > conf->max_degraded &&
|
||||||
(!test_bit(R5_Insync, &sh->dev[i].flags) ||
|
(!test_bit(R5_Insync, &sh->dev[i].flags) ||
|
||||||
test_bit(R5_ReadError, &sh->dev[i].flags))) {
|
test_bit(R5_ReadError, &sh->dev[i].flags))) {
|
||||||
spin_lock_irq(&sh->stripe_lock);
|
spin_lock_irq(&sh->stripe_lock);
|
||||||
|
@ -4015,6 +4016,7 @@ static void analyse_stripe(struct stripe_head *sh, struct stripe_head_state *s)
|
||||||
s->expanded = test_bit(STRIPE_EXPAND_READY, &sh->state) && !sh->batch_head;
|
s->expanded = test_bit(STRIPE_EXPAND_READY, &sh->state) && !sh->batch_head;
|
||||||
s->failed_num[0] = -1;
|
s->failed_num[0] = -1;
|
||||||
s->failed_num[1] = -1;
|
s->failed_num[1] = -1;
|
||||||
|
s->log_failed = r5l_log_disk_error(conf);
|
||||||
|
|
||||||
/* Now to look around and see what can be done */
|
/* Now to look around and see what can be done */
|
||||||
rcu_read_lock();
|
rcu_read_lock();
|
||||||
|
@ -4358,7 +4360,7 @@ static void handle_stripe(struct stripe_head *sh)
|
||||||
/* check if the array has lost more than max_degraded devices and,
|
/* check if the array has lost more than max_degraded devices and,
|
||||||
* if so, some requests might need to be failed.
|
* if so, some requests might need to be failed.
|
||||||
*/
|
*/
|
||||||
if (s.failed > conf->max_degraded) {
|
if (s.failed > conf->max_degraded || s.log_failed) {
|
||||||
sh->check_state = 0;
|
sh->check_state = 0;
|
||||||
sh->reconstruct_state = 0;
|
sh->reconstruct_state = 0;
|
||||||
break_stripe_batch_list(sh, 0);
|
break_stripe_batch_list(sh, 0);
|
||||||
|
|
|
@ -272,6 +272,7 @@ struct stripe_head_state {
|
||||||
struct bio_list return_bi;
|
struct bio_list return_bi;
|
||||||
struct md_rdev *blocked_rdev;
|
struct md_rdev *blocked_rdev;
|
||||||
int handle_bad_blocks;
|
int handle_bad_blocks;
|
||||||
|
int log_failed;
|
||||||
};
|
};
|
||||||
|
|
||||||
/* Flags for struct r5dev.flags */
|
/* Flags for struct r5dev.flags */
|
||||||
|
@ -631,4 +632,5 @@ extern void r5l_flush_stripe_to_raid(struct r5l_log *log);
|
||||||
extern void r5l_stripe_write_finished(struct stripe_head *sh);
|
extern void r5l_stripe_write_finished(struct stripe_head *sh);
|
||||||
extern int r5l_handle_flush_request(struct r5l_log *log, struct bio *bio);
|
extern int r5l_handle_flush_request(struct r5l_log *log, struct bio *bio);
|
||||||
extern void r5l_quiesce(struct r5l_log *log, int state);
|
extern void r5l_quiesce(struct r5l_log *log, int state);
|
||||||
|
extern bool r5l_log_disk_error(struct r5conf *conf);
|
||||||
#endif
|
#endif
|
||||||
|
|
Loading…
Reference in New Issue