123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442 |
- /* $OpenBSD: softraid_raid1.c,v 1.63 2015/07/21 03:30:51 krw Exp $ */
- /*
- * Copyright (c) 2007 Marco Peereboom <marco@peereboom.us>
- *
- * Permission to use, copy, modify, and distribute this software for any
- * purpose with or without fee is hereby granted, provided that the above
- * copyright notice and this permission notice appear in all copies.
- *
- * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
- * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
- * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
- * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
- * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
- * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
- * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
- */
- #include "bio.h"
- #include <sys/param.h>
- #include <sys/systm.h>
- #include <sys/buf.h>
- #include <sys/device.h>
- #include <sys/ioctl.h>
- #include <sys/malloc.h>
- #include <sys/kernel.h>
- #include <sys/disk.h>
- #include <sys/rwlock.h>
- #include <sys/queue.h>
- #include <sys/fcntl.h>
- #include <sys/mount.h>
- #include <sys/sensors.h>
- #include <sys/stat.h>
- #include <sys/task.h>
- #include <sys/conf.h>
- #include <sys/uio.h>
- #include <scsi/scsi_all.h>
- #include <scsi/scsiconf.h>
- #include <scsi/scsi_disk.h>
- #include <dev/softraidvar.h>
- /* RAID 1 functions. */
- int sr_raid1_create(struct sr_discipline *, struct bioc_createraid *,
- int, int64_t);
- int sr_raid1_assemble(struct sr_discipline *, struct bioc_createraid *,
- int, void *);
- int sr_raid1_init(struct sr_discipline *sd);
- int sr_raid1_rw(struct sr_workunit *);
- int sr_raid1_wu_done(struct sr_workunit *);
- void sr_raid1_set_chunk_state(struct sr_discipline *, int, int);
- void sr_raid1_set_vol_state(struct sr_discipline *);
- /* Discipline initialisation. */
- void
- sr_raid1_discipline_init(struct sr_discipline *sd)
- {
- /* Fill out discipline members. */
- sd->sd_type = SR_MD_RAID1;
- strlcpy(sd->sd_name, "RAID 1", sizeof(sd->sd_name));
- sd->sd_capabilities = SR_CAP_SYSTEM_DISK | SR_CAP_AUTO_ASSEMBLE |
- SR_CAP_REBUILD | SR_CAP_REDUNDANT;
- sd->sd_max_wu = SR_RAID1_NOWU;
- /* Setup discipline specific function pointers. */
- sd->sd_assemble = sr_raid1_assemble;
- sd->sd_create = sr_raid1_create;
- sd->sd_scsi_rw = sr_raid1_rw;
- sd->sd_scsi_wu_done = sr_raid1_wu_done;
- sd->sd_set_chunk_state = sr_raid1_set_chunk_state;
- sd->sd_set_vol_state = sr_raid1_set_vol_state;
- }
- int
- sr_raid1_create(struct sr_discipline *sd, struct bioc_createraid *bc,
- int no_chunk, int64_t coerced_size)
- {
- if (no_chunk < 2) {
- sr_error(sd->sd_sc, "%s requires two or more chunks",
- sd->sd_name);
- return EINVAL;
- }
- sd->sd_meta->ssdi.ssd_size = coerced_size;
- return sr_raid1_init(sd);
- }
- int
- sr_raid1_assemble(struct sr_discipline *sd, struct bioc_createraid *bc,
- int no_chunk, void *data)
- {
- return sr_raid1_init(sd);
- }
- int
- sr_raid1_init(struct sr_discipline *sd)
- {
- sd->sd_max_ccb_per_wu = sd->sd_meta->ssdi.ssd_chunk_no;
- return 0;
- }
- void
- sr_raid1_set_chunk_state(struct sr_discipline *sd, int c, int new_state)
- {
- int old_state, s;
- DNPRINTF(SR_D_STATE, "%s: %s: %s: sr_raid_set_chunk_state %d -> %d\n",
- DEVNAME(sd->sd_sc), sd->sd_meta->ssd_devname,
- sd->sd_vol.sv_chunks[c]->src_meta.scmi.scm_devname, c, new_state);
- /* ok to go to splbio since this only happens in error path */
- s = splbio();
- old_state = sd->sd_vol.sv_chunks[c]->src_meta.scm_status;
- /* multiple IOs to the same chunk that fail will come through here */
- if (old_state == new_state)
- goto done;
- switch (old_state) {
- case BIOC_SDONLINE:
- switch (new_state) {
- case BIOC_SDOFFLINE:
- case BIOC_SDSCRUB:
- break;
- default:
- goto die;
- }
- break;
- case BIOC_SDOFFLINE:
- switch (new_state) {
- case BIOC_SDREBUILD:
- case BIOC_SDHOTSPARE:
- break;
- default:
- goto die;
- }
- break;
- case BIOC_SDSCRUB:
- if (new_state == BIOC_SDONLINE) {
- ;
- } else
- goto die;
- break;
- case BIOC_SDREBUILD:
- switch (new_state) {
- case BIOC_SDONLINE:
- break;
- case BIOC_SDOFFLINE:
- /* Abort rebuild since the rebuild chunk disappeared. */
- sd->sd_reb_abort = 1;
- break;
- default:
- goto die;
- }
- break;
- case BIOC_SDHOTSPARE:
- switch (new_state) {
- case BIOC_SDOFFLINE:
- case BIOC_SDREBUILD:
- break;
- default:
- goto die;
- }
- break;
- default:
- die:
- splx(s); /* XXX */
- panic("%s: %s: %s: invalid chunk state transition "
- "%d -> %d\n", DEVNAME(sd->sd_sc),
- sd->sd_meta->ssd_devname,
- sd->sd_vol.sv_chunks[c]->src_meta.scmi.scm_devname,
- old_state, new_state);
- /* NOTREACHED */
- }
- sd->sd_vol.sv_chunks[c]->src_meta.scm_status = new_state;
- sd->sd_set_vol_state(sd);
- sd->sd_must_flush = 1;
- task_add(systq, &sd->sd_meta_save_task);
- done:
- splx(s);
- }
- void
- sr_raid1_set_vol_state(struct sr_discipline *sd)
- {
- int states[SR_MAX_STATES];
- int new_state, i, s, nd;
- int old_state = sd->sd_vol_status;
- DNPRINTF(SR_D_STATE, "%s: %s: sr_raid_set_vol_state\n",
- DEVNAME(sd->sd_sc), sd->sd_meta->ssd_devname);
- nd = sd->sd_meta->ssdi.ssd_chunk_no;
- #ifdef SR_DEBUG
- for (i = 0; i < nd; i++)
- DNPRINTF(SR_D_STATE, "%s: chunk %d status = %u\n",
- DEVNAME(sd->sd_sc), i,
- sd->sd_vol.sv_chunks[i]->src_meta.scm_status);
- #endif
- for (i = 0; i < SR_MAX_STATES; i++)
- states[i] = 0;
- for (i = 0; i < nd; i++) {
- s = sd->sd_vol.sv_chunks[i]->src_meta.scm_status;
- if (s >= SR_MAX_STATES)
- panic("%s: %s: %s: invalid chunk state",
- DEVNAME(sd->sd_sc),
- sd->sd_meta->ssd_devname,
- sd->sd_vol.sv_chunks[i]->src_meta.scmi.scm_devname);
- states[s]++;
- }
- if (states[BIOC_SDONLINE] == nd)
- new_state = BIOC_SVONLINE;
- else if (states[BIOC_SDONLINE] == 0)
- new_state = BIOC_SVOFFLINE;
- else if (states[BIOC_SDSCRUB] != 0)
- new_state = BIOC_SVSCRUB;
- else if (states[BIOC_SDREBUILD] != 0)
- new_state = BIOC_SVREBUILD;
- else if (states[BIOC_SDOFFLINE] != 0)
- new_state = BIOC_SVDEGRADED;
- else {
- DNPRINTF(SR_D_STATE, "%s: invalid volume state, old state "
- "was %d\n", DEVNAME(sd->sd_sc), old_state);
- panic("invalid volume state");
- }
- DNPRINTF(SR_D_STATE, "%s: %s: sr_raid1_set_vol_state %d -> %d\n",
- DEVNAME(sd->sd_sc), sd->sd_meta->ssd_devname,
- old_state, new_state);
- switch (old_state) {
- case BIOC_SVONLINE:
- switch (new_state) {
- case BIOC_SVONLINE: /* can go to same state */
- case BIOC_SVOFFLINE:
- case BIOC_SVDEGRADED:
- case BIOC_SVREBUILD: /* happens on boot */
- break;
- default:
- goto die;
- }
- break;
- case BIOC_SVOFFLINE:
- /* XXX this might be a little too much */
- goto die;
- case BIOC_SVDEGRADED:
- switch (new_state) {
- case BIOC_SVOFFLINE:
- case BIOC_SVREBUILD:
- case BIOC_SVDEGRADED: /* can go to the same state */
- break;
- default:
- goto die;
- }
- break;
- case BIOC_SVBUILDING:
- switch (new_state) {
- case BIOC_SVONLINE:
- case BIOC_SVOFFLINE:
- case BIOC_SVBUILDING: /* can go to the same state */
- break;
- default:
- goto die;
- }
- break;
- case BIOC_SVSCRUB:
- switch (new_state) {
- case BIOC_SVONLINE:
- case BIOC_SVOFFLINE:
- case BIOC_SVDEGRADED:
- case BIOC_SVSCRUB: /* can go to same state */
- break;
- default:
- goto die;
- }
- break;
- case BIOC_SVREBUILD:
- switch (new_state) {
- case BIOC_SVONLINE:
- case BIOC_SVOFFLINE:
- case BIOC_SVDEGRADED:
- case BIOC_SVREBUILD: /* can go to the same state */
- break;
- default:
- goto die;
- }
- break;
- default:
- die:
- panic("%s: %s: invalid volume state transition "
- "%d -> %d\n", DEVNAME(sd->sd_sc),
- sd->sd_meta->ssd_devname,
- old_state, new_state);
- /* NOTREACHED */
- }
- sd->sd_vol_status = new_state;
- /* If we have just become degraded, look for a hotspare. */
- if (new_state == BIOC_SVDEGRADED)
- task_add(systq, &sd->sd_hotspare_rebuild_task);
- }
- int
- sr_raid1_rw(struct sr_workunit *wu)
- {
- struct sr_discipline *sd = wu->swu_dis;
- struct scsi_xfer *xs = wu->swu_xs;
- struct sr_ccb *ccb;
- struct sr_chunk *scp;
- int ios, chunk, i, rt;
- daddr_t blkno;
- /* blkno and scsi error will be handled by sr_validate_io */
- if (sr_validate_io(wu, &blkno, "sr_raid1_rw"))
- goto bad;
- if (xs->flags & SCSI_DATA_IN)
- ios = 1;
- else
- ios = sd->sd_meta->ssdi.ssd_chunk_no;
- for (i = 0; i < ios; i++) {
- if (xs->flags & SCSI_DATA_IN) {
- rt = 0;
- ragain:
- /* interleave reads */
- chunk = sd->mds.mdd_raid1.sr1_counter++ %
- sd->sd_meta->ssdi.ssd_chunk_no;
- scp = sd->sd_vol.sv_chunks[chunk];
- switch (scp->src_meta.scm_status) {
- case BIOC_SDONLINE:
- case BIOC_SDSCRUB:
- break;
- case BIOC_SDOFFLINE:
- case BIOC_SDREBUILD:
- case BIOC_SDHOTSPARE:
- if (rt++ < sd->sd_meta->ssdi.ssd_chunk_no)
- goto ragain;
- /* FALLTHROUGH */
- default:
- /* volume offline */
- printf("%s: is offline, cannot read\n",
- DEVNAME(sd->sd_sc));
- goto bad;
- }
- } else {
- /* writes go on all working disks */
- chunk = i;
- scp = sd->sd_vol.sv_chunks[chunk];
- switch (scp->src_meta.scm_status) {
- case BIOC_SDONLINE:
- case BIOC_SDSCRUB:
- case BIOC_SDREBUILD:
- break;
- case BIOC_SDHOTSPARE: /* should never happen */
- case BIOC_SDOFFLINE:
- continue;
- default:
- goto bad;
- }
- }
- ccb = sr_ccb_rw(sd, chunk, blkno, xs->datalen, xs->data,
- xs->flags, 0);
- if (!ccb) {
- /* should never happen but handle more gracefully */
- printf("%s: %s: too many ccbs queued\n",
- DEVNAME(sd->sd_sc),
- sd->sd_meta->ssd_devname);
- goto bad;
- }
- sr_wu_enqueue_ccb(wu, ccb);
- }
- sr_schedule_wu(wu);
- return (0);
- bad:
- /* wu is unwound by sr_wu_put */
- return (1);
- }
- int
- sr_raid1_wu_done(struct sr_workunit *wu)
- {
- struct sr_discipline *sd = wu->swu_dis;
- struct scsi_xfer *xs = wu->swu_xs;
- /* If at least one I/O succeeded, we are okay. */
- if (wu->swu_ios_succeeded > 0) {
- xs->error = XS_NOERROR;
- return SR_WU_OK;
- }
- /* If all I/O failed, retry reads and give up on writes. */
- if (xs->flags & SCSI_DATA_IN) {
- printf("%s: retrying read on block %lld\n",
- sd->sd_meta->ssd_devname, (long long)wu->swu_blk_start);
- if (wu->swu_cb_active == 1)
- panic("%s: sr_raid1_intr_cb",
- DEVNAME(sd->sd_sc));
- sr_wu_release_ccbs(wu);
- wu->swu_state = SR_WU_RESTART;
- if (sd->sd_scsi_rw(wu) == 0)
- return SR_WU_RESTART;
- } else {
- printf("%s: permanently failing write on block %lld\n",
- sd->sd_meta->ssd_devname, (long long)wu->swu_blk_start);
- }
- wu->swu_state = SR_WU_FAILED;
- xs->error = XS_DRIVER_STUFFUP;
- return SR_WU_FAILED;
- }
|