/* $NetBSD: wd.c,v 1.332 2006/10/25 04:04:45 thorpej Exp $ */ /* * Copyright (c) 1998, 2001 Manuel Bouyer. All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * 3. All advertising materials mentioning features or use of this software * must display the following acknowledgement: * This product includes software developed by Manuel Bouyer. * 4. The name of the author may not be used to endorse or promote products * derived from this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ /*- * Copyright (c) 1998, 2003, 2004 The NetBSD Foundation, Inc. * All rights reserved. * * This code is derived from software contributed to The NetBSD Foundation * by Charles M. Hannum and by Onno van der Linden. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * 3. All advertising materials mentioning features or use of this software * must display the following acknowledgement: * This product includes software developed by the NetBSD * Foundation, Inc. and its contributors. * 4. Neither the name of The NetBSD Foundation nor the names of its * contributors may be used to endorse or promote products derived * from this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. */ #include __KERNEL_RCSID(0, "$NetBSD: wd.c,v 1.332 2006/10/25 04:04:45 thorpej Exp $"); #ifndef ATADEBUG #define ATADEBUG #endif /* ATADEBUG */ #include "rnd.h" #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #if NRND > 0 #include #endif #include #include #include #include #include #include #include #include "locators.h" #include #define LBA48_THRESHOLD (0xfffffff) /* 128GB / DEV_BSIZE */ #define WDIORETRIES_SINGLE 4 /* number of retries before single-sector */ #define WDIORETRIES 5 /* number of retries before giving up */ #define RECOVERYTIME hz/2 /* time to wait before retrying a cmd */ #define WDUNIT(dev) DISKUNIT(dev) #define WDPART(dev) DISKPART(dev) #define WDMINOR(unit, part) DISKMINOR(unit, part) #define MAKEWDDEV(maj, unit, part) MAKEDISKDEV(maj, unit, part) #define WDLABELDEV(dev) (MAKEWDDEV(major(dev), WDUNIT(dev), RAW_PART)) #define DEBUG_INTR 0x01 #define DEBUG_XFERS 0x02 #define DEBUG_STATUS 0x04 #define DEBUG_FUNCS 0x08 #define DEBUG_PROBE 0x10 #ifdef ATADEBUG int wdcdebug_wd_mask = 0x0; #define ATADEBUG_PRINT(args, level) \ if (wdcdebug_wd_mask & (level)) \ printf args #else #define ATADEBUG_PRINT(args, level) #endif int wdprobe(struct device *, struct cfdata *, void *); void wdattach(struct device *, struct device *, void *); int wddetach(struct device *, int); int wdactivate(struct device *, enum devact); int wdprint(void *, char *); void wdperror(const struct wd_softc *); CFATTACH_DECL(wd, sizeof(struct wd_softc), wdprobe, wdattach, wddetach, wdactivate); extern struct cfdriver wd_cd; dev_type_open(wdopen); dev_type_close(wdclose); dev_type_read(wdread); dev_type_write(wdwrite); dev_type_ioctl(wdioctl); dev_type_strategy(wdstrategy); dev_type_dump(wddump); dev_type_size(wdsize); const struct bdevsw wd_bdevsw = { wdopen, wdclose, wdstrategy, wdioctl, wddump, wdsize, D_DISK }; const struct cdevsw wd_cdevsw = { wdopen, wdclose, wdread, wdwrite, wdioctl, nostop, notty, nopoll, nommap, nokqfilter, D_DISK }; /* * Glue necessary to hook WDCIOCCOMMAND into physio */ struct wd_ioctl { LIST_ENTRY(wd_ioctl) wi_list; struct buf wi_bp; struct uio wi_uio; struct iovec wi_iov; atareq_t wi_atareq; struct wd_softc *wi_softc; }; LIST_HEAD(, wd_ioctl) wi_head; struct wd_ioctl *wi_find(struct buf *); void wi_free(struct wd_ioctl *); struct wd_ioctl *wi_get(void); void wdioctlstrategy(struct buf *); void wdgetdefaultlabel(struct wd_softc *, struct disklabel *); void wdgetdisklabel(struct wd_softc *); void wdstart(void *); void __wdstart(struct wd_softc*, struct buf *); void wdrestart(void *); void wddone(void *); int wd_get_params(struct wd_softc *, u_int8_t, struct ataparams *); int wd_standby(struct wd_softc *, int); int wd_flushcache(struct wd_softc *, int); void wd_shutdown(void *); int wd_getcache(struct wd_softc *, int *); int wd_setcache(struct wd_softc *, int); struct dkdriver wddkdriver = { wdstrategy, minphys }; #ifdef HAS_BAD144_HANDLING static void bad144intern(struct wd_softc *); #endif #define WD_QUIRK_SPLIT_MOD15_WRITE 0x0001 /* must split certain writes */ #define WD_QUIRK_FORCE_LBA48 0x0002 /* must use LBA48 commands */ #define WD_QUIRK_FMT "\20\1SPLIT_MOD15_WRITE\2FORCE_LBA48" /* * Quirk table for IDE drives. Put more-specific matches first, since * a simple globbing routine is used for matching. */ static const struct wd_quirk { const char *wdq_match; /* inquiry pattern to match */ int wdq_quirks; /* drive quirks */ } wd_quirk_table[] = { /* * Some Seagate S-ATA drives have a PHY which can get confused * with the way data is packetized by some S-ATA controllers. * * The work-around is to split in two any write transfer whose * sector count % 15 == 1 (assuming 512 byte sectors). * * XXX This is an incomplete list. There are at least a couple * XXX more model numbers. If you have trouble with such transfers * XXX (8K is the most common) on Seagate S-ATA drives, please * XXX notify thorpej@NetBSD.org. */ { "ST3120023AS", WD_QUIRK_SPLIT_MOD15_WRITE }, { "ST380023AS", WD_QUIRK_SPLIT_MOD15_WRITE }, /* * These seagate drives seems to have issue addressing sector 0xfffffff * (aka LBA48_THRESHOLD) in LBA mode. The workaround is to force * LBA48 * Note that we can't just change the code to always use LBA48 for * sector 0xfffffff, because this would break valid and working * setups using LBA48 drives on non-LBA48-capable controllers * (and it's hard to get a list of such controllers) */ { "ST3160021A*", WD_QUIRK_FORCE_LBA48 }, { "ST3160812A*", WD_QUIRK_FORCE_LBA48 }, { "ST3160023A*", WD_QUIRK_FORCE_LBA48 }, { "ST3160827A*", WD_QUIRK_FORCE_LBA48 }, /* Attempt to catch all seagate drives larger than 200GB */ { "ST3[2-9][0-9][0-9][0-9][0-9][0-9][A-Z]*", WD_QUIRK_FORCE_LBA48 }, { NULL, 0 } }; static const struct wd_quirk * wd_lookup_quirks(const char *name) { const struct wd_quirk *wdq; const char *estr; for (wdq = wd_quirk_table; wdq->wdq_match != NULL; wdq++) { /* * We only want exact matches (which include matches * against globbing characters). */ if (pmatch(name, wdq->wdq_match, &estr) == 2) return (wdq); } return (NULL); } int wdprobe(struct device *parent __unused, struct cfdata *match, void *aux) { struct ata_device *adev = aux; if (adev == NULL) return 0; if (adev->adev_bustype->bustype_type != SCSIPI_BUSTYPE_ATA) return 0; if (match->cf_loc[ATA_HLCF_DRIVE] != ATA_HLCF_DRIVE_DEFAULT && match->cf_loc[ATA_HLCF_DRIVE] != adev->adev_drv_data->drive) return 0; return 1; } void wdattach(struct device *parent __unused, struct device *self, void *aux) { struct wd_softc *wd = (void *)self; struct ata_device *adev= aux; int i, blank; char tbuf[41], pbuf[9], c, *p, *q; const struct wd_quirk *wdq; ATADEBUG_PRINT(("wdattach\n"), DEBUG_FUNCS | DEBUG_PROBE); callout_init(&wd->sc_restart_ch); bufq_alloc(&wd->sc_q, BUFQ_DISK_DEFAULT_STRAT, BUFQ_SORT_RAWBLOCK); #ifdef WD_SOFTBADSECT SLIST_INIT(&wd->sc_bslist); #endif wd->atabus = adev->adev_bustype; wd->openings = adev->adev_openings; wd->drvp = adev->adev_drv_data; wd->drvp->drv_done = wddone; wd->drvp->drv_softc = &wd->sc_dev; aprint_naive("\n"); /* read our drive info */ if (wd_get_params(wd, AT_WAIT, &wd->sc_params) != 0) { aprint_error("\n%s: IDENTIFY failed\n", wd->sc_dev.dv_xname); return; } for (blank = 0, p = wd->sc_params.atap_model, q = tbuf, i = 0; i < sizeof(wd->sc_params.atap_model); i++) { c = *p++; if (c == '\0') break; if (c != ' ') { if (blank) { *q++ = ' '; blank = 0; } *q++ = c; } else blank = 1; } *q++ = '\0'; aprint_normal(": <%s>\n", tbuf); wdq = wd_lookup_quirks(tbuf); if (wdq != NULL) wd->sc_quirks = wdq->wdq_quirks; if (wd->sc_quirks != 0) { char sbuf[sizeof(WD_QUIRK_FMT) + 64]; bitmask_snprintf(wd->sc_quirks, WD_QUIRK_FMT, sbuf, sizeof(sbuf)); aprint_normal("%s: quirks %s\n", wd->sc_dev.dv_xname, sbuf); } if ((wd->sc_params.atap_multi & 0xff) > 1) { wd->sc_multi = wd->sc_params.atap_multi & 0xff; } else { wd->sc_multi = 1; } aprint_normal("%s: drive supports %d-sector PIO transfers,", wd->sc_dev.dv_xname, wd->sc_multi); /* 48-bit LBA addressing */ if ((wd->sc_params.atap_cmd2_en & ATA_CMD2_LBA48) != 0) wd->sc_flags |= WDF_LBA48; /* Prior to ATA-4, LBA was optional. */ if ((wd->sc_params.atap_capabilities1 & WDC_CAP_LBA) != 0) wd->sc_flags |= WDF_LBA; #if 0 /* ATA-4 requires LBA. */ if (wd->sc_params.atap_ataversion != 0xffff && wd->sc_params.atap_ataversion >= WDC_VER_ATA4) wd->sc_flags |= WDF_LBA; #endif if ((wd->sc_flags & WDF_LBA48) != 0) { aprint_normal(" LBA48 addressing\n"); wd->sc_capacity = ((u_int64_t) wd->sc_params.__reserved6[11] << 48) | ((u_int64_t) wd->sc_params.__reserved6[10] << 32) | ((u_int64_t) wd->sc_params.__reserved6[9] << 16) | ((u_int64_t) wd->sc_params.__reserved6[8] << 0); } else if ((wd->sc_flags & WDF_LBA) != 0) { aprint_normal(" LBA addressing\n"); wd->sc_capacity = ((u_int64_t)wd->sc_params.atap_capacity[1] << 16) | wd->sc_params.atap_capacity[0]; } else { aprint_normal(" chs addressing\n"); wd->sc_capacity = wd->sc_params.atap_cylinders * wd->sc_params.atap_heads * wd->sc_params.atap_sectors; } format_bytes(pbuf, sizeof(pbuf), wd->sc_capacity * DEV_BSIZE); aprint_normal("%s: %s, %d cyl, %d head, %d sec, " "%d bytes/sect x %llu sectors\n", self->dv_xname, pbuf, (wd->sc_flags & WDF_LBA) ? (int)(wd->sc_capacity / (wd->sc_params.atap_heads * wd->sc_params.atap_sectors)) : wd->sc_params.atap_cylinders, wd->sc_params.atap_heads, wd->sc_params.atap_sectors, DEV_BSIZE, (unsigned long long)wd->sc_capacity); ATADEBUG_PRINT(("%s: atap_dmatiming_mimi=%d, atap_dmatiming_recom=%d\n", self->dv_xname, wd->sc_params.atap_dmatiming_mimi, wd->sc_params.atap_dmatiming_recom), DEBUG_PROBE); /* * Initialize and attach the disk structure. */ wd->sc_dk.dk_driver = &wddkdriver; wd->sc_dk.dk_name = wd->sc_dev.dv_xname; /* we fill in dk_info later */ disk_attach(&wd->sc_dk); wd->sc_wdc_bio.lp = wd->sc_dk.dk_label; wd->sc_sdhook = shutdownhook_establish(wd_shutdown, wd); if (wd->sc_sdhook == NULL) aprint_error("%s: WARNING: unable to establish shutdown hook\n", wd->sc_dev.dv_xname); #if NRND > 0 rnd_attach_source(&wd->rnd_source, wd->sc_dev.dv_xname, RND_TYPE_DISK, 0); #endif /* Discover wedges on this disk. */ dkwedge_discover(&wd->sc_dk); } int wdactivate(struct device *self __unused, enum devact act) { int rv = 0; switch (act) { case DVACT_ACTIVATE: rv = EOPNOTSUPP; break; case DVACT_DEACTIVATE: /* * Nothing to do; we key off the device's DVF_ACTIVATE. */ break; } return (rv); } int wddetach(struct device *self, int flags __unused) { struct wd_softc *sc = (struct wd_softc *)self; int s, bmaj, cmaj, i, mn; /* locate the major number */ bmaj = bdevsw_lookup_major(&wd_bdevsw); cmaj = cdevsw_lookup_major(&wd_cdevsw); /* Nuke the vnodes for any open instances. */ for (i = 0; i < MAXPARTITIONS; i++) { mn = WDMINOR(device_unit(self), i); vdevgone(bmaj, mn, mn, VBLK); vdevgone(cmaj, mn, mn, VCHR); } /* Delete all of our wedges. */ dkwedge_delall(&sc->sc_dk); s = splbio(); /* Kill off any queued buffers. */ bufq_drain(sc->sc_q); bufq_free(sc->sc_q); sc->atabus->ata_killpending(sc->drvp); splx(s); /* Detach disk. */ disk_detach(&sc->sc_dk); #ifdef WD_SOFTBADSECT /* Clean out the bad sector list */ while (!SLIST_EMPTY(&sc->sc_bslist)) { void *head = SLIST_FIRST(&sc->sc_bslist); SLIST_REMOVE_HEAD(&sc->sc_bslist, dbs_next); free(head, M_TEMP); } sc->sc_bscount = 0; #endif /* Get rid of the shutdown hook. */ if (sc->sc_sdhook != NULL) shutdownhook_disestablish(sc->sc_sdhook); #if NRND > 0 /* Unhook the entropy source. */ rnd_detach_source(&sc->rnd_source); #endif sc->drvp->drive_flags = 0; /* no drive any more here */ return (0); } /* * Read/write routine for a buffer. Validates the arguments and schedules the * transfer. Does not wait for the transfer to complete. */ void wdstrategy(struct buf *bp) { struct wd_softc *wd = device_lookup(&wd_cd, WDUNIT(bp->b_dev)); struct disklabel *lp = wd->sc_dk.dk_label; daddr_t blkno; int s; ATADEBUG_PRINT(("wdstrategy (%s)\n", wd->sc_dev.dv_xname), DEBUG_XFERS); /* Valid request? */ if (bp->b_blkno < 0 || (bp->b_bcount % lp->d_secsize) != 0 || (bp->b_bcount / lp->d_secsize) >= (1 << NBBY)) { bp->b_error = EINVAL; goto bad; } /* If device invalidated (e.g. media change, door open), error. */ if ((wd->sc_flags & WDF_LOADED) == 0) { bp->b_error = EIO; goto bad; } /* If it's a null transfer, return immediately. */ if (bp->b_bcount == 0) goto done; /* * Do bounds checking, adjust transfer. if error, process. * If end of partition, just return. */ if (WDPART(bp->b_dev) == RAW_PART) { if (bounds_check_with_mediasize(bp, DEV_BSIZE, wd->sc_capacity) <= 0) goto done; } else { if (bounds_check_with_label(&wd->sc_dk, bp, (wd->sc_flags & (WDF_WLABEL|WDF_LABELLING)) != 0) <= 0) goto done; } /* * Now convert the block number to absolute and put it in * terms of the device's logical block size. */ if (lp->d_secsize >= DEV_BSIZE) blkno = bp->b_blkno / (lp->d_secsize / DEV_BSIZE); else blkno = bp->b_blkno * (DEV_BSIZE / lp->d_secsize); if (WDPART(bp->b_dev) != RAW_PART) blkno += lp->d_partitions[WDPART(bp->b_dev)].p_offset; bp->b_rawblkno = blkno; #ifdef WD_SOFTBADSECT /* * If the transfer about to be attempted contains only a block that * is known to be bad then return an error for the transfer without * even attempting to start a transfer up under the premis that we * will just end up doing more retries for a transfer that will end * up failing again. * XXX:SMP - mutex required to protect with DIOCBSFLUSH */ if (__predict_false(!SLIST_EMPTY(&wd->sc_bslist))) { struct disk_badsectors *dbs; daddr_t maxblk = blkno + (bp->b_bcount >> DEV_BSHIFT) - 1; SLIST_FOREACH(dbs, &wd->sc_bslist, dbs_next) if ((dbs->dbs_min <= blkno && blkno <= dbs->dbs_max) || (dbs->dbs_min <= maxblk && maxblk <= dbs->dbs_max)){ bp->b_error = EIO; goto bad; } } #endif /* Queue transfer on drive, activate drive and controller if idle. */ s = splbio(); BUFQ_PUT(wd->sc_q, bp); wdstart(wd); splx(s); return; bad: bp->b_flags |= B_ERROR; done: /* Toss transfer; we're done early. */ bp->b_resid = bp->b_bcount; biodone(bp); } /* * Queue a drive for I/O. */ void wdstart(void *arg) { struct wd_softc *wd = arg; struct buf *bp = NULL; ATADEBUG_PRINT(("wdstart %s\n", wd->sc_dev.dv_xname), DEBUG_XFERS); while (wd->openings > 0) { /* Is there a buf for us ? */ if ((bp = BUFQ_GET(wd->sc_q)) == NULL) return; /* * Make the command. First lock the device */ wd->openings--; wd->retries = 0; __wdstart(wd, bp); } } static void wd_split_mod15_write(struct buf *bp) { struct buf *obp = bp->b_private; struct wd_softc *sc = wd_cd.cd_devs[DISKUNIT(obp->b_dev)]; if (__predict_false(bp->b_flags & B_ERROR) != 0) { /* * Propagate the error. If this was the first half of * the original transfer, make sure to account for that * in the residual. */ if (bp->b_data == obp->b_data) bp->b_resid += bp->b_bcount; goto done; } /* * If this was the second half of the transfer, we're all done! */ if (bp->b_data != obp->b_data) goto done; /* * Advance the pointer to the second half and issue that command * using the same opening. */ bp->b_flags = obp->b_flags | B_CALL; bp->b_data += bp->b_bcount; bp->b_blkno += (bp->b_bcount / 512); bp->b_rawblkno += (bp->b_bcount / 512); __wdstart(sc, bp); return; done: obp->b_flags |= bp->b_flags & B_ERROR; obp->b_error = bp->b_error; obp->b_resid = bp->b_resid; putiobuf(bp); biodone(obp); sc->openings++; /* wddone() will call wdstart() */ } void __wdstart(struct wd_softc *wd, struct buf *bp) { /* * Deal with the "split mod15 write" quirk. We just divide the * transfer in two, doing the first half and then then second half * with the same command opening. * * Note we MUST do this here, because we can't let insertion * into the bufq cause the transfers to be re-merged. */ if (__predict_false((wd->sc_quirks & WD_QUIRK_SPLIT_MOD15_WRITE) != 0 && (bp->b_flags & B_READ) == 0 && bp->b_bcount > 512 && ((bp->b_bcount / 512) % 15) == 1)) { struct buf *nbp; /* already at splbio */ nbp = getiobuf_nowait(); if (__predict_false(nbp == NULL)) { /* No memory -- fail the iop. */ bp->b_error = ENOMEM; bp->b_flags |= B_ERROR; bp->b_resid = bp->b_bcount; biodone(bp); wd->openings++; return; } nbp->b_error = 0; nbp->b_proc = bp->b_proc; nbp->b_vp = NULLVP; nbp->b_dev = bp->b_dev; nbp->b_bcount = bp->b_bcount / 2; nbp->b_bufsize = bp->b_bcount / 2; nbp->b_data = bp->b_data; nbp->b_blkno = bp->b_blkno; nbp->b_rawblkno = bp->b_rawblkno; nbp->b_flags = bp->b_flags | B_CALL; nbp->b_iodone = wd_split_mod15_write; /* Put ptr to orig buf in b_private and use new buf */ nbp->b_private = bp; BIO_COPYPRIO(nbp, bp); bp = nbp; } wd->sc_wdc_bio.blkno = bp->b_rawblkno; wd->sc_wdc_bio.blkdone =0; wd->sc_bp = bp; /* * If we're retrying, retry in single-sector mode. This will give us * the sector number of the problem, and will eventually allow the * transfer to succeed. */ if (wd->retries >= WDIORETRIES_SINGLE) wd->sc_wdc_bio.flags = ATA_SINGLE; else wd->sc_wdc_bio.flags = 0; if (wd->sc_flags & WDF_LBA48 && (wd->sc_wdc_bio.blkno > LBA48_THRESHOLD || (wd->sc_quirks & WD_QUIRK_FORCE_LBA48) != 0)) wd->sc_wdc_bio.flags |= ATA_LBA48; if (wd->sc_flags & WDF_LBA) wd->sc_wdc_bio.flags |= ATA_LBA; if (bp->b_flags & B_READ) wd->sc_wdc_bio.flags |= ATA_READ; wd->sc_wdc_bio.bcount = bp->b_bcount; wd->sc_wdc_bio.databuf = bp->b_data; /* Instrumentation. */ disk_busy(&wd->sc_dk); switch (wd->atabus->ata_bio(wd->drvp, &wd->sc_wdc_bio)) { case ATACMD_TRY_AGAIN: callout_reset(&wd->sc_restart_ch, hz, wdrestart, wd); break; case ATACMD_QUEUED: case ATACMD_COMPLETE: break; default: panic("__wdstart: bad return code from ata_bio()"); } } void wddone(void *v) { struct wd_softc *wd = v; struct buf *bp = wd->sc_bp; const char *errmsg; int do_perror = 0; ATADEBUG_PRINT(("wddone %s\n", wd->sc_dev.dv_xname), DEBUG_XFERS); if (bp == NULL) return; bp->b_resid = wd->sc_wdc_bio.bcount; switch (wd->sc_wdc_bio.error) { case ERR_DMA: errmsg = "DMA error"; goto retry; case ERR_DF: errmsg = "device fault"; goto retry; case TIMEOUT: errmsg = "device timeout"; goto retry; case ERR_RESET: errmsg = "channel reset"; goto retry2; case ERROR: /* Don't care about media change bits */ if (wd->sc_wdc_bio.r_error != 0 && (wd->sc_wdc_bio.r_error & ~(WDCE_MC | WDCE_MCR)) == 0) goto noerror; errmsg = "error"; do_perror = 1; retry: /* Just reset and retry. Can we do more ? */ (*wd->atabus->ata_reset_drive)(wd->drvp, AT_RST_NOCMD); retry2: diskerr(bp, "wd", errmsg, LOG_PRINTF, wd->sc_wdc_bio.blkdone, wd->sc_dk.dk_label); if (wd->retries < WDIORETRIES) printf(", retrying\n"); if (do_perror) wdperror(wd); if (wd->retries < WDIORETRIES) { wd->retries++; callout_reset(&wd->sc_restart_ch, RECOVERYTIME, wdrestart, wd); return; } printf("\n"); #ifdef WD_SOFTBADSECT /* * Not all errors indicate a failed block but those that do, * put the block on the bad-block list for the device. Only * do this for reads because the drive should do it for writes, * itself, according to Manuel. */ if ((bp->b_flags & B_READ) && ((wd->drvp->ata_vers >= 4 && wd->sc_wdc_bio.r_error & 64) || (wd->drvp->ata_vers < 4 && wd->sc_wdc_bio.r_error & 192))) { struct disk_badsectors *dbs; dbs = malloc(sizeof *dbs, M_TEMP, M_WAITOK); dbs->dbs_min = bp->b_rawblkno; dbs->dbs_max = dbs->dbs_min + (bp->b_bcount >> DEV_BSHIFT) - 1; microtime(&dbs->dbs_failedat); SLIST_INSERT_HEAD(&wd->sc_bslist, dbs, dbs_next); wd->sc_bscount++; } #endif bp->b_flags |= B_ERROR; bp->b_error = EIO; break; case NOERROR: noerror: if ((wd->sc_wdc_bio.flags & ATA_CORR) || wd->retries > 0) printf("%s: soft error (corrected)\n", wd->sc_dev.dv_xname); break; case ERR_NODEV: bp->b_flags |= B_ERROR; bp->b_error = EIO; break; } disk_unbusy(&wd->sc_dk, (bp->b_bcount - bp->b_resid), (bp->b_flags & B_READ)); #if NRND > 0 rnd_add_uint32(&wd->rnd_source, bp->b_blkno); #endif /* XXX Yuck, but we don't want to increment openings in this case */ if (__predict_false((bp->b_flags & B_CALL) != 0 && bp->b_iodone == wd_split_mod15_write)) biodone(bp); else { biodone(bp); wd->openings++; } wdstart(wd); } void wdrestart(void *v) { struct wd_softc *wd = v; struct buf *bp = wd->sc_bp; int s; ATADEBUG_PRINT(("wdrestart %s\n", wd->sc_dev.dv_xname), DEBUG_XFERS); s = splbio(); __wdstart(v, bp); splx(s); } int wdread(dev_t dev, struct uio *uio, int flags __unused) { ATADEBUG_PRINT(("wdread\n"), DEBUG_XFERS); return (physio(wdstrategy, NULL, dev, B_READ, minphys, uio)); } int wdwrite(dev_t dev, struct uio *uio, int flags __unused) { ATADEBUG_PRINT(("wdwrite\n"), DEBUG_XFERS); return (physio(wdstrategy, NULL, dev, B_WRITE, minphys, uio)); } int wdopen(dev_t dev, int flag __unused, int fmt, struct lwp *l __unused) { struct wd_softc *wd; int part, error; ATADEBUG_PRINT(("wdopen\n"), DEBUG_FUNCS); wd = device_lookup(&wd_cd, WDUNIT(dev)); if (wd == NULL) return (ENXIO); if (! device_is_active(&wd->sc_dev)) return (ENODEV); part = WDPART(dev); if ((error = lockmgr(&wd->sc_dk.dk_openlock, LK_EXCLUSIVE, NULL)) != 0) return (error); /* * If there are wedges, and this is not RAW_PART, then we * need to fail. */ if (wd->sc_dk.dk_nwedges != 0 && part != RAW_PART) { error = EBUSY; goto bad1; } /* * If this is the first open of this device, add a reference * to the adapter. */ if (wd->sc_dk.dk_openmask == 0 && (error = wd->atabus->ata_addref(wd->drvp)) != 0) goto bad1; if (wd->sc_dk.dk_openmask != 0) { /* * If any partition is open, but the disk has been invalidated, * disallow further opens. */ if ((wd->sc_flags & WDF_LOADED) == 0) { error = EIO; goto bad2; } } else { if ((wd->sc_flags & WDF_LOADED) == 0) { wd->sc_flags |= WDF_LOADED; /* Load the physical device parameters. */ wd_get_params(wd, AT_WAIT, &wd->sc_params); /* Load the partition info if not already loaded. */ wdgetdisklabel(wd); } } /* Check that the partition exists. */ if (part != RAW_PART && (part >= wd->sc_dk.dk_label->d_npartitions || wd->sc_dk.dk_label->d_partitions[part].p_fstype == FS_UNUSED)) { error = ENXIO; goto bad2; } /* Insure only one open at a time. */ switch (fmt) { case S_IFCHR: wd->sc_dk.dk_copenmask |= (1 << part); break; case S_IFBLK: wd->sc_dk.dk_bopenmask |= (1 << part); break; } wd->sc_dk.dk_openmask = wd->sc_dk.dk_copenmask | wd->sc_dk.dk_bopenmask; (void) lockmgr(&wd->sc_dk.dk_openlock, LK_RELEASE, NULL); return 0; bad2: if (wd->sc_dk.dk_openmask == 0) wd->atabus->ata_delref(wd->drvp); bad1: (void) lockmgr(&wd->sc_dk.dk_openlock, LK_RELEASE, NULL); return error; } int wdclose(dev_t dev, int flag __unused, int fmt, struct lwp *l __unused) { struct wd_softc *wd = device_lookup(&wd_cd, WDUNIT(dev)); int part = WDPART(dev); int error; ATADEBUG_PRINT(("wdclose\n"), DEBUG_FUNCS); if ((error = lockmgr(&wd->sc_dk.dk_openlock, LK_EXCLUSIVE, NULL)) != 0) return error; switch (fmt) { case S_IFCHR: wd->sc_dk.dk_copenmask &= ~(1 << part); break; case S_IFBLK: wd->sc_dk.dk_bopenmask &= ~(1 << part); break; } wd->sc_dk.dk_openmask = wd->sc_dk.dk_copenmask | wd->sc_dk.dk_bopenmask; if (wd->sc_dk.dk_openmask == 0) { wd_flushcache(wd, AT_WAIT); if (! (wd->sc_flags & WDF_KLABEL)) wd->sc_flags &= ~WDF_LOADED; wd->atabus->ata_delref(wd->drvp); } (void) lockmgr(&wd->sc_dk.dk_openlock, LK_RELEASE, NULL); return 0; } void wdgetdefaultlabel(struct wd_softc *wd, struct disklabel *lp) { ATADEBUG_PRINT(("wdgetdefaultlabel\n"), DEBUG_FUNCS); memset(lp, 0, sizeof(struct disklabel)); lp->d_secsize = DEV_BSIZE; lp->d_ntracks = wd->sc_params.atap_heads; lp->d_nsectors = wd->sc_params.atap_sectors; lp->d_ncylinders = (wd->sc_flags & WDF_LBA) ? wd->sc_capacity / (wd->sc_params.atap_heads * wd->sc_params.atap_sectors) : wd->sc_params.atap_cylinders; lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors; if (strcmp(wd->sc_params.atap_model, "ST506") == 0) lp->d_type = DTYPE_ST506; else lp->d_type = DTYPE_ESDI; strncpy(lp->d_typename, wd->sc_params.atap_model, 16); strncpy(lp->d_packname, "fictitious", 16); if (wd->sc_capacity > UINT32_MAX) lp->d_secperunit = UINT32_MAX; else lp->d_secperunit = wd->sc_capacity; lp->d_rpm = 3600; lp->d_interleave = 1; lp->d_flags = 0; lp->d_partitions[RAW_PART].p_offset = 0; lp->d_partitions[RAW_PART].p_size = lp->d_secperunit * (lp->d_secsize / DEV_BSIZE); lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED; lp->d_npartitions = RAW_PART + 1; lp->d_magic = DISKMAGIC; lp->d_magic2 = DISKMAGIC; lp->d_checksum = dkcksum(lp); } /* * Fabricate a default disk label, and try to read the correct one. */ void wdgetdisklabel(struct wd_softc *wd) { struct disklabel *lp = wd->sc_dk.dk_label; const char *errstring; int s; ATADEBUG_PRINT(("wdgetdisklabel\n"), DEBUG_FUNCS); memset(wd->sc_dk.dk_cpulabel, 0, sizeof(struct cpu_disklabel)); wdgetdefaultlabel(wd, lp); wd->sc_badsect[0] = -1; if (wd->drvp->state > RESET) { s = splbio(); wd->drvp->drive_flags |= DRIVE_RESET; splx(s); } errstring = readdisklabel(MAKEWDDEV(0, device_unit(&wd->sc_dev), RAW_PART), wdstrategy, lp, wd->sc_dk.dk_cpulabel); if (errstring) { /* * This probably happened because the drive's default * geometry doesn't match the DOS geometry. We * assume the DOS geometry is now in the label and try * again. XXX This is a kluge. */ if (wd->drvp->state > RESET) { s = splbio(); wd->drvp->drive_flags |= DRIVE_RESET; splx(s); } errstring = readdisklabel(MAKEWDDEV(0, device_unit(&wd->sc_dev), RAW_PART), wdstrategy, lp, wd->sc_dk.dk_cpulabel); } if (errstring) { printf("%s: %s\n", wd->sc_dev.dv_xname, errstring); return; } if (wd->drvp->state > RESET) { s = splbio(); wd->drvp->drive_flags |= DRIVE_RESET; splx(s); } #ifdef HAS_BAD144_HANDLING if ((lp->d_flags & D_BADSECT) != 0) bad144intern(wd); #endif } void wdperror(const struct wd_softc *wd) { static const char *const errstr0_3[] = {"address mark not found", "track 0 not found", "aborted command", "media change requested", "id not found", "media changed", "uncorrectable data error", "bad block detected"}; static const char *const errstr4_5[] = { "obsolete (address mark not found)", "no media/write protected", "aborted command", "media change requested", "id not found", "media changed", "uncorrectable data error", "interface CRC error"}; const char *const *errstr; int i; const char *sep = ""; const char *devname = wd->sc_dev.dv_xname; struct ata_drive_datas *drvp = wd->drvp; int errno = wd->sc_wdc_bio.r_error; if (drvp->ata_vers >= 4) errstr = errstr4_5; else errstr = errstr0_3; printf("%s: (", devname); if (errno == 0) printf("error not notified"); for (i = 0; i < 8; i++) { if (errno & (1 << i)) { printf("%s%s", sep, errstr[i]); sep = ", "; } } printf(")\n"); } int wdioctl(dev_t dev, u_long xfer, caddr_t addr, int flag, struct lwp *l) { struct wd_softc *wd = device_lookup(&wd_cd, WDUNIT(dev)); int error = 0, s; #ifdef __HAVE_OLD_DISKLABEL struct disklabel *newlabel = NULL; #endif ATADEBUG_PRINT(("wdioctl\n"), DEBUG_FUNCS); if ((wd->sc_flags & WDF_LOADED) == 0) return EIO; error = disk_ioctl(&wd->sc_dk, xfer, addr, flag, l); if (error != EPASSTHROUGH) return (error); switch (xfer) { #ifdef HAS_BAD144_HANDLING case DIOCSBAD: if ((flag & FWRITE) == 0) return EBADF; wd->sc_dk.dk_cpulabel->bad = *(struct dkbad *)addr; wd->sc_dk.dk_label->d_flags |= D_BADSECT; bad144intern(wd); return 0; #endif #ifdef WD_SOFTBADSECT case DIOCBSLIST : { u_int32_t count, missing, skip; struct disk_badsecinfo dbsi; struct disk_badsectors *dbs; size_t available; caddr_t laddr; dbsi = *(struct disk_badsecinfo *)addr; missing = wd->sc_bscount; count = 0; available = dbsi.dbsi_bufsize; skip = dbsi.dbsi_skip; laddr = dbsi.dbsi_buffer; /* * We start this loop with the expectation that all of the * entries will be missed and decrement this counter each * time we either skip over one (already copied out) or * we actually copy it back to user space. The structs * holding the bad sector information are copied directly * back to user space whilst the summary is returned via * the struct passed in via the ioctl. */ SLIST_FOREACH(dbs, &wd->sc_bslist, dbs_next) { if (skip > 0) { missing--; skip--; continue; } if (available < sizeof(*dbs)) break; available -= sizeof(*dbs); copyout(dbs, laddr, sizeof(*dbs)); laddr += sizeof(*dbs); missing--; count++; } dbsi.dbsi_left = missing; dbsi.dbsi_copied = count; *(struct disk_badsecinfo *)addr = dbsi; return 0; } case DIOCBSFLUSH : /* Clean out the bad sector list */ while (!SLIST_EMPTY(&wd->sc_bslist)) { void *head = SLIST_FIRST(&wd->sc_bslist); SLIST_REMOVE_HEAD(&wd->sc_bslist, dbs_next); free(head, M_TEMP); } wd->sc_bscount = 0; return 0; #endif case DIOCGDINFO: *(struct disklabel *)addr = *(wd->sc_dk.dk_label); return 0; #ifdef __HAVE_OLD_DISKLABEL case ODIOCGDINFO: newlabel = malloc(sizeof *newlabel, M_TEMP, M_WAITOK); if (newlabel == NULL) return EIO; *newlabel = *(wd->sc_dk.dk_label); if (newlabel->d_npartitions <= OLDMAXPARTITIONS) memcpy(addr, newlabel, sizeof (struct olddisklabel)); else error = ENOTTY; free(newlabel, M_TEMP); return error; #endif case DIOCGPART: ((struct partinfo *)addr)->disklab = wd->sc_dk.dk_label; ((struct partinfo *)addr)->part = &wd->sc_dk.dk_label->d_partitions[WDPART(dev)]; return 0; case DIOCWDINFO: case DIOCSDINFO: #ifdef __HAVE_OLD_DISKLABEL case ODIOCWDINFO: case ODIOCSDINFO: #endif { struct disklabel *lp; if ((flag & FWRITE) == 0) return EBADF; #ifdef __HAVE_OLD_DISKLABEL if (xfer == ODIOCSDINFO || xfer == ODIOCWDINFO) { newlabel = malloc(sizeof *newlabel, M_TEMP, M_WAITOK); if (newlabel == NULL) return EIO; memset(newlabel, 0, sizeof newlabel); memcpy(newlabel, addr, sizeof (struct olddisklabel)); lp = newlabel; } else #endif lp = (struct disklabel *)addr; if ((error = lockmgr(&wd->sc_dk.dk_openlock, LK_EXCLUSIVE, NULL)) != 0) goto bad; wd->sc_flags |= WDF_LABELLING; error = setdisklabel(wd->sc_dk.dk_label, lp, /*wd->sc_dk.dk_openmask : */0, wd->sc_dk.dk_cpulabel); if (error == 0) { if (wd->drvp->state > RESET) { s = splbio(); wd->drvp->drive_flags |= DRIVE_RESET; splx(s); } if (xfer == DIOCWDINFO #ifdef __HAVE_OLD_DISKLABEL || xfer == ODIOCWDINFO #endif ) error = writedisklabel(WDLABELDEV(dev), wdstrategy, wd->sc_dk.dk_label, wd->sc_dk.dk_cpulabel); } wd->sc_flags &= ~WDF_LABELLING; (void) lockmgr(&wd->sc_dk.dk_openlock, LK_RELEASE, NULL); bad: #ifdef __HAVE_OLD_DISKLABEL if (newlabel != NULL) free(newlabel, M_TEMP); #endif return error; } case DIOCKLABEL: if (*(int *)addr) wd->sc_flags |= WDF_KLABEL; else wd->sc_flags &= ~WDF_KLABEL; return 0; case DIOCWLABEL: if ((flag & FWRITE) == 0) return EBADF; if (*(int *)addr) wd->sc_flags |= WDF_WLABEL; else wd->sc_flags &= ~WDF_WLABEL; return 0; case DIOCGDEFLABEL: wdgetdefaultlabel(wd, (struct disklabel *)addr); return 0; #ifdef __HAVE_OLD_DISKLABEL case ODIOCGDEFLABEL: newlabel = malloc(sizeof *newlabel, M_TEMP, M_WAITOK); if (newlabel == NULL) return EIO; wdgetdefaultlabel(wd, newlabel); if (newlabel->d_npartitions <= OLDMAXPARTITIONS) memcpy(addr, &newlabel, sizeof (struct olddisklabel)); else error = ENOTTY; free(newlabel, M_TEMP); return error; #endif #ifdef notyet case DIOCWFORMAT: if ((flag & FWRITE) == 0) return EBADF; { register struct format_op *fop; struct iovec aiov; struct uio auio; fop = (struct format_op *)addr; aiov.iov_base = fop->df_buf; aiov.iov_len = fop->df_count; auio.uio_iov = &aiov; auio.uio_iovcnt = 1; auio.uio_resid = fop->df_count; auio.uio_offset = fop->df_startblk * wd->sc_dk.dk_label->d_secsize; auio.uio_vmspace = l->l_proc->p_vmspace; error = physio(wdformat, NULL, dev, B_WRITE, minphys, &auio); fop->df_count -= auio.uio_resid; fop->df_reg[0] = wdc->sc_status; fop->df_reg[1] = wdc->sc_error; return error; } #endif case DIOCGCACHE: return wd_getcache(wd, (int *)addr); case DIOCSCACHE: return wd_setcache(wd, *(int *)addr); case DIOCCACHESYNC: return wd_flushcache(wd, AT_WAIT); case ATAIOCCOMMAND: /* * Make sure this command is (relatively) safe first */ if ((((atareq_t *) addr)->flags & ATACMD_READ) == 0 && (flag & FWRITE) == 0) return (EBADF); { struct wd_ioctl *wi; atareq_t *atareq = (atareq_t *) addr; int error1; wi = wi_get(); wi->wi_softc = wd; wi->wi_atareq = *atareq; if (atareq->datalen && atareq->flags & (ATACMD_READ | ATACMD_WRITE)) { wi->wi_iov.iov_base = atareq->databuf; wi->wi_iov.iov_len = atareq->datalen; wi->wi_uio.uio_iov = &wi->wi_iov; wi->wi_uio.uio_iovcnt = 1; wi->wi_uio.uio_resid = atareq->datalen; wi->wi_uio.uio_offset = 0; wi->wi_uio.uio_rw = (atareq->flags & ATACMD_READ) ? B_READ : B_WRITE; wi->wi_uio.uio_vmspace = l->l_proc->p_vmspace; error1 = physio(wdioctlstrategy, &wi->wi_bp, dev, (atareq->flags & ATACMD_READ) ? B_READ : B_WRITE, minphys, &wi->wi_uio); } else { /* No need to call physio if we don't have any user data */ wi->wi_bp.b_flags = 0; wi->wi_bp.b_data = 0; wi->wi_bp.b_bcount = 0; wi->wi_bp.b_dev = 0; wi->wi_bp.b_proc = l->l_proc; wdioctlstrategy(&wi->wi_bp); error1 = wi->wi_bp.b_error; } *atareq = wi->wi_atareq; wi_free(wi); return(error1); } case DIOCAWEDGE: { struct dkwedge_info *dkw = (void *) addr; if ((flag & FWRITE) == 0) return (EBADF); /* If the ioctl happens here, the parent is us. */ strcpy(dkw->dkw_parent, wd->sc_dev.dv_xname); return (dkwedge_add(dkw)); } case DIOCDWEDGE: { struct dkwedge_info *dkw = (void *) addr; if ((flag & FWRITE) == 0) return (EBADF); /* If the ioctl happens here, the parent is us. */ strcpy(dkw->dkw_parent, wd->sc_dev.dv_xname); return (dkwedge_del(dkw)); } case DIOCLWEDGES: { struct dkwedge_list *dkwl = (void *) addr; return (dkwedge_list(&wd->sc_dk, dkwl, l)); } case DIOCGSTRATEGY: { struct disk_strategy *dks = (void *)addr; s = splbio(); strlcpy(dks->dks_name, bufq_getstrategyname(wd->sc_q), sizeof(dks->dks_name)); splx(s); dks->dks_paramlen = 0; return 0; } case DIOCSSTRATEGY: { struct disk_strategy *dks = (void *)addr; struct bufq_state *new; struct bufq_state *old; if ((flag & FWRITE) == 0) { return EBADF; } if (dks->dks_param != NULL) { return EINVAL; } dks->dks_name[sizeof(dks->dks_name) - 1] = 0; /* ensure term */ error = bufq_alloc(&new, dks->dks_name, BUFQ_EXACT|BUFQ_SORT_RAWBLOCK); if (error) { return error; } s = splbio(); old = wd->sc_q; bufq_move(new, old); wd->sc_q = new; splx(s); bufq_free(old); return 0; } default: return ENOTTY; } #ifdef DIAGNOSTIC panic("wdioctl: impossible"); #endif } #ifdef B_FORMAT int wdformat(struct buf *bp) { bp->b_flags |= B_FORMAT; return wdstrategy(bp); } #endif int wdsize(dev_t dev) { struct wd_softc *wd; int part, omask; int size; ATADEBUG_PRINT(("wdsize\n"), DEBUG_FUNCS); wd = device_lookup(&wd_cd, WDUNIT(dev)); if (wd == NULL) return (-1); part = WDPART(dev); omask = wd->sc_dk.dk_openmask & (1 << part); if (omask == 0 && wdopen(dev, 0, S_IFBLK, NULL) != 0) return (-1); if (wd->sc_dk.dk_label->d_partitions[part].p_fstype != FS_SWAP) size = -1; else size = wd->sc_dk.dk_label->d_partitions[part].p_size * (wd->sc_dk.dk_label->d_secsize / DEV_BSIZE); if (omask == 0 && wdclose(dev, 0, S_IFBLK, NULL) != 0) return (-1); return (size); } /* #define WD_DUMP_NOT_TRUSTED if you just want to watch */ static int wddoingadump = 0; static int wddumprecalibrated = 0; /* * Dump core after a system crash. */ int wddump(dev_t dev, daddr_t blkno, caddr_t va, size_t size) { struct wd_softc *wd; /* disk unit to do the I/O */ struct disklabel *lp; /* disk's disklabel */ int part, err; int nblks; /* total number of sectors left to write */ /* Check if recursive dump; if so, punt. */ if (wddoingadump) return EFAULT; wddoingadump = 1; wd = device_lookup(&wd_cd, WDUNIT(dev)); if (wd == NULL) return (ENXIO); part = WDPART(dev); /* Convert to disk sectors. Request must be a multiple of size. */ lp = wd->sc_dk.dk_label; if ((size % lp->d_secsize) != 0) return EFAULT; nblks = size / lp->d_secsize; blkno = blkno / (lp->d_secsize / DEV_BSIZE); /* Check transfer bounds against partition size. */ if ((blkno < 0) || ((blkno + nblks) > lp->d_partitions[part].p_size)) return EINVAL; /* Offset block number to start of partition. */ blkno += lp->d_partitions[part].p_offset; /* Recalibrate, if first dump transfer. */ if (wddumprecalibrated == 0) { wddumprecalibrated = 1; (*wd->atabus->ata_reset_drive)(wd->drvp, AT_POLL | AT_RST_EMERG); wd->drvp->state = RESET; } wd->sc_bp = NULL; wd->sc_wdc_bio.blkno = blkno; wd->sc_wdc_bio.flags = ATA_POLL; if (wd->sc_flags & WDF_LBA48 && (blkno > LBA48_THRESHOLD || (wd->sc_quirks & WD_QUIRK_FORCE_LBA48) != 0)) wd->sc_wdc_bio.flags |= ATA_LBA48; if (wd->sc_flags & WDF_LBA) wd->sc_wdc_bio.flags |= ATA_LBA; wd->sc_wdc_bio.bcount = nblks * lp->d_secsize; wd->sc_wdc_bio.databuf = va; #ifndef WD_DUMP_NOT_TRUSTED switch (wd->atabus->ata_bio(wd->drvp, &wd->sc_wdc_bio)) { case ATACMD_TRY_AGAIN: panic("wddump: try again"); break; case ATACMD_QUEUED: panic("wddump: polled command has been queued"); break; case ATACMD_COMPLETE: break; } switch(wd->sc_wdc_bio.error) { case TIMEOUT: printf("wddump: device timed out"); err = EIO; break; case ERR_DF: printf("wddump: drive fault"); err = EIO; break; case ERR_DMA: printf("wddump: DMA error"); err = EIO; break; case ERROR: printf("wddump: "); wdperror(wd); err = EIO; break; case NOERROR: err = 0; break; default: panic("wddump: unknown error type"); } if (err != 0) { printf("\n"); return err; } #else /* WD_DUMP_NOT_TRUSTED */ /* Let's just talk about this first... */ printf("wd%d: dump addr 0x%x, cylin %d, head %d, sector %d\n", unit, va, cylin, head, sector); delay(500 * 1000); /* half a second */ #endif wddoingadump = 0; return 0; } #ifdef HAS_BAD144_HANDLING /* * Internalize the bad sector table. */ void bad144intern(struct wd_softc *wd) { struct dkbad *bt = &wd->sc_dk.dk_cpulabel->bad; struct disklabel *lp = wd->sc_dk.dk_label; int i = 0; ATADEBUG_PRINT(("bad144intern\n"), DEBUG_XFERS); for (; i < NBT_BAD; i++) { if (bt->bt_bad[i].bt_cyl == 0xffff) break; wd->sc_badsect[i] = bt->bt_bad[i].bt_cyl * lp->d_secpercyl + (bt->bt_bad[i].bt_trksec >> 8) * lp->d_nsectors + (bt->bt_bad[i].bt_trksec & 0xff); } for (; i < NBT_BAD+1; i++) wd->sc_badsect[i] = -1; } #endif static void wd_params_to_properties(struct wd_softc *wd, struct ataparams *params __unused) { prop_dictionary_t disk_info, odisk_info, geom; prop_string_t string; prop_number_t number; disk_info = prop_dictionary_create(); if (strcmp(wd->sc_params.atap_model, "ST506") == 0) string = prop_string_create_cstring_nocopy("ST506"); else { /* XXX Should have a case for ATA here, too. */ string = prop_string_create_cstring_nocopy("ESDI"); } prop_dictionary_set(disk_info, "type", string); prop_object_release(string); geom = prop_dictionary_create(); number = prop_number_create_integer(wd->sc_capacity); prop_dictionary_set(geom, "sectors-per-unit", number); prop_object_release(number); number = prop_number_create_integer(DEV_BSIZE /* XXX 512? */); prop_dictionary_set(geom, "sector-size", number); prop_object_release(number); number = prop_number_create_integer(wd->sc_params.atap_sectors); prop_dictionary_set(geom, "sectors-per-track", number); prop_object_release(number); number = prop_number_create_integer(wd->sc_params.atap_heads); prop_dictionary_set(geom, "tracks-per-cylinder", number); prop_object_release(number); number = prop_number_create_integer( (wd->sc_flags & WDF_LBA) ? wd->sc_capacity / (wd->sc_params.atap_heads * wd->sc_params.atap_sectors) : wd->sc_params.atap_cylinders); prop_dictionary_set(geom, "cylinders-per-unit", number); prop_object_release(number); prop_dictionary_set(disk_info, "geometry", geom); prop_object_release(geom); prop_dictionary_set(device_properties(&wd->sc_dev), "disk-info", disk_info); /* * Don't release disk_info here; we keep a reference to it. * disk_detach() will release it when we go away. */ odisk_info = wd->sc_dk.dk_info; wd->sc_dk.dk_info = disk_info; if (odisk_info) prop_object_release(odisk_info); } int wd_get_params(struct wd_softc *wd, u_int8_t flags, struct ataparams *params) { switch (wd->atabus->ata_get_params(wd->drvp, flags, params)) { case CMD_AGAIN: return 1; case CMD_ERR: /* * We `know' there's a drive here; just assume it's old. * This geometry is only used to read the MBR and print a * (false) attach message. */ strncpy(params->atap_model, "ST506", sizeof params->atap_model); params->atap_config = ATA_CFG_FIXED; params->atap_cylinders = 1024; params->atap_heads = 8; params->atap_sectors = 17; params->atap_multi = 1; params->atap_capabilities1 = params->atap_capabilities2 = 0; wd->drvp->ata_vers = -1; /* Mark it as pre-ATA */ /* FALLTHROUGH */ case CMD_OK: wd_params_to_properties(wd, params); return 0; default: panic("wd_get_params: bad return code from ata_get_params"); /* NOTREACHED */ } } int wd_getcache(struct wd_softc *wd, int *bitsp) { struct ataparams params; if (wd_get_params(wd, AT_WAIT, ¶ms) != 0) return EIO; if (params.atap_cmd_set1 == 0x0000 || params.atap_cmd_set1 == 0xffff || (params.atap_cmd_set1 & WDC_CMD1_CACHE) == 0) { *bitsp = 0; return 0; } *bitsp = DKCACHE_WCHANGE | DKCACHE_READ; if (params.atap_cmd1_en & WDC_CMD1_CACHE) *bitsp |= DKCACHE_WRITE; return 0; } const char at_errbits[] = "\20\10ERROR\11TIMEOU\12DF"; int wd_setcache(struct wd_softc *wd, int bits) { struct ataparams params; struct ata_command ata_c; if (wd_get_params(wd, AT_WAIT, ¶ms) != 0) return EIO; if (params.atap_cmd_set1 == 0x0000 || params.atap_cmd_set1 == 0xffff || (params.atap_cmd_set1 & WDC_CMD1_CACHE) == 0) return EOPNOTSUPP; if ((bits & DKCACHE_READ) == 0 || (bits & DKCACHE_SAVE) != 0) return EOPNOTSUPP; memset(&ata_c, 0, sizeof(struct ata_command)); ata_c.r_command = SET_FEATURES; ata_c.r_st_bmask = 0; ata_c.r_st_pmask = 0; ata_c.timeout = 30000; /* 30s timeout */ ata_c.flags = AT_WAIT; if (bits & DKCACHE_WRITE) ata_c.r_features = WDSF_WRITE_CACHE_EN; else ata_c.r_features = WDSF_WRITE_CACHE_DS; if (wd->atabus->ata_exec_command(wd->drvp, &ata_c) != ATACMD_COMPLETE) { printf("%s: wd_setcache command not complete\n", wd->sc_dev.dv_xname); return EIO; } if (ata_c.flags & (AT_ERROR | AT_TIMEOU | AT_DF)) { char sbuf[sizeof(at_errbits) + 64]; bitmask_snprintf(ata_c.flags, at_errbits, sbuf, sizeof(sbuf)); printf("%s: wd_setcache: status=%s\n", wd->sc_dev.dv_xname, sbuf); return EIO; } return 0; } int wd_standby(struct wd_softc *wd, int flags) { struct ata_command ata_c; memset(&ata_c, 0, sizeof(struct ata_command)); ata_c.r_command = WDCC_STANDBY_IMMED; ata_c.r_st_bmask = WDCS_DRDY; ata_c.r_st_pmask = WDCS_DRDY; ata_c.flags = flags; ata_c.timeout = 30000; /* 30s timeout */ if (wd->atabus->ata_exec_command(wd->drvp, &ata_c) != ATACMD_COMPLETE) { printf("%s: standby immediate command didn't complete\n", wd->sc_dev.dv_xname); return EIO; } if (ata_c.flags & AT_ERROR) { if (ata_c.r_error == WDCE_ABRT) /* command not supported */ return ENODEV; } if (ata_c.flags & (AT_ERROR | AT_TIMEOU | AT_DF)) { char sbuf[sizeof(at_errbits) + 64]; bitmask_snprintf(ata_c.flags, at_errbits, sbuf, sizeof(sbuf)); printf("%s: wd_standby: status=%s\n", wd->sc_dev.dv_xname, sbuf); return EIO; } return 0; } int wd_flushcache(struct wd_softc *wd, int flags) { struct ata_command ata_c; /* * WDCC_FLUSHCACHE is here since ATA-4, but some drives report * only ATA-2 and still support it. */ if (wd->drvp->ata_vers < 4 && ((wd->sc_params.atap_cmd_set2 & WDC_CMD2_FC) == 0 || wd->sc_params.atap_cmd_set2 == 0xffff)) return ENODEV; memset(&ata_c, 0, sizeof(struct ata_command)); if ((wd->sc_params.atap_cmd2_en & ATA_CMD2_LBA48) != 0 && (wd->sc_params.atap_cmd2_en & ATA_CMD2_FCE) != 0) ata_c.r_command = WDCC_FLUSHCACHE_EXT; else ata_c.r_command = WDCC_FLUSHCACHE; ata_c.r_st_bmask = WDCS_DRDY; ata_c.r_st_pmask = WDCS_DRDY; ata_c.flags = flags; ata_c.timeout = 30000; /* 30s timeout */ if (wd->atabus->ata_exec_command(wd->drvp, &ata_c) != ATACMD_COMPLETE) { printf("%s: flush cache command didn't complete\n", wd->sc_dev.dv_xname); return EIO; } if (ata_c.flags & AT_ERROR) { if (ata_c.r_error == WDCE_ABRT) /* command not supported */ return ENODEV; } if (ata_c.flags & (AT_ERROR | AT_TIMEOU | AT_DF)) { char sbuf[sizeof(at_errbits) + 64]; bitmask_snprintf(ata_c.flags, at_errbits, sbuf, sizeof(sbuf)); printf("%s: wd_flushcache: status=%s\n", wd->sc_dev.dv_xname, sbuf); return EIO; } return 0; } void wd_shutdown(void *arg) { struct wd_softc *wd = arg; wd_flushcache(wd, AT_POLL); } /* * Allocate space for a ioctl queue structure. Mostly taken from * scsipi_ioctl.c */ struct wd_ioctl * wi_get(void) { struct wd_ioctl *wi; int s; wi = malloc(sizeof(struct wd_ioctl), M_TEMP, M_WAITOK|M_ZERO); simple_lock_init(&wi->wi_bp.b_interlock); s = splbio(); LIST_INSERT_HEAD(&wi_head, wi, wi_list); splx(s); return (wi); } /* * Free an ioctl structure and remove it from our list */ void wi_free(struct wd_ioctl *wi) { int s; s = splbio(); LIST_REMOVE(wi, wi_list); splx(s); free(wi, M_TEMP); } /* * Find a wd_ioctl structure based on the struct buf. */ struct wd_ioctl * wi_find(struct buf *bp) { struct wd_ioctl *wi; int s; s = splbio(); for (wi = wi_head.lh_first; wi != 0; wi = wi->wi_list.le_next) if (bp == &wi->wi_bp) break; splx(s); return (wi); } /* * Ioctl pseudo strategy routine * * This is mostly stolen from scsipi_ioctl.c:scsistrategy(). What * happens here is: * * - wdioctl() queues a wd_ioctl structure. * * - wdioctl() calls physio/wdioctlstrategy based on whether or not * user space I/O is required. If physio() is called, physio() eventually * calls wdioctlstrategy(). * * - In either case, wdioctlstrategy() calls wd->atabus->ata_exec_command() * to perform the actual command * * The reason for the use of the pseudo strategy routine is because * when doing I/O to/from user space, physio _really_ wants to be in * the loop. We could put the entire buffer into the ioctl request * structure, but that won't scale if we want to do things like download * microcode. */ void wdioctlstrategy(struct buf *bp) { struct wd_ioctl *wi; struct ata_command ata_c; int error = 0; wi = wi_find(bp); if (wi == NULL) { printf("wdioctlstrategy: " "No matching ioctl request found in queue\n"); error = EINVAL; goto bad; } memset(&ata_c, 0, sizeof(ata_c)); /* * Abort if physio broke up the transfer */ if (bp->b_bcount != wi->wi_atareq.datalen) { printf("physio split wd ioctl request... cannot proceed\n"); error = EIO; goto bad; } /* * Abort if we didn't get a buffer size that was a multiple of * our sector size (or was larger than NBBY) */ if ((bp->b_bcount % wi->wi_softc->sc_dk.dk_label->d_secsize) != 0 || (bp->b_bcount / wi->wi_softc->sc_dk.dk_label->d_secsize) >= (1 << NBBY)) { error = EINVAL; goto bad; } /* * Make sure a timeout was supplied in the ioctl request */ if (wi->wi_atareq.timeout == 0) { error = EINVAL; goto bad; } if (wi->wi_atareq.flags & ATACMD_READ) ata_c.flags |= AT_READ; else if (wi->wi_atareq.flags & ATACMD_WRITE) ata_c.flags |= AT_WRITE; if (wi->wi_atareq.flags & ATACMD_READREG) ata_c.flags |= AT_READREG; ata_c.flags |= AT_WAIT; ata_c.timeout = wi->wi_atareq.timeout; ata_c.r_command = wi->wi_atareq.command; ata_c.r_head = wi->wi_atareq.head & 0x0f; ata_c.r_cyl = wi->wi_atareq.cylinder; ata_c.r_sector = wi->wi_atareq.sec_num; ata_c.r_count = wi->wi_atareq.sec_count; ata_c.r_features = wi->wi_atareq.features; ata_c.r_st_bmask = WDCS_DRDY; ata_c.r_st_pmask = WDCS_DRDY; ata_c.data = wi->wi_bp.b_data; ata_c.bcount = wi->wi_bp.b_bcount; if (wi->wi_softc->atabus->ata_exec_command(wi->wi_softc->drvp, &ata_c) != ATACMD_COMPLETE) { wi->wi_atareq.retsts = ATACMD_ERROR; goto bad; } if (ata_c.flags & (AT_ERROR | AT_TIMEOU | AT_DF)) { if (ata_c.flags & AT_ERROR) { wi->wi_atareq.retsts = ATACMD_ERROR; wi->wi_atareq.error = ata_c.r_error; } else if (ata_c.flags & AT_DF) wi->wi_atareq.retsts = ATACMD_DF; else wi->wi_atareq.retsts = ATACMD_TIMEOUT; } else { wi->wi_atareq.retsts = ATACMD_OK; if (wi->wi_atareq.flags & ATACMD_READREG) { wi->wi_atareq.head = ata_c.r_head ; wi->wi_atareq.cylinder = ata_c.r_cyl; wi->wi_atareq.sec_num = ata_c.r_sector; wi->wi_atareq.sec_count = ata_c.r_count; wi->wi_atareq.features = ata_c.r_features; wi->wi_atareq.error = ata_c.r_error; } } bp->b_error = 0; biodone(bp); return; bad: bp->b_flags |= B_ERROR; bp->b_error = error; biodone(bp); }