summaryrefslogtreecommitdiff
path: root/sys/dev/ccd.c
diff options
context:
space:
mode:
Diffstat (limited to 'sys/dev/ccd.c')
-rw-r--r--sys/dev/ccd.c243
1 files changed, 130 insertions, 113 deletions
diff --git a/sys/dev/ccd.c b/sys/dev/ccd.c
index 9d1740c3657..b2ee154bddc 100644
--- a/sys/dev/ccd.c
+++ b/sys/dev/ccd.c
@@ -1,9 +1,10 @@
-/* $OpenBSD: ccd.c,v 1.55 2004/02/15 02:45:46 tedu Exp $ */
+/* $OpenBSD: ccd.c,v 1.56 2005/02/24 19:36:39 mickey Exp $ */
/* $NetBSD: ccd.c,v 1.33 1996/05/05 04:21:14 thorpej Exp $ */
/*-
* Copyright (c) 1996 The NetBSD Foundation, Inc.
* Copyright (c) 1997 Niklas Hallqvist.
+ * Copyright (c) 2005 Michael Shalayeff.
* All rights reserved.
*
* This code is derived from software contributed to The NetBSD Foundation
@@ -92,6 +93,7 @@
*
* Buffer scatter/gather policy by Niklas Hallqvist.
*/
+/*#define CCDDEBUG */
#include <sys/param.h>
#include <sys/systm.h>
@@ -99,6 +101,7 @@
#include <sys/errno.h>
#include <sys/buf.h>
#include <sys/malloc.h>
+#include <sys/pool.h>
#include <sys/namei.h>
#include <sys/stat.h>
#include <sys/ioctl.h>
@@ -140,28 +143,28 @@ int ccddebug = 0x00;
#endif
#define ccdunit(x) DISKUNIT(x)
-
-struct ccdseg {
- caddr_t cs_sgaddr; /* scatter/gather segment addresses */
- long cs_sglen; /* scatter/gather segment lengths */
-};
+#define CCDLABELDEV(dev) \
+ (MAKEDISKDEV(major((dev)), ccdunit((dev)), RAW_PART))
struct ccdbuf {
struct buf cb_buf; /* new I/O buf */
struct buf *cb_obp; /* ptr. to original I/O buf */
- int cb_unit; /* target unit */
+ struct ccd_softc*cb_sc; /* point back to the device */
+ struct ccdbuf *cb_dep; /* mutual ptrs for mirror part */
int cb_comp; /* target component */
int cb_flags; /* misc. flags */
#define CBF_MIRROR 0x01 /* we're for a mirror component */
#define CBF_OLD 0x02 /* use old I/O protocol */
+#define CBF_DONE 0x04 /* this buffer is done */
int cb_sgcnt; /* scatter/gather segment count */
- struct ccdseg *cb_sg; /* scatter/gather segments */
+#define CCD_SGMAX (MAXBSIZE >> PAGE_SHIFT)
+ struct ccdseg {
+ caddr_t cs_sgaddr; /* scatter/gather segment addresses */
+ long cs_sglen; /* scatter/gather segment lengths */
+ } cb_sg[1];
};
-#define CCDLABELDEV(dev) \
- (MAKEDISKDEV(major((dev)), ccdunit((dev)), RAW_PART))
-
/* called by main() at boot time */
void ccdattach(int);
@@ -170,13 +173,14 @@ void ccdiodone(struct buf *);
int ccdsize(dev_t);
void ccdstart(struct ccd_softc *, struct buf *);
-void ccdinterleave(struct ccd_softc *, int);
+void ccdinterleave(struct ccd_softc *);
void ccdintr(struct ccd_softc *, struct buf *);
int ccdinit(struct ccddevice *, char **, struct proc *);
int ccdlookup(char *, struct proc *p, struct vnode **);
long ccdbuffer(struct ccd_softc *, struct buf *, daddr_t, caddr_t,
long, struct ccdbuf **, int);
-void ccdgetdisklabel(dev_t);
+void ccdgetdisklabel(dev_t, struct ccd_softc *, struct disklabel *,
+ struct cpu_disklabel *, int);
void ccdmakedisklabel(struct ccd_softc *);
int ccdlock(struct ccd_softc *);
void ccdunlock(struct ccd_softc *);
@@ -191,28 +195,35 @@ void printiinfo(struct ccdiinfo *);
struct ccd_softc *ccd_softc;
struct ccddevice *ccddevs;
int numccd = 0;
+int ccdbufsizeof;
-/* A separate map so that locking on kernel_map won't happen in interrupts */
-static struct vm_map *ccdmap;
+/*
+ * A separate map so that locking on kernel_map won't happen in interrupts
+ * (XXX due to fragmentation this might fail easy and panic the kernel)
+ */
+struct vm_map *ccdmap;
/*
* Set when a process need some kvm.
* XXX should we fallback to old I/O policy instead when out of ccd kvm?
*/
-static int ccd_need_kvm = 0;
+int ccd_need_kvm = 0;
+
+/*
+ * struct ccdbuf allocator
+ */
+struct pool ccdbufpl;
/*
* Manage the ccd buffer structures.
*/
INLINE struct ccdbuf *
-getccdbuf()
+getccdbuf(void)
{
struct ccdbuf *cbp;
- cbp = malloc(sizeof (struct ccdbuf), M_DEVBUF, M_WAITOK);
- bzero(cbp, sizeof (struct ccdbuf));
- cbp->cb_sg = malloc(sizeof (struct ccdseg) * MAXBSIZE >> PAGE_SHIFT,
- M_DEVBUF, M_WAITOK);
+ if ((cbp = pool_get(&ccdbufpl, PR_WAITOK)))
+ bzero(cbp, ccdbufsizeof);
return (cbp);
}
@@ -220,8 +231,7 @@ INLINE void
putccdbuf(cbp)
struct ccdbuf *cbp;
{
- free((caddr_t)cbp->cb_sg, M_DEVBUF);
- free((caddr_t)cbp, M_DEVBUF);
+ pool_put(&ccdbufpl, cbp);
}
/*
@@ -239,6 +249,12 @@ ccdattach(num)
return;
}
+ ccdbufsizeof = sizeof(struct ccdbuf) +
+ (CCD_SGMAX - 1) * sizeof(struct ccdseg);
+ pool_init(&ccdbufpl, ccdbufsizeof, 0, 0, 0, "ccdbufpl", NULL);
+ pool_setlowat(&ccdbufpl, 16);
+ pool_sethiwat(&ccdbufpl, 1024);
+
ccd_softc = (struct ccd_softc *)malloc(num * sizeof(struct ccd_softc),
M_DEVBUF, M_NOWAIT);
ccddevs = (struct ccddevice *)malloc(num * sizeof(struct ccddevice),
@@ -277,7 +293,8 @@ ccdinit(ccd, cpaths, p)
#ifdef DEBUG
if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
- printf("ccdinit: unit %d\n", ccd->ccd_unit);
+ printf("ccdinit: unit %d cflags %b\n",
+ ccd->ccd_unit, ccd->ccd_flags, CCDF_BITS);
#endif
cs->sc_size = 0;
@@ -442,42 +459,42 @@ ccdinit(ccd, cpaths, p)
* If uniform interleave is desired set all sizes to that of
* the smallest component.
*/
+ ccg->ccg_ntracks = cs->sc_nccunits = cs->sc_nccdisks;
if (ccd->ccd_flags & CCDF_UNIFORM) {
for (ci = cs->sc_cinfo;
ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
ci->ci_size = minsize;
if (ccd->ccd_flags & CCDF_MIRROR)
- cs->sc_size = (cs->sc_nccdisks / 2) * minsize;
- else
- cs->sc_size = cs->sc_nccdisks * minsize;
+ cs->sc_nccunits = ccg->ccg_ntracks /= 2;
+ cs->sc_size = ccg->ccg_ntracks * minsize;
}
+ cs->sc_cflags = ccd->ccd_flags; /* So we can find out later... */
+
/*
* Construct the interleave table.
*/
- ccdinterleave(cs, ccd->ccd_unit);
+ ccdinterleave(cs);
/*
* Create pseudo-geometry based on 1MB cylinders. It's
* pretty close.
*/
ccg->ccg_secsize = DEV_BSIZE;
- ccg->ccg_ntracks = 1;
- ccg->ccg_nsectors = 1024 * (1024 / ccg->ccg_secsize);
- ccg->ccg_ncylinders = cs->sc_size / ccg->ccg_nsectors;
+ ccg->ccg_nsectors = cs->sc_ileave? cs->sc_ileave :
+ 1024 * (1024 / ccg->ccg_secsize);
+ ccg->ccg_ncylinders = cs->sc_size / ccg->ccg_ntracks /
+ ccg->ccg_nsectors;
cs->sc_flags |= CCDF_INITED;
- cs->sc_cflags = ccd->ccd_flags; /* So we can find out later... */
- cs->sc_unit = ccd->ccd_unit;
return (0);
}
void
-ccdinterleave(cs, unit)
+ccdinterleave(cs)
struct ccd_softc *cs;
- int unit;
{
struct ccdcinfo *ci, *smallci;
struct ccdiinfo *ii;
@@ -564,7 +581,7 @@ ccdinterleave(cs, unit)
*/
ix = 0;
for (ci = cs->sc_cinfo;
- ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
+ ci < &cs->sc_cinfo[cs->sc_nccunits]; ci++)
if (ci->ci_size >= smallci->ci_size)
ii->ii_index[ix++] = ci - cs->sc_cinfo;
ii->ii_ndisk = ix;
@@ -612,7 +629,7 @@ ccdopen(dev, flags, fmt, p)
* the in-core disklabel.
*/
if ((cs->sc_flags & CCDF_INITED) && (cs->sc_dkdev.dk_openmask == 0))
- ccdgetdisklabel(dev);
+ ccdgetdisklabel(dev, cs, lp, cs->sc_dkdev.dk_cpulabel, 0);
/* Check that the partition exists. */
if (part != RAW_PART) {
@@ -746,11 +763,12 @@ ccdstart(cs, bp)
caddr_t addr;
daddr_t bn;
struct partition *pp;
- int i, old_io = ccddevs[cs->sc_unit].ccd_flags & CCDF_OLD;
+ int i, old_io = cs->sc_cflags & CCDF_OLD;
#ifdef DEBUG
if (ccddebug & CCDB_FOLLOW)
- printf("ccdstart(%p, %p)\n", cs, bp);
+ printf("ccdstart(%p, %p, %s)\n", cs, bp,
+ bp->b_flags & B_READ? "read" : "write");
#endif
/* Instrumentation. */
@@ -786,9 +804,6 @@ ccdstart(cs, bp)
cbpp[0]->cb_buf.b_vp->v_numoutput++;
VOP_STRATEGY(&cbpp[0]->cb_buf);
- /*
- * Mirror requires additional write.
- */
if ((cs->sc_cflags & CCDF_MIRROR) &&
((cbpp[0]->cb_buf.b_flags & B_READ) == 0)) {
cbpp[1]->cb_buf.b_vp->v_numoutput++;
@@ -839,8 +854,8 @@ ccdbuffer(cs, bp, bn, addr, bcount, cbpp, old_io)
#ifdef DEBUG
if (ccddebug & CCDB_IO)
- printf("ccdbuffer(%p, %p, %d, %p, %ld)\n", cs, bp, bn, addr,
- bcount);
+ printf("ccdbuffer(%p, %p, %d, %p, %ld, %p)\n",
+ cs, bp, bn, addr, bcount, cbpp);
#endif
/*
@@ -874,22 +889,23 @@ ccdbuffer(cs, bp, bn, addr, bcount, cbpp, old_io)
ccdisk = ii->ii_index[0];
cbn = ii->ii_startoff + off;
} else {
- if (cs->sc_cflags & CCDF_MIRROR) {
- ccdisk =
- ii->ii_index[off % (ii->ii_ndisk / 2)];
- cbn = ii->ii_startoff +
- (off / (ii->ii_ndisk / 2));
- /* Mirrored data */
- ci2 =
- &cs->sc_cinfo[ccdisk + (ii->ii_ndisk / 2)];
- } else {
- /* Normal case. */
- ccdisk = ii->ii_index[off % ii->ii_ndisk];
- cbn = ii->ii_startoff + off / ii->ii_ndisk;
- }
+ ccdisk = ii->ii_index[off % ii->ii_ndisk];
+ cbn = ii->ii_startoff + off / ii->ii_ndisk;
+ }
+ if (cs->sc_cflags & CCDF_MIRROR) {
+ /* Mirrored data */
+ ci2 = &cs->sc_cinfo[ccdisk + ii->ii_ndisk];
+ /* spread the read over both parts */
+ if (bp->b_flags & B_READ && cbn & 1)
+ ccdisk += ii->ii_ndisk;
}
cbn *= cs->sc_ileave;
ci = &cs->sc_cinfo[ccdisk];
+#ifdef DEBUG
+ if (ccddebug & CCDB_IO)
+ printf("ccdisk %d cbn %d ci %p ci2 %p\n",
+ ccdisk, cbn, ci, ci2);
+#endif
}
/* Limit the operation at next component border */
@@ -920,7 +936,7 @@ ccdbuffer(cs, bp, bn, addr, bcount, cbpp, old_io)
* context for ccdiodone
*/
cbp->cb_obp = bp;
- cbp->cb_unit = cs->sc_unit;
+ cbp->cb_sc = cs;
cbp->cb_comp = ccdisk;
/* Deal with the different algorithms */
@@ -957,7 +973,8 @@ ccdbuffer(cs, bp, bn, addr, bcount, cbpp, old_io)
cbp->cb_buf.b_vp = ci2->ci_vp;
LIST_INIT(&cbp->cb_buf.b_dep);
cbp->cb_comp = ci2 - cs->sc_cinfo;
- cbpp[1] = cbp;
+ cbp->cb_dep = cbpp[0];
+ cbpp[0]->cb_dep = cbpp[1] = cbp;
}
} else {
/*
@@ -1029,8 +1046,7 @@ ccdiodone(vbp)
{
struct ccdbuf *cbp = (struct ccdbuf *)vbp;
struct buf *bp = cbp->cb_obp;
- int unit = cbp->cb_unit;
- struct ccd_softc *cs = &ccd_softc[unit];
+ struct ccd_softc *cs = cbp->cb_sc;
int old_io = cbp->cb_flags & CBF_OLD;
int cbflags, i;
long count = bp->b_bcount, off;
@@ -1054,6 +1070,7 @@ ccdiodone(vbp)
#endif
if (vbp->b_flags & B_ERROR) {
+ cs->sc_cinfo[cbp->cb_comp].ci_flags |= CCIF_FAILED;
if (cbp->cb_flags & CBF_MIRROR)
comptype = " (mirror)";
else {
@@ -1066,7 +1083,7 @@ ccdiodone(vbp)
printf("%s: error %d on component %d%s\n",
cs->sc_xname, bp->b_error, cbp->cb_comp, comptype);
}
- cbflags = cbp->cb_flags;
+ cbflags = cbp->cb_flags |= CBF_DONE;
if (!old_io) {
/*
@@ -1091,21 +1108,26 @@ ccdiodone(vbp)
}
}
count = vbp->b_bcount;
+
+ if (cbp->cb_dep &&
+ (cbp->cb_dep->cb_flags & CBF_DONE) != (cbflags & CBF_DONE))
+ return;
+
putccdbuf(cbp);
+ if (cbp->cb_dep)
+ putccdbuf(cbp->cb_dep);
- if ((cbflags & CBF_MIRROR) == 0) {
- /*
- * If all done, "interrupt".
- *
- * Note that mirror component buffers aren't counted against
- * the original I/O buffer.
- */
- if (count > bp->b_resid)
- panic("ccdiodone: count");
- bp->b_resid -= count;
- if (bp->b_resid == 0)
- ccdintr(&ccd_softc[unit], bp);
- }
+ /*
+ * If all done, "interrupt".
+ *
+ * Note that mirror component buffers aren't counted against
+ * the original I/O buffer.
+ */
+ if (count > bp->b_resid)
+ panic("ccdiodone: count");
+ bp->b_resid -= count;
+ if (bp->b_resid == 0)
+ ccdintr(cs, bp);
}
/* ARGSUSED */
@@ -1186,18 +1208,28 @@ ccdioctl(dev, cmd, data, flag, p)
if (unit >= numccd)
return (ENXIO);
+
cs = &ccd_softc[unit];
+ if (cmd != CCDIOCSET && !(cs->sc_flags & CCDF_INITED))
+ return (ENXIO);
- bzero(&ccd, sizeof(ccd));
+ /* access control */
+ switch (cmd) {
+ case CCDIOCSET:
+ case CCDIOCCLR:
+ case DIOCWDINFO:
+ case DIOCSDINFO:
+ case DIOCWLABEL:
+ if ((flag & FWRITE) == 0)
+ return (EBADF);
+ }
+ bzero(&ccd, sizeof(ccd));
switch (cmd) {
case CCDIOCSET:
if (cs->sc_flags & CCDF_INITED)
return (EBUSY);
- if ((flag & FWRITE) == 0)
- return (EBADF);
-
if ((error = ccdlock(cs)) != 0)
return (error);
@@ -1206,7 +1238,7 @@ ccdioctl(dev, cmd, data, flag, p)
ccd.ccd_interleave = ccio->ccio_ileave;
ccd.ccd_flags = ccio->ccio_flags & CCDF_USERMASK;
- /* XXX the new code is unstable still */
+ /* new code seems to work now but enable it after a release */
ccd.ccd_flags |= CCDF_OLD;
/*
@@ -1307,19 +1339,13 @@ ccdioctl(dev, cmd, data, flag, p)
disk_attach(&cs->sc_dkdev);
/* Try and read the disklabel. */
- ccdgetdisklabel(dev);
+ ccdgetdisklabel(dev, cs, cs->sc_dkdev.dk_label,
+ cs->sc_dkdev.dk_cpulabel, 0);
ccdunlock(cs);
-
break;
case CCDIOCCLR:
- if ((cs->sc_flags & CCDF_INITED) == 0)
- return (ENXIO);
-
- if ((flag & FWRITE) == 0)
- return (EBADF);
-
if ((error = ccdlock(cs)) != 0)
return (error);
@@ -1382,20 +1408,26 @@ ccdioctl(dev, cmd, data, flag, p)
ccdunlock(cs);
bzero(cs, sizeof(struct ccd_softc));
splx(s);
+ break;
+
+ case DIOCGPDINFO: {
+ struct cpu_disklabel osdep;
+
+ if ((error = ccdlock(cs)) != 0)
+ return (error);
+
+ ccdgetdisklabel(dev, cs, (struct disklabel *)data,
+ &osdep, 1);
+ ccdunlock(cs);
break;
+ }
case DIOCGDINFO:
- if ((cs->sc_flags & CCDF_INITED) == 0)
- return (ENXIO);
-
*(struct disklabel *)data = *(cs->sc_dkdev.dk_label);
break;
case DIOCGPART:
- if ((cs->sc_flags & CCDF_INITED) == 0)
- return (ENXIO);
-
((struct partinfo *)data)->disklab = cs->sc_dkdev.dk_label;
((struct partinfo *)data)->part =
&cs->sc_dkdev.dk_label->d_partitions[DISKPART(dev)];
@@ -1403,12 +1435,6 @@ ccdioctl(dev, cmd, data, flag, p)
case DIOCWDINFO:
case DIOCSDINFO:
- if ((cs->sc_flags & CCDF_INITED) == 0)
- return (ENXIO);
-
- if ((flag & FWRITE) == 0)
- return (EBADF);
-
if ((error = ccdlock(cs)) != 0)
return (error);
@@ -1432,11 +1458,6 @@ ccdioctl(dev, cmd, data, flag, p)
break;
case DIOCWLABEL:
- if ((cs->sc_flags & CCDF_INITED) == 0)
- return (ENXIO);
-
- if ((flag & FWRITE) == 0)
- return (EBADF);
if (*(int *)data != 0)
cs->sc_flags |= CCDF_WLABEL;
else
@@ -1556,15 +1577,11 @@ ccdlookup(path, p, vpp)
* up.
*/
void
-ccdgetdisklabel(dev)
- dev_t dev;
+ccdgetdisklabel(dev_t dev, struct ccd_softc *cs, struct disklabel *lp,
+ struct cpu_disklabel *clp, int spoofonly)
{
- int unit = ccdunit(dev);
- struct ccd_softc *cs = &ccd_softc[unit];
- char *errstring;
- struct disklabel *lp = cs->sc_dkdev.dk_label;
- struct cpu_disklabel *clp = cs->sc_dkdev.dk_cpulabel;
struct ccdgeom *ccg = &cs->sc_geom;
+ char *errstring;
bzero(lp, sizeof(*lp));
bzero(clp, sizeof(*clp));
@@ -1596,7 +1613,7 @@ ccdgetdisklabel(dev)
* Call the generic disklabel extraction routine.
*/
errstring = readdisklabel(CCDLABELDEV(dev), ccdstrategy,
- cs->sc_dkdev.dk_label, cs->sc_dkdev.dk_cpulabel, 0);
+ cs->sc_dkdev.dk_label, cs->sc_dkdev.dk_cpulabel, spoofonly);
if (errstring)
ccdmakedisklabel(cs);