#include <sys/param.h>
#include <sys/systm.h>
#include <sys/kernel.h>
#include <sys/module.h>
#include <sys/bio.h>
#include <sys/malloc.h>
#include <sys/sbuf.h>
#include <geom/geom.h>
#if !defined(CCD_OFFSET)
#define CCD_OFFSET 16
#endif
#define CCDF_UNIFORM 0x02
#define CCDF_MIRROR 0x04
#define CCDF_NO_OFFSET 0x08
#define CCDF_LINUX 0x10
#define CCDF_USERMASK (CCDF_UNIFORM|CCDF_MIRROR)
struct ccdiinfo {
int ii_ndisk;
daddr_t ii_startblk;
daddr_t ii_startoff;
int *ii_index;
};
struct ccdcinfo {
daddr_t ci_size;
struct g_provider *ci_provider;
struct g_consumer *ci_consumer;
};
struct ccd_s {
LIST_ENTRY(ccd_s) list;
int sc_unit;
int sc_flags;
daddr_t sc_size;
int sc_ileave;
u_int sc_ndisks;
struct ccdcinfo *sc_cinfo;
struct ccdiinfo *sc_itable;
uint32_t sc_secsize;
int sc_pick;
daddr_t sc_blk[2];
uint32_t sc_offset;
};
static g_start_t g_ccd_start;
static void ccdiodone(struct bio *bp);
static void ccdinterleave(struct ccd_s *);
static int ccdinit(struct gctl_req *req, struct ccd_s *);
static int ccdbuffer(struct bio **ret, struct ccd_s *,
struct bio *, daddr_t, caddr_t, long);
static void
g_ccd_orphan(struct g_consumer *cp)
{
}
static int
g_ccd_access(struct g_provider *pp, int dr, int dw, int de)
{
struct g_geom *gp;
struct g_consumer *cp1, *cp2;
int error;
de += dr;
de += dw;
gp = pp->geom;
error = ENXIO;
LIST_FOREACH(cp1, &gp->consumer, consumer) {
error = g_access(cp1, dr, dw, de);
if (error) {
LIST_FOREACH(cp2, &gp->consumer, consumer) {
if (cp1 == cp2)
break;
g_access(cp2, -dr, -dw, -de);
}
break;
}
}
return (error);
}
static void
g_ccd_freesc(struct ccd_s *sc)
{
struct ccdiinfo *ii;
g_free(sc->sc_cinfo);
if (sc->sc_itable != NULL) {
for (ii = sc->sc_itable; ii->ii_ndisk > 0; ii++)
g_free(ii->ii_index);
g_free(sc->sc_itable);
}
g_free(sc);
}
static int
ccdinit(struct gctl_req *req, struct ccd_s *cs)
{
struct ccdcinfo *ci;
daddr_t size;
int ix;
daddr_t minsize;
int maxsecsize;
off_t mediasize;
u_int sectorsize;
cs->sc_size = 0;
maxsecsize = 0;
minsize = 0;
if (cs->sc_flags & CCDF_LINUX) {
cs->sc_offset = 0;
cs->sc_ileave *= 2;
if (cs->sc_flags & CCDF_MIRROR && cs->sc_ndisks != 2)
gctl_error(req, "Mirror mode for Linux raids is "
"only supported with 2 devices");
} else {
if (cs->sc_flags & CCDF_NO_OFFSET)
cs->sc_offset = 0;
else
cs->sc_offset = CCD_OFFSET;
}
for (ix = 0; ix < cs->sc_ndisks; ix++) {
ci = &cs->sc_cinfo[ix];
mediasize = ci->ci_provider->mediasize;
sectorsize = ci->ci_provider->sectorsize;
if (sectorsize > maxsecsize)
maxsecsize = sectorsize;
size = mediasize / DEV_BSIZE - cs->sc_offset;
if (cs->sc_ileave > 1)
size -= size % cs->sc_ileave;
if (size == 0) {
gctl_error(req, "Component %s has effective size zero",
ci->ci_provider->name);
return(ENODEV);
}
if (minsize == 0 || size < minsize)
minsize = size;
ci->ci_size = size;
cs->sc_size += size;
}
if ((cs->sc_ileave > 0) &&
(cs->sc_ileave < (maxsecsize / DEV_BSIZE))) {
gctl_error(req, "Interleave to small for sector size");
return(EINVAL);
}
if (cs->sc_flags & CCDF_UNIFORM) {
for (ix = 0; ix < cs->sc_ndisks; ix++) {
ci = &cs->sc_cinfo[ix];
ci->ci_size = minsize;
}
cs->sc_size = cs->sc_ndisks * minsize;
}
if (cs->sc_flags & CCDF_MIRROR) {
if (cs->sc_ndisks % 2) {
gctl_error(req,
"Mirroring requires an even number of disks");
return(EINVAL);
}
if (cs->sc_ileave == 0) {
gctl_error(req,
"An interleave must be specified when mirroring");
return(EINVAL);
}
cs->sc_size = (cs->sc_ndisks/2) * minsize;
}
ccdinterleave(cs);
cs->sc_secsize = maxsecsize;
return (0);
}
static void
ccdinterleave(struct ccd_s *cs)
{
struct ccdcinfo *ci, *smallci;
struct ccdiinfo *ii;
daddr_t bn, lbn;
int ix;
daddr_t size;
size = (cs->sc_ndisks + 1) * sizeof(struct ccdiinfo);
cs->sc_itable = g_malloc(size, M_WAITOK | M_ZERO);
if (cs->sc_ileave == 0) {
bn = 0;
ii = cs->sc_itable;
for (ix = 0; ix < cs->sc_ndisks; ix++) {
ii->ii_index = g_malloc(sizeof(int), M_WAITOK);
ii->ii_ndisk = 1;
ii->ii_startblk = bn;
ii->ii_startoff = 0;
ii->ii_index[0] = ix;
bn += cs->sc_cinfo[ix].ci_size;
ii++;
}
ii->ii_ndisk = 0;
return;
}
size = 0;
bn = lbn = 0;
for (ii = cs->sc_itable; ; ii++) {
ii->ii_index = g_malloc((sizeof(int) * cs->sc_ndisks),
M_WAITOK);
smallci = NULL;
for (ci = cs->sc_cinfo; ci < &cs->sc_cinfo[cs->sc_ndisks];
ci++) {
if (ci->ci_size > size &&
(smallci == NULL ||
ci->ci_size < smallci->ci_size)) {
smallci = ci;
}
}
if (smallci == NULL) {
ii->ii_ndisk = 0;
g_free(ii->ii_index);
ii->ii_index = NULL;
break;
}
ii->ii_startblk = bn / cs->sc_ileave;
ii->ii_startoff = lbn;
ix = 0;
for (ci = cs->sc_cinfo;
ci < &cs->sc_cinfo[cs->sc_ndisks]; ci++) {
if (ci->ci_size >= smallci->ci_size) {
ii->ii_index[ix++] = ci - cs->sc_cinfo;
}
}
ii->ii_ndisk = ix;
bn += ix * (smallci->ci_size - size);
lbn = smallci->ci_size / cs->sc_ileave;
size = smallci->ci_size;
}
}
static void
g_ccd_start(struct bio *bp)
{
long bcount, rcount;
struct bio *cbp[2];
caddr_t addr;
daddr_t bn;
int err;
struct ccd_s *cs;
cs = bp->bio_to->geom->softc;
if(bp->bio_cmd == BIO_GETATTR) {
g_io_deliver(bp, EINVAL);
return;
}
bn = bp->bio_offset / cs->sc_secsize;
addr = bp->bio_data;
for (bcount = bp->bio_length; bcount > 0; bcount -= rcount) {
err = ccdbuffer(cbp, cs, bp, bn, addr, bcount);
if (err) {
bp->bio_completed += bcount;
if (bp->bio_error == 0)
bp->bio_error = err;
if (bp->bio_completed == bp->bio_length)
g_io_deliver(bp, bp->bio_error);
return;
}
rcount = cbp[0]->bio_length;
if (cs->sc_flags & CCDF_MIRROR) {
if (cbp[0]->bio_cmd != BIO_READ) {
g_io_request(cbp[0], cbp[0]->bio_from);
g_io_request(cbp[1], cbp[1]->bio_from);
} else {
int pick = cs->sc_pick;
daddr_t range = cs->sc_size / 16;
if (bn < cs->sc_blk[pick] - range ||
bn > cs->sc_blk[pick] + range
) {
cs->sc_pick = pick = 1 - pick;
}
cs->sc_blk[pick] = bn + btodb(rcount);
g_io_request(cbp[pick], cbp[pick]->bio_from);
}
} else {
g_io_request(cbp[0], cbp[0]->bio_from);
}
bn += btodb(rcount);
addr += rcount;
}
}
static int
ccdbuffer(struct bio **cb, struct ccd_s *cs, struct bio *bp, daddr_t bn, caddr_t addr, long bcount)
{
struct ccdcinfo *ci, *ci2 = NULL;
struct bio *cbp;
daddr_t cbn, cboff;
off_t cbc;
cbn = bn;
cboff = 0;
if (cs->sc_ileave == 0) {
daddr_t sblk;
sblk = 0;
for (ci = cs->sc_cinfo; cbn >= sblk + ci->ci_size; ci++)
sblk += ci->ci_size;
cbn -= sblk;
} else {
struct ccdiinfo *ii;
int ccdisk, off;
cboff = cbn % cs->sc_ileave;
cbn = cbn / cs->sc_ileave;
for (ii = cs->sc_itable; ii->ii_ndisk; ii++) {
if (ii->ii_startblk > cbn)
break;
}
ii--;
off = cbn - ii->ii_startblk;
if (ii->ii_ndisk == 1) {
ccdisk = ii->ii_index[0];
cbn = ii->ii_startoff + off;
} else {
if (cs->sc_flags & CCDF_MIRROR) {
int ndisk2 = ii->ii_ndisk / 2;
ccdisk = ii->ii_index[off % ndisk2];
cbn = ii->ii_startoff + off / ndisk2;
ci2 = &cs->sc_cinfo[ccdisk + ndisk2];
} else {
ccdisk = ii->ii_index[off % ii->ii_ndisk];
cbn = ii->ii_startoff + off / ii->ii_ndisk;
}
}
ci = &cs->sc_cinfo[ccdisk];
cbn *= cs->sc_ileave;
}
cbp = g_clone_bio(bp);
if (cbp == NULL)
return (ENOMEM);
cbp->bio_done = g_std_done;
cbp->bio_offset = dbtob(cbn + cboff + cs->sc_offset);
cbp->bio_data = addr;
if (cs->sc_ileave == 0)
cbc = dbtob((off_t)(ci->ci_size - cbn));
else
cbc = dbtob((off_t)(cs->sc_ileave - cboff));
cbp->bio_length = (cbc < bcount) ? cbc : bcount;
cbp->bio_from = ci->ci_consumer;
cb[0] = cbp;
if (cs->sc_flags & CCDF_MIRROR) {
cbp = g_clone_bio(bp);
if (cbp == NULL)
return (ENOMEM);
cbp->bio_done = cb[0]->bio_done = ccdiodone;
cbp->bio_offset = cb[0]->bio_offset;
cbp->bio_data = cb[0]->bio_data;
cbp->bio_length = cb[0]->bio_length;
cbp->bio_from = ci2->ci_consumer;
cbp->bio_caller1 = cb[0];
cb[0]->bio_caller1 = cbp;
cb[1] = cbp;
}
return (0);
}
static void
ccdiodone(struct bio *cbp)
{
struct bio *mbp, *pbp;
mbp = cbp->bio_caller1;
pbp = cbp->bio_parent;
if (pbp->bio_cmd == BIO_READ) {
if (cbp->bio_error == 0) {
if (mbp != NULL) {
pbp->bio_inbed++;
g_destroy_bio(mbp);
}
g_std_done(cbp);
return;
}
if (mbp != NULL) {
mbp->bio_caller1 = NULL;
pbp->bio_inbed++;
g_destroy_bio(cbp);
g_io_request(mbp, mbp->bio_from);
return;
}
g_std_done(cbp);
return;
}
if (mbp != NULL) {
mbp->bio_caller1 = NULL;
pbp->bio_inbed++;
if (cbp->bio_error != 0 && pbp->bio_error == 0)
pbp->bio_error = cbp->bio_error;
g_destroy_bio(cbp);
return;
}
g_std_done(cbp);
}
static void
g_ccd_create(struct gctl_req *req, struct g_class *mp)
{
int *unit, *ileave, *nprovider;
struct g_geom *gp;
struct g_consumer *cp;
struct g_provider *pp;
struct ccd_s *sc;
struct sbuf *sb;
char buf[20];
int i, error;
g_topology_assert();
unit = gctl_get_paraml(req, "unit", sizeof(*unit));
if (unit == NULL) {
gctl_error(req, "unit parameter not given");
return;
}
ileave = gctl_get_paraml(req, "ileave", sizeof(*ileave));
if (ileave == NULL) {
gctl_error(req, "ileave parameter not given");
return;
}
nprovider = gctl_get_paraml(req, "nprovider", sizeof(*nprovider));
if (nprovider == NULL) {
gctl_error(req, "nprovider parameter not given");
return;
}
LIST_FOREACH(gp, &mp->geom, geom) {
sc = gp->softc;
if (sc != NULL && sc->sc_unit == *unit) {
gctl_error(req, "Unit %d already configured", *unit);
return;
}
}
if (*nprovider <= 0) {
gctl_error(req, "Bogus nprovider argument (= %d)", *nprovider);
return;
}
for (i = 0; i < *nprovider; i++) {
snprintf(buf, sizeof(buf), "provider%d", i);
pp = gctl_get_provider(req, buf);
if (pp == NULL)
return;
}
gp = g_new_geomf(mp, "ccd%d", *unit);
sc = g_malloc(sizeof(*sc), M_WAITOK | M_ZERO);
gp->softc = sc;
sc->sc_ndisks = *nprovider;
sc->sc_cinfo = g_malloc(sc->sc_ndisks * sizeof(struct ccdcinfo),
M_WAITOK | M_ZERO);
for (i = 0; i < *nprovider; i++) {
snprintf(buf, sizeof(buf), "provider%d", i);
pp = gctl_get_provider(req, buf);
cp = g_new_consumer(gp);
error = g_attach(cp, pp);
KASSERT(error == 0, ("attach to %s failed", pp->name));
sc->sc_cinfo[i].ci_consumer = cp;
sc->sc_cinfo[i].ci_provider = pp;
}
sc->sc_unit = *unit;
sc->sc_ileave = *ileave;
if (gctl_get_param(req, "no_offset", NULL))
sc->sc_flags |= CCDF_NO_OFFSET;
if (gctl_get_param(req, "linux", NULL))
sc->sc_flags |= CCDF_LINUX;
if (gctl_get_param(req, "uniform", NULL))
sc->sc_flags |= CCDF_UNIFORM;
if (gctl_get_param(req, "mirror", NULL))
sc->sc_flags |= CCDF_MIRROR;
if (sc->sc_ileave == 0 && (sc->sc_flags & CCDF_MIRROR)) {
printf("%s: disabling mirror, interleave is 0\n", gp->name);
sc->sc_flags &= ~(CCDF_MIRROR);
}
if ((sc->sc_flags & CCDF_MIRROR) && !(sc->sc_flags & CCDF_UNIFORM)) {
printf("%s: mirror/parity forces uniform flag\n", gp->name);
sc->sc_flags |= CCDF_UNIFORM;
}
error = ccdinit(req, sc);
if (error != 0) {
g_ccd_freesc(sc);
gp->softc = NULL;
g_wither_geom(gp, ENXIO);
return;
}
pp = g_new_providerf(gp, "%s", gp->name);
pp->mediasize = sc->sc_size * (off_t)sc->sc_secsize;
pp->sectorsize = sc->sc_secsize;
g_error_provider(pp, 0);
sb = sbuf_new_auto();
sbuf_printf(sb, "ccd%d: %d components ", sc->sc_unit, *nprovider);
for (i = 0; i < *nprovider; i++) {
sbuf_printf(sb, "%s%s",
i == 0 ? "(" : ", ",
sc->sc_cinfo[i].ci_provider->name);
}
sbuf_printf(sb, "), %jd blocks ", (off_t)pp->mediasize / DEV_BSIZE);
if (sc->sc_ileave != 0)
sbuf_printf(sb, "interleaved at %d blocks\n",
sc->sc_ileave);
else
sbuf_printf(sb, "concatenated\n");
sbuf_finish(sb);
gctl_set_param_err(req, "output", sbuf_data(sb), sbuf_len(sb) + 1);
sbuf_delete(sb);
}
static int
g_ccd_destroy_geom(struct gctl_req *req, struct g_class *mp, struct g_geom *gp)
{
struct g_provider *pp;
struct ccd_s *sc;
g_topology_assert();
sc = gp->softc;
pp = LIST_FIRST(&gp->provider);
if (sc == NULL || pp == NULL)
return (EBUSY);
if (pp->acr != 0 || pp->acw != 0 || pp->ace != 0) {
gctl_error(req, "%s is open(r%dw%de%d)", gp->name,
pp->acr, pp->acw, pp->ace);
return (EBUSY);
}
g_ccd_freesc(sc);
gp->softc = NULL;
g_wither_geom(gp, ENXIO);
return (0);
}
static void
g_ccd_list(struct gctl_req *req, struct g_class *mp)
{
struct sbuf *sb;
struct ccd_s *cs;
struct g_geom *gp;
int i, unit, *up;
up = gctl_get_paraml(req, "unit", sizeof(*up));
if (up == NULL) {
gctl_error(req, "unit parameter not given");
return;
}
unit = *up;
sb = sbuf_new_auto();
LIST_FOREACH(gp, &mp->geom, geom) {
cs = gp->softc;
if (cs == NULL || (unit >= 0 && unit != cs->sc_unit))
continue;
sbuf_printf(sb, "ccd%d\t\t%d\t%d\t",
cs->sc_unit, cs->sc_ileave, cs->sc_flags & CCDF_USERMASK);
for (i = 0; i < cs->sc_ndisks; ++i) {
sbuf_printf(sb, "%s/dev/%s", i == 0 ? "" : " ",
cs->sc_cinfo[i].ci_provider->name);
}
sbuf_printf(sb, "\n");
}
sbuf_finish(sb);
gctl_set_param_err(req, "output", sbuf_data(sb), sbuf_len(sb) + 1);
sbuf_delete(sb);
}
static void
g_ccd_config(struct gctl_req *req, struct g_class *mp, char const *verb)
{
struct g_geom *gp;
g_topology_assert();
if (!strcmp(verb, "create geom")) {
g_ccd_create(req, mp);
} else if (!strcmp(verb, "destroy geom")) {
gp = gctl_get_geom(req, mp, "geom");
if (gp != NULL)
g_ccd_destroy_geom(req, mp, gp);
} else if (!strcmp(verb, "list")) {
g_ccd_list(req, mp);
} else {
gctl_error(req, "unknown verb");
}
}
static struct g_class g_ccd_class = {
.name = "CCD",
.version = G_VERSION,
.ctlreq = g_ccd_config,
.destroy_geom = g_ccd_destroy_geom,
.start = g_ccd_start,
.orphan = g_ccd_orphan,
.access = g_ccd_access,
};
DECLARE_GEOM_CLASS(g_ccd_class, g_ccd);
MODULE_VERSION(geom_ccd, 0);