root/usr/src/uts/common/crypto/io/dca_3des.c

/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

/*
 * Deimos - cryptographic acceleration based upon Broadcom 582x.
 */

#include <sys/types.h>
#include <sys/ddi.h>
#include <sys/sunddi.h>
#include <sys/kmem.h>
#include <sys/note.h>
#include <sys/crypto/common.h>
#include <sys/crypto/spi.h>
#include <sys/crypto/dca.h>

#if defined(__x86)
#include <sys/byteorder.h>
#define UNALIGNED_POINTERS_PERMITTED
#endif

/*
 * 3DES implementation.
 */

static int dca_3desstart(dca_t *, uint32_t, dca_request_t *);
static void dca_3desdone(dca_request_t *, int);


int
dca_3des(crypto_ctx_t *ctx, crypto_data_t *in,
    crypto_data_t *out, crypto_req_handle_t req, int flags)
{
        int                     len;
        int                     rv;
        dca_request_t           *reqp = ctx->cc_provider_private;
        dca_request_t           *des_ctx = ctx->cc_provider_private;
        dca_t                   *dca = ctx->cc_provider;
        crypto_data_t           *nin = &reqp->dr_ctx.in_dup;

        len = dca_length(in);
        if (len % DESBLOCK) {
                DBG(dca, DWARN, "input not an integral number of DES blocks");
                (void) dca_free_context(ctx);
                if (flags & DR_DECRYPT) {
                        return (CRYPTO_ENCRYPTED_DATA_LEN_RANGE);
                } else {
                        return (CRYPTO_DATA_LEN_RANGE);
                }
        }

        /*
         * If cd_miscdata non-null then this contains the IV.
         */
        if (in->cd_miscdata != NULL) {
#ifdef UNALIGNED_POINTERS_PERMITTED
                uint32_t        *p = (uint32_t *)in->cd_miscdata;
                des_ctx->dr_ctx.iv[0] = htonl(p[0]);
                des_ctx->dr_ctx.iv[1] = htonl(p[1]);
#else
                uchar_t *p = (uchar_t *)in->cd_miscdata;
                des_ctx->dr_ctx.iv[0] = p[0]<<24 | p[1]<<16 | p[2]<<8 | p[3];
                des_ctx->dr_ctx.iv[1] = p[4]<<24 | p[5]<<16 | p[6]<<8 | p[7];
#endif  /* UNALIGNED_POINTERS_PERMITTED */
        }

        if (len > dca_length(out)) {
                DBG(dca, DWARN, "inadequate output space (need %d, got %d)",
                    len, dca_length(out));
                out->cd_length = len;
                /* Do not free the context since the app will call again */
                return (CRYPTO_BUFFER_TOO_SMALL);
        }

        if ((rv = dca_verifyio(in, out)) != CRYPTO_SUCCESS) {
                (void) dca_free_context(ctx);
                return (rv);
        }

        /* special handling for null-sized input buffers */
        if (len == 0) {
                out->cd_length = 0;
                (void) dca_free_context(ctx);
                return (CRYPTO_SUCCESS);
        }

        /*
         * Make a local copy of the input crypto_data_t structure. This
         * allows it to be manipulated locally and for dealing with in-place
         * data (ie in == out). Note that "nin" has been pre-allocated,
         * and only fields are copied, not actual data.
         */
        if ((rv = dca_dupcrypto(in, nin)) != CRYPTO_SUCCESS) {
                (void) dca_free_context(ctx);
                return (rv);
        }

        /* Set output to zero ready to take the processed data */
        out->cd_length = 0;

        reqp->dr_kcf_req = req;
        reqp->dr_in = nin;
        reqp->dr_out = out;
        reqp->dr_job_stat = DS_3DESJOBS;
        reqp->dr_byte_stat = DS_3DESBYTES;

        rv = dca_3desstart(dca, flags, reqp);

        /* Context will be freed in the kCF callback function otherwise */
        if (rv != CRYPTO_QUEUED && rv != CRYPTO_BUFFER_TOO_SMALL) {
                (void) dca_free_context(ctx);
        }
        return (rv);
}


void
dca_3desctxfree(void *arg)
{
        crypto_ctx_t    *ctx = (crypto_ctx_t *)arg;
        dca_request_t   *des_ctx = ctx->cc_provider_private;

        if (des_ctx == NULL)
                return;

        des_ctx->dr_ctx.atomic = 0;
        des_ctx->dr_ctx.ctx_cm_type = 0;
        ctx->cc_provider_private = NULL;

        if (des_ctx->destroy)
                dca_destroyreq(des_ctx);
        else
                /* Return it to the pool */
                dca_freereq(des_ctx);
}

int
dca_3desupdate(crypto_ctx_t *ctx, crypto_data_t *in,
    crypto_data_t *out, crypto_req_handle_t req, int flags)
{
        int                     len;
        int                     rawlen;
        int                     rv;
        dca_request_t           *reqp = ctx->cc_provider_private;
        dca_request_t           *des_ctx = ctx->cc_provider_private;
        dca_t                   *dca = ctx->cc_provider;
        crypto_data_t           *nin = &reqp->dr_ctx.in_dup;

        rawlen = dca_length(in) + des_ctx->dr_ctx.residlen;

        len = ROUNDDOWN(rawlen, DESBLOCK);
        /*
         * If cd_miscdata non-null then this contains the IV.
         */
        if (in->cd_miscdata != NULL) {
#ifdef UNALIGNED_POINTERS_PERMITTED
                uint32_t        *p = (uint32_t *)in->cd_miscdata;
                des_ctx->dr_ctx.iv[0] = htonl(p[0]);
                des_ctx->dr_ctx.iv[1] = htonl(p[1]);
#else
                uchar_t *p = (uchar_t *)in->cd_miscdata;
                des_ctx->dr_ctx.iv[0] = p[0]<<24 | p[1]<<16 | p[2]<<8 | p[3];
                des_ctx->dr_ctx.iv[1] = p[4]<<24 | p[5]<<16 | p[6]<<8 | p[7];
#endif  /* UNALIGNED_POINTERS_PERMITTED */
        }

        if (len > dca_length(out)) {
                DBG(dca, DWARN, "not enough output space (need %d, got %d)",
                    len, dca_length(out));
                out->cd_length = len;
                /* Do not free the context since the app will call again */
                return (CRYPTO_BUFFER_TOO_SMALL);
        }

        if ((rv = dca_verifyio(in, out)) != CRYPTO_SUCCESS) {
                (void) dca_free_context(ctx);
                return (rv);
        }

        reqp->dr_kcf_req = req;

        /*
         * From here on out, we are committed.
         */

        if (len == 0) {
                /*
                 * No blocks being encrypted, so we just accumulate the
                 * input for the next pass and return.
                 */
                if ((rv = dca_getbufbytes(in, 0,
                    (rawlen % DESBLOCK) - des_ctx->dr_ctx.residlen,
                    des_ctx->dr_ctx.resid + des_ctx->dr_ctx.residlen)) !=
                    CRYPTO_SUCCESS) {
                        DBG(dca, DWARN,
            "dca_3desupdate: dca_getbufbytes() failed for residual only pass");
                        dca_freereq(reqp);
                        return (rv);
                }
                des_ctx->dr_ctx.residlen = rawlen % DESBLOCK;

                out->cd_length = 0;
                /*
                 * Do not free the context here since it will be done
                 * in the final function
                 */
                return (CRYPTO_SUCCESS);
        }

        /*
         * Set up rbuf for previous residual data.
         */
        if (des_ctx->dr_ctx.residlen) {
                bcopy(des_ctx->dr_ctx.resid, des_ctx->dr_ctx.activeresid,
                    des_ctx->dr_ctx.residlen);
                des_ctx->dr_ctx.activeresidlen = des_ctx->dr_ctx.residlen;
        }

        /*
         * Locate and save residual data for next encrypt_update.
         */
        if ((rv = dca_getbufbytes(in, len - des_ctx->dr_ctx.residlen,
            rawlen % DESBLOCK, des_ctx->dr_ctx.resid)) != CRYPTO_SUCCESS) {
                DBG(dca, DWARN, "dca_3desupdate: dca_getbufbytes() failed");
                (void) dca_free_context(ctx);
                return (rv);
        }

        /* Calculate new residual length. */
        des_ctx->dr_ctx.residlen = rawlen % DESBLOCK;

        /*
         * Make a local copy of the input crypto_data_t structure. This
         * allows it to be manipulated locally and for dealing with in-place
         * data (ie in == out).
         */
        if ((rv = dca_dupcrypto(in, nin)) != CRYPTO_SUCCESS) {
                (void) dca_free_context(ctx);
                return (rv);
        }

        /* Set output to zero ready to take the processed data */
        out->cd_length = 0;

        reqp->dr_in = nin;
        reqp->dr_out = out;
        reqp->dr_job_stat = DS_3DESJOBS;
        reqp->dr_byte_stat = DS_3DESBYTES;

        rv = dca_3desstart(dca, flags, reqp);

        /*
         * As this is multi-part the context is cleared on success
         * (CRYPTO_QUEUED) in dca_3desfinal().
         */

        if (rv != CRYPTO_QUEUED && rv != CRYPTO_BUFFER_TOO_SMALL) {
                (void) dca_free_context(ctx);
        }
        return (rv);
}

int
dca_3desfinal(crypto_ctx_t *ctx, crypto_data_t *out, int mode)
{
        dca_request_t   *des_ctx = ctx->cc_provider_private;
        dca_t           *dca = ctx->cc_provider;
        int             rv = CRYPTO_SUCCESS;

        ASSERT(ctx->cc_provider_private != NULL);
        /*
         * There must be no unprocessed ciphertext/plaintext.
         * This happens if the length of the last data is
         * not a multiple of the DES block length.
         */
        if (des_ctx->dr_ctx.residlen != 0) {
                DBG(dca, DWARN, "dca_3desfinal: invalid nonzero residual");
                if (mode & DR_DECRYPT) {
                        rv = CRYPTO_ENCRYPTED_DATA_LEN_RANGE;
                } else {
                        rv = CRYPTO_DATA_LEN_RANGE;
                }
        }
        (void) dca_free_context(ctx);
        out->cd_length = 0;
        return (rv);
}

int
dca_3desatomic(crypto_provider_handle_t provider,
    crypto_session_id_t session_id, crypto_mechanism_t *mechanism,
    crypto_key_t *key, crypto_data_t *input, crypto_data_t *output,
    int kmflag, crypto_req_handle_t req, int mode)
{
        crypto_ctx_t    ctx;    /* on the stack */
        int             rv;

        ctx.cc_provider = provider;
        ctx.cc_session = session_id;

        /*
         * Input must be a multiple of the block size. This test only
         * works for non-padded mechanisms when the blocksize is 2^N.
         */
        if ((dca_length(input) & (DESBLOCK - 1)) != 0) {
                DBG(NULL, DWARN, "dca_3desatomic: input not multiple of BS");
                if (mode & DR_DECRYPT) {
                        return (CRYPTO_ENCRYPTED_DATA_LEN_RANGE);
                } else {
                        return (CRYPTO_DATA_LEN_RANGE);
                }
        }

        rv = dca_3desctxinit(&ctx, mechanism, key, kmflag, mode);
        if (rv != CRYPTO_SUCCESS) {
                DBG(NULL, DWARN, "dca_3desatomic: dca_3desctxinit() failed");
                return (rv);
        }

        /*
         * Set the atomic flag so that the hardware callback function
         * will free the context.
         */
        ((dca_request_t *)ctx.cc_provider_private)->dr_ctx.atomic = 1;

        /* check for inplace ops */
        if (input == output) {
                ((dca_request_t *)ctx.cc_provider_private)->dr_flags
                    |= DR_INPLACE;
        }

        rv = dca_3des(&ctx, input, output, req, mode);
        if ((rv != CRYPTO_QUEUED) && (rv != CRYPTO_SUCCESS)) {
                DBG(NULL, DWARN, "dca_3desatomic: dca_3des() failed");
                output->cd_length = 0;
        }

        /*
         * The features of dca_3desfinal() are implemented within
         * dca_3desdone() due to the asynchronous nature of dca_3des().
         */

        /*
         * The context will be freed in the hardware callback function if it
         * is queued
         */
        if (rv != CRYPTO_QUEUED)
                dca_3desctxfree(&ctx);

        return (rv);
}

int
dca_3desstart(dca_t *dca, uint32_t flags, dca_request_t *reqp)
{
        size_t          len;
        crypto_data_t   *in = reqp->dr_in;
        int             rv;
        dca_request_t   *ctx = reqp;
        uint32_t        iv[2];

        /*
         * Preconditions:
         * 1) in and out point to the "right" buffers.
         * 2) in->b_bcount - in->b_resid == initial offset
         * 3) likewise for out
         * 4) there is enough space in the output
         * 5) we perform a block for block encrypt
         */
        len = ctx->dr_ctx.activeresidlen + dca_length(in);
        len = ROUNDDOWN(min(len, MAXPACKET), DESBLOCK);
        reqp->dr_pkt_length = (uint16_t)len;

        /* collect IVs for this pass */
        iv[0] = ctx->dr_ctx.iv[0];
        iv[1] = ctx->dr_ctx.iv[1];

        /*
         * And also, for decrypt, collect the IV for the next pass.  For
         * decrypt, the IV must be collected BEFORE decryption, or else
         * we will lose it.  (For encrypt, we grab the IV AFTER encryption,
         * in dca_3desdone.
         */
        if (flags & DR_DECRYPT) {
                uchar_t         ivstore[DESBLOCK];
#ifdef UNALIGNED_POINTERS_PERMITTED
                uint32_t        *ivp = (uint32_t *)ivstore;
#else
                uchar_t         *ivp = ivstore;
#endif  /* UNALIGNED_POINTERS_PERMITTED */

                /* get last 8 bytes of ciphertext for IV of next op */
                /*
                 * If we're processing only a DESBLOCKS worth of data
                 * and there is active residual present then it will be
                 * needed for the IV also.
                 */
                if ((len == DESBLOCK) && ctx->dr_ctx.activeresidlen) {
                        /* Bring the active residual into play */
                        bcopy(ctx->dr_ctx.activeresid, ivstore,
                            ctx->dr_ctx.activeresidlen);
                        rv = dca_getbufbytes(in, 0,
                            DESBLOCK - ctx->dr_ctx.activeresidlen,
                            ivstore + ctx->dr_ctx.activeresidlen);
                } else {
                        rv = dca_getbufbytes(in,
                            len - DESBLOCK - ctx->dr_ctx.activeresidlen,
                            DESBLOCK, ivstore);
                }

                if (rv != CRYPTO_SUCCESS) {
                        DBG(dca, DWARN,
                            "dca_3desstart: dca_getbufbytes() failed");
                        return (rv);
                }

                /* store as a pair of native 32-bit values */
#ifdef UNALIGNED_POINTERS_PERMITTED
                ctx->dr_ctx.iv[0] = htonl(ivp[0]);
                ctx->dr_ctx.iv[1] = htonl(ivp[1]);
#else
                ctx->dr_ctx.iv[0] =
                    ivp[0]<<24 | ivp[1]<<16 | ivp[2]<<8 | ivp[3];
                ctx->dr_ctx.iv[1] =
                    ivp[4]<<24 | ivp[5]<<16 | ivp[6]<<8 | ivp[7];
#endif  /* UNALIGNED_POINTERS_PERMITTED */
        }

        /* For now we force a pullup.  Add direct DMA later. */
        reqp->dr_flags &= ~(DR_SCATTER | DR_GATHER);
        if ((len < dca_mindma) || (ctx->dr_ctx.activeresidlen > 0) ||
            dca_sgcheck(dca, reqp->dr_in, DCA_SG_CONTIG) ||
            dca_sgcheck(dca, reqp->dr_out, DCA_SG_WALIGN)) {
                reqp->dr_flags |= DR_SCATTER | DR_GATHER;
        }

        /* Try to do direct DMA. */
        if (!(reqp->dr_flags & (DR_SCATTER | DR_GATHER))) {
                if (dca_bindchains(reqp, len, len) == DDI_SUCCESS) {
                        reqp->dr_in->cd_offset += len;
                        reqp->dr_in->cd_length -= len;
                } else {
                        DBG(dca, DWARN,
                            "dca_3desstart: dca_bindchains() failed");
                        return (CRYPTO_DEVICE_ERROR);
                }
        }

        /* gather the data into the device */
        if (reqp->dr_flags & DR_GATHER) {
                rv = dca_resid_gather(in, (char *)ctx->dr_ctx.activeresid,
                    &ctx->dr_ctx.activeresidlen, reqp->dr_ibuf_kaddr, len);
                if (rv != CRYPTO_SUCCESS) {
                        DBG(dca, DWARN,
                            "dca_3desstart: dca_resid_gather() failed");
                        return (rv);
                }
                /*
                 * Setup for scattering the result back out
                 * The output buffer is a multi-entry chain for x86 and
                 * a single entry chain for Sparc.
                 * Use the actual length if the first entry is sufficient.
                 */
                (void) ddi_dma_sync(reqp->dr_ibuf_dmah, 0, len,
                    DDI_DMA_SYNC_FORDEV);
                if (dca_check_dma_handle(dca, reqp->dr_ibuf_dmah,
                    DCA_FM_ECLASS_NONE) != DDI_SUCCESS) {
                        reqp->destroy = TRUE;
                        return (CRYPTO_DEVICE_ERROR);
                }

                reqp->dr_in_paddr = reqp->dr_ibuf_head.dc_buffer_paddr;
                reqp->dr_in_next = reqp->dr_ibuf_head.dc_next_paddr;
                if (len > reqp->dr_ibuf_head.dc_buffer_length)
                        reqp->dr_in_len = reqp->dr_ibuf_head.dc_buffer_length;
                else
                        reqp->dr_in_len = len;
        }
        /*
         * Setup for scattering the result back out
         * The output buffer is a multi-entry chain for x86 and
         * a single entry chain for Sparc.
         * Use the actual length if the first entry is sufficient.
         */
        if (reqp->dr_flags & DR_SCATTER) {
                reqp->dr_out_paddr = reqp->dr_obuf_head.dc_buffer_paddr;
                reqp->dr_out_next = reqp->dr_obuf_head.dc_next_paddr;
                if (len > reqp->dr_obuf_head.dc_buffer_length)
                        reqp->dr_out_len = reqp->dr_obuf_head.dc_buffer_length;
                else
                        reqp->dr_out_len = len;
        }

        reqp->dr_flags |= flags;
        reqp->dr_callback = dca_3desdone;

        /* write out the context structure */
        PUTCTX32(reqp, CTX_3DESIVHI, iv[0]);
        PUTCTX32(reqp, CTX_3DESIVLO, iv[1]);

        /* schedule the work by doing a submit */
        return (dca_start(dca, reqp, MCR1, 1));
}

void
dca_3desdone(dca_request_t *reqp, int errno)
{
        crypto_data_t   *out = reqp->dr_out;
        dca_request_t   *ctx = reqp;
        ASSERT(ctx != NULL);

        if (errno == CRYPTO_SUCCESS) {
                size_t          off;
                /*
                 * Save the offset: this has to be done *before* dca_scatter
                 * modifies the buffer.  We take the initial offset into the
                 * first buf, and add that to the total packet size to find
                 * the end of the packet.
                 */
                off = dca_length(out) + reqp->dr_pkt_length - DESBLOCK;

                if (reqp->dr_flags & DR_SCATTER) {
                        (void) ddi_dma_sync(reqp->dr_obuf_dmah, 0,
                            reqp->dr_out_len, DDI_DMA_SYNC_FORKERNEL);
                        if (dca_check_dma_handle(reqp->dr_dca,
                            reqp->dr_obuf_dmah, DCA_FM_ECLASS_NONE) !=
                            DDI_SUCCESS) {
                                reqp->destroy = TRUE;
                                errno = CRYPTO_DEVICE_ERROR;
                                goto errout;
                        }

                        errno = dca_scatter(reqp->dr_obuf_kaddr,
                            reqp->dr_out, reqp->dr_out_len, 0);
                        if (errno != CRYPTO_SUCCESS) {
                                DBG(NULL, DWARN,
                                    "dca_3desdone: dca_scatter() failed");
                                goto errout;
                        }

                } else {
                        /* we've processed some more data */
                        out->cd_length += reqp->dr_pkt_length;
                }


                /*
                 * For encryption only, we have to grab the IV for the
                 * next pass AFTER encryption.
                 */
                if (reqp->dr_flags & DR_ENCRYPT) {
                        uchar_t         ivstore[DESBLOCK];
#ifdef UNALIGNED_POINTERS_PERMITTED
                        uint32_t        *iv = (uint32_t *)ivstore;
#else
                        uchar_t         *iv = ivstore;
#endif  /* UNALIGNED_POINTERS_PERMITTED */

                        /* get last 8 bytes for IV of next op */
                        errno = dca_getbufbytes(out, off, DESBLOCK,
                            (uchar_t *)iv);
                        if (errno != CRYPTO_SUCCESS) {
                                DBG(NULL, DWARN,
                                    "dca_3desdone: dca_getbufbytes() failed");
                                goto errout;
                        }

                        /* store as a pair of native 32-bit values */
#ifdef UNALIGNED_POINTERS_PERMITTED
                        ctx->dr_ctx.iv[0] = htonl(iv[0]);
                        ctx->dr_ctx.iv[1] = htonl(iv[1]);
#else
                        ctx->dr_ctx.iv[0] =
                            iv[0]<<24 | iv[1]<<16 | iv[2]<<8 | iv[3];
                        ctx->dr_ctx.iv[1] =
                            iv[4]<<24 | iv[5]<<16 | iv[6]<<8 | iv[7];
#endif  /* UNALIGNED_POINTERS_PERMITTED */
                }

                /*
                 * If there is more to do, then reschedule another
                 * pass.
                 */
                if (dca_length(reqp->dr_in) >= 8) {
                        errno = dca_3desstart(reqp->dr_dca, reqp->dr_flags,
                            reqp);
                        if (errno == CRYPTO_QUEUED) {
                                return;
                        }
                }
        }

errout:

        /*
         * If this is an atomic operation perform the final function
         * tasks (equivalent to to dca_3desfinal()).
         */
        if (reqp->dr_ctx.atomic) {
                if ((errno == CRYPTO_SUCCESS) && (ctx->dr_ctx.residlen != 0)) {
                        DBG(NULL, DWARN,
                            "dca_3desdone: invalid nonzero residual");
                        if (reqp->dr_flags & DR_DECRYPT) {
                                errno = CRYPTO_ENCRYPTED_DATA_LEN_RANGE;
                        } else {
                                errno = CRYPTO_DATA_LEN_RANGE;
                        }
                }
        }

        ASSERT(reqp->dr_kcf_req != NULL);
        /* notify framework that request is completed */
        crypto_op_notification(reqp->dr_kcf_req, errno);
        DBG(NULL, DINTR,
            "dca_3desdone: returning %d to the kef via crypto_op_notification",
            errno);

        /* This has to be done after notifing the framework */
        if (reqp->dr_ctx.atomic) {
                reqp->dr_context = NULL;
                reqp->dr_ctx.atomic = 0;
                reqp->dr_ctx.ctx_cm_type = 0;
                if (reqp->destroy)
                        dca_destroyreq(reqp);
                else
                        dca_freereq(reqp);
        }
}

/* ARGSUSED */
int
dca_3desctxinit(crypto_ctx_t *ctx, crypto_mechanism_t *mechanism,
    crypto_key_t *key, int kmflag, int flags)
{
        dca_request_t   *des_ctx;
        dca_t           *dca = ctx->cc_provider;
#ifdef UNALIGNED_POINTERS_PERMITTED
        uint32_t        *param;
        uint32_t        *value32;
#else
        uchar_t         *param;
#endif  /* UNALIGNED_POINTERS_PERMITTED */
        uchar_t         *value;
        size_t          paramsz;
        unsigned        len;
        int             i, j;

        paramsz = mechanism->cm_param_len;
#ifdef UNALIGNED_POINTERS_PERMITTED
        param = (uint32_t *)mechanism->cm_param;
#else
        param = (uchar_t *)mechanism->cm_param;
#endif  /* UNALIGNED_POINTERS_PERMITTED */

        if ((paramsz != 0) && (paramsz != DES_IV_LEN)) {
                DBG(NULL, DWARN,
                    "dca_3desctxinit: parameter(IV) length not %d (%d)",
                    DES_IV_LEN, paramsz);
                return (CRYPTO_MECHANISM_PARAM_INVALID);
        }

        if ((des_ctx = dca_getreq(dca, MCR1, 1)) == NULL) {
                dca_error(dca, "unable to allocate request for 3DES");
                return (CRYPTO_HOST_MEMORY);
        }
        /*
         * Identify and store the IV as a pair of native 32-bit words.
         *
         * If cm_param == NULL then the IV comes from the cd_miscdata field
         * in the crypto_data structure.
         */
        if (param != NULL) {
                ASSERT(paramsz == DES_IV_LEN);
#ifdef UNALIGNED_POINTERS_PERMITTED
                des_ctx->dr_ctx.iv[0] = htonl(param[0]);
                des_ctx->dr_ctx.iv[1] = htonl(param[1]);
#else
                des_ctx->dr_ctx.iv[0] = param[0]<<24 | param[1]<<16 |
                    param[2]<<8 | param[3];
                des_ctx->dr_ctx.iv[1] = param[4]<<24 | param[5]<<16 |
                    param[6]<<8 | param[7];
#endif  /* UNALIGNED_POINTERS_PERMITTED */
        }
        des_ctx->dr_ctx.residlen = 0;
        des_ctx->dr_ctx.activeresidlen = 0;
        des_ctx->dr_ctx.ctx_cm_type = mechanism->cm_type;
        ctx->cc_provider_private = des_ctx;

        if (key->ck_format != CRYPTO_KEY_RAW) {
                DBG(NULL, DWARN,
        "dca_3desctxinit: only raw crypto key type support with DES/3DES");
                dca_3desctxfree(ctx);
                return (CRYPTO_KEY_TYPE_INCONSISTENT);
        }

        len = key->ck_length;
        value = (uchar_t *)key->ck_data;

        if (flags & DR_TRIPLE) {
                /* 3DES */
                switch (len) {
                case 192:
                        for (i = 0; i < 6; i++) {
                                des_ctx->dr_ctx.key[i] = 0;
                                for (j = 0; j < 4; j++) {
                                        des_ctx->dr_ctx.key[i] <<= 8;
                                        des_ctx->dr_ctx.key[i] |= *value;
                                        value++;
                                }
                        }
                        break;

                case 128:
                        for (i = 0; i < 4; i++) {
                                des_ctx->dr_ctx.key[i] = 0;
                                for (j = 0; j < 4; j++) {
                                        des_ctx->dr_ctx.key[i] <<= 8;
                                        des_ctx->dr_ctx.key[i] |= *value;
                                        value++;
                                }
                        }
                        des_ctx->dr_ctx.key[4] = des_ctx->dr_ctx.key[0];
                        des_ctx->dr_ctx.key[5] = des_ctx->dr_ctx.key[1];
                        break;

                default:
                        DBG(NULL, DWARN, "Incorrect 3DES keysize (%d)", len);
                        dca_3desctxfree(ctx);
                        return (CRYPTO_KEY_SIZE_RANGE);
                }
        } else {
                /* single DES */
                if (len != 64) {
                        DBG(NULL, DWARN, "Incorrect DES keysize (%d)", len);
                        dca_3desctxfree(ctx);
                        return (CRYPTO_KEY_SIZE_RANGE);
                }

#ifdef UNALIGNED_POINTERS_PERMITTED
                value32 = (uint32_t *)value;
                des_ctx->dr_ctx.key[0] = htonl(value32[0]);
                des_ctx->dr_ctx.key[1] = htonl(value32[1]);
#else
                des_ctx->dr_ctx.key[0] =
                    value[0]<<24 | value[1]<<16 | value[2]<<8 | value[3];
                des_ctx->dr_ctx.key[1] =
                    value[4]<<24 | value[5]<<16 | value[6]<<8 | value[7];
#endif  /* UNALIGNED_POINTERS_PERMITTED */

                /* for single des just repeat des key */
                des_ctx->dr_ctx.key[4] =
                    des_ctx->dr_ctx.key[2] = des_ctx->dr_ctx.key[0];
                des_ctx->dr_ctx.key[5] =
                    des_ctx->dr_ctx.key[3] = des_ctx->dr_ctx.key[1];
        }

        /*
         * Setup the context here so that we do not need to setup it up
         * for every update
         */
        PUTCTX16(des_ctx, CTX_LENGTH, CTX_3DES_LENGTH);
        PUTCTX16(des_ctx, CTX_CMD, CMD_3DES);
        PUTCTX32(des_ctx, CTX_3DESDIRECTION,
            flags & DR_ENCRYPT ? CTX_3DES_ENCRYPT : CTX_3DES_DECRYPT);
        PUTCTX32(des_ctx, CTX_3DESKEY1HI, des_ctx->dr_ctx.key[0]);
        PUTCTX32(des_ctx, CTX_3DESKEY1LO, des_ctx->dr_ctx.key[1]);
        PUTCTX32(des_ctx, CTX_3DESKEY2HI, des_ctx->dr_ctx.key[2]);
        PUTCTX32(des_ctx, CTX_3DESKEY2LO, des_ctx->dr_ctx.key[3]);
        PUTCTX32(des_ctx, CTX_3DESKEY3HI, des_ctx->dr_ctx.key[4]);
        PUTCTX32(des_ctx, CTX_3DESKEY3LO, des_ctx->dr_ctx.key[5]);

        return (CRYPTO_SUCCESS);
}