LOAD_BIG_32
w_15 = LOAD_BIG_32(ctx->buf_un.buf32 + 15);
w_14 = LOAD_BIG_32(ctx->buf_un.buf32 + 14);
w_13 = LOAD_BIG_32(ctx->buf_un.buf32 + 13);
w_12 = LOAD_BIG_32(ctx->buf_un.buf32 + 12);
w_11 = LOAD_BIG_32(ctx->buf_un.buf32 + 11);
w_10 = LOAD_BIG_32(ctx->buf_un.buf32 + 10);
w_9 = LOAD_BIG_32(ctx->buf_un.buf32 + 9);
w_8 = LOAD_BIG_32(ctx->buf_un.buf32 + 8);
w_7 = LOAD_BIG_32(ctx->buf_un.buf32 + 7);
w_6 = LOAD_BIG_32(ctx->buf_un.buf32 + 6);
w_5 = LOAD_BIG_32(ctx->buf_un.buf32 + 5);
w_4 = LOAD_BIG_32(ctx->buf_un.buf32 + 4);
w_3 = LOAD_BIG_32(ctx->buf_un.buf32 + 3);
w_2 = LOAD_BIG_32(ctx->buf_un.buf32 + 2);
w_1 = LOAD_BIG_32(ctx->buf_un.buf32 + 1);
w_0 = LOAD_BIG_32(ctx->buf_un.buf32 + 0);
w_15 = LOAD_BIG_32(blk + 60);
w_14 = LOAD_BIG_32(blk + 56);
w_13 = LOAD_BIG_32(blk + 52);
w_12 = LOAD_BIG_32(blk + 48);
w_11 = LOAD_BIG_32(blk + 44);
w_10 = LOAD_BIG_32(blk + 40);
w_9 = LOAD_BIG_32(blk + 36);
w_8 = LOAD_BIG_32(blk + 32);
w_7 = LOAD_BIG_32(blk + 28);
w_6 = LOAD_BIG_32(blk + 24);
w_5 = LOAD_BIG_32(blk + 20);
w_4 = LOAD_BIG_32(blk + 16);
w_3 = LOAD_BIG_32(blk + 12);
w_2 = LOAD_BIG_32(blk + 8);
w_1 = LOAD_BIG_32(blk + 4);
w_0 = LOAD_BIG_32(blk + 0);
W(0) = LOAD_BIG_32((void *)(blk + 0));
W(1) = LOAD_BIG_32((void *)(blk + 4));
W(2) = LOAD_BIG_32((void *)(blk + 8));
W(3) = LOAD_BIG_32((void *)(blk + 12));
W(4) = LOAD_BIG_32((void *)(blk + 16));
W(5) = LOAD_BIG_32((void *)(blk + 20));
W(6) = LOAD_BIG_32((void *)(blk + 24));
W(7) = LOAD_BIG_32((void *)(blk + 28));
W(8) = LOAD_BIG_32((void *)(blk + 32));
W(9) = LOAD_BIG_32((void *)(blk + 36));
W(10) = LOAD_BIG_32((void *)(blk + 40));
W(11) = LOAD_BIG_32((void *)(blk + 44));
W(12) = LOAD_BIG_32((void *)(blk + 48));
W(13) = LOAD_BIG_32((void *)(blk + 52));
W(14) = LOAD_BIG_32((void *)(blk + 56));
W(15) = LOAD_BIG_32((void *)(blk + 60));
w0 = LOAD_BIG_32(blk + 4 * 0);
w1 = LOAD_BIG_32(blk + 4 * 1);
w2 = LOAD_BIG_32(blk + 4 * 2);
w3 = LOAD_BIG_32(blk + 4 * 3);
w4 = LOAD_BIG_32(blk + 4 * 4);
w5 = LOAD_BIG_32(blk + 4 * 5);
w6 = LOAD_BIG_32(blk + 4 * 6);
w7 = LOAD_BIG_32(blk + 4 * 7);
w8 = LOAD_BIG_32(blk + 4 * 8);
w9 = LOAD_BIG_32(blk + 4 * 9);
w10 = LOAD_BIG_32(blk + 4 * 10);
w11 = LOAD_BIG_32(blk + 4 * 11);
w12 = LOAD_BIG_32(blk + 4 * 12);
w13 = LOAD_BIG_32(blk + 4 * 13);
w14 = LOAD_BIG_32(blk + 4 * 14);
w15 = LOAD_BIG_32(blk + 4 * 15);