GETU32
tmp[0] = GETU32(plaintext);
tmp[1] = GETU32(plaintext + 4);
tmp[2] = GETU32(plaintext + 8);
tmp[3] = GETU32(plaintext + 12);
tmp[0] = GETU32(ciphertext);
tmp[1] = GETU32(ciphertext + 4);
tmp[2] = GETU32(ciphertext + 8);
tmp[3] = GETU32(ciphertext + 12);
kll = GETU32(key );
klr = GETU32(key + 4);
krl = GETU32(key + 8);
krr = GETU32(key + 12);
kll = GETU32(key );
klr = GETU32(key + 4);
krl = GETU32(key + 8);
krr = GETU32(key + 12);
krll = GETU32(key + 16);
krlr = GETU32(key + 20);
krrl = GETU32(key + 24);
krrr = GETU32(key + 28);
rk[0] = GETU32(cipherKey );
rk[1] = GETU32(cipherKey + 4);
rk[2] = GETU32(cipherKey + 8);
rk[3] = GETU32(cipherKey + 12);
rk[4] = GETU32(cipherKey + 16);
rk[5] = GETU32(cipherKey + 20);
rk[6] = GETU32(cipherKey + 24);
rk[7] = GETU32(cipherKey + 28);
s0 = GETU32(pt ) ^ rk[0];
s1 = GETU32(pt + 4) ^ rk[1];
s2 = GETU32(pt + 8) ^ rk[2];
s3 = GETU32(pt + 12) ^ rk[3];
s0 = GETU32(ct ) ^ rk[0];
s1 = GETU32(ct + 4) ^ rk[1];
s2 = GETU32(ct + 8) ^ rk[2];
s3 = GETU32(ct + 12) ^ rk[3];
rk[0] = GETU32(userKey);
rk[1] = GETU32(userKey + 4);
rk[2] = GETU32(userKey + 8);
rk[3] = GETU32(userKey + 12);
rk[4] = GETU32(userKey + 16);
rk[5] = GETU32(userKey + 20);
rk[6] = GETU32(userKey + 24);
rk[7] = GETU32(userKey + 28);
s0 = GETU32(in) ^ rk[0];
s1 = GETU32(in + 4) ^ rk[1];
s2 = GETU32(in + 8) ^ rk[2];
s3 = GETU32(in + 12) ^ rk[3];
s0 = GETU32(in) ^ rk[0];
s1 = GETU32(in + 4) ^ rk[1];
s2 = GETU32(in + 8) ^ rk[2];
s3 = GETU32(in + 12) ^ rk[3];
rk[0] = GETU32(userKey);
rk[1] = GETU32(userKey + 4);
rk[2] = GETU32(userKey + 8);
rk[3] = GETU32(userKey + 12);
rk[4] = GETU32(userKey + 16);
rk[5] = GETU32(userKey + 20);
rk[6] = GETU32(userKey + 24);
rk[7] = GETU32(userKey + 28);
rk[0] = GETU32(userKey);
rk[1] = GETU32(userKey + 4);
rk[2] = GETU32(userKey + 8);
rk[3] = GETU32(userKey + 12);
rk[4] = GETU32(userKey + 16);
rk[5] = GETU32(userKey + 20);
rk[6] = GETU32(userKey + 24);
rk[7] = GETU32(userKey + 28);
s0 = GETU32(in) ^ rk[0];
s1 = GETU32(in + 4) ^ rk[1];
s2 = GETU32(in + 8) ^ rk[2];
s3 = GETU32(in + 12) ^ rk[3];
s0 = GETU32(in) ^ rk[0];
s1 = GETU32(in + 4) ^ rk[1];
s2 = GETU32(in + 8) ^ rk[2];
s3 = GETU32(in + 12) ^ rk[3];
k[0] = s0 = GETU32(rawKey);
k[1] = s1 = GETU32(rawKey + 4);
k[2] = s2 = GETU32(rawKey + 8);
k[3] = s3 = GETU32(rawKey + 12);
k[8] = s0 = GETU32(rawKey + 16);
k[9] = s1 = GETU32(rawKey + 20);
k[10] = s2 = GETU32(rawKey + 24);
k[11] = s3 = GETU32(rawKey + 28);
s0 = GETU32(plaintext) ^ k[0];
s1 = GETU32(plaintext + 4) ^ k[1];
s2 = GETU32(plaintext + 8) ^ k[2];
s3 = GETU32(plaintext + 12) ^ k[3];
s0 = GETU32(ciphertext) ^ k[0];
s1 = GETU32(ciphertext + 4) ^ k[1];
s2 = GETU32(ciphertext + 8) ^ k[2];
s3 = GETU32(ciphertext + 12) ^ k[3];
ctr32 = GETU32(ivec + 12);
ctr = GETU32(ctx->Yi.c + 12);
ctr = GETU32(ctx->Yi.c + 12);
ctr = GETU32(ctx->Yi.c + 12);
alen = (u64)GETU32(p) << 32 | GETU32(p + 4);
clen = (u64)GETU32(p + 8) << 32 | GETU32(p + 12);
hi = (u64)GETU32(p) << 32 | GETU32(p + 4);
lo = (u64)GETU32(p + 8) << 32 | GETU32(p + 12);
ctr = GETU32(ctx->Xi.c + 12);
ctr = GETU32(ctx->Yi.c + 12);
hi = (u64)GETU32(p) << 32 | GETU32(p + 4);
lo = (u64)GETU32(p + 8) << 32 | GETU32(p + 12);
hi = (u64)GETU32(p) << 32 | GETU32(p + 4);
lo = (u64)GETU32(p + 8) << 32 | GETU32(p + 12);
hi = (u64)GETU32(p) << 32 | GETU32(p + 4);
lo = (u64)GETU32(p + 8) << 32 | GETU32(p + 12);
hi = (u64)GETU32(p) << 32 | GETU32(p + 4);
lo = (u64)GETU32(p + 8) << 32 | GETU32(p + 12);
ctr32 = GETU32(ctr->V + 12) + blocks;
tmp[0] = GETU32(plaintext);
tmp[1] = GETU32(plaintext + 4);
tmp[2] = GETU32(plaintext + 8);
tmp[3] = GETU32(plaintext + 12);
tmp[0] = GETU32(ciphertext);
tmp[1] = GETU32(ciphertext + 4);
tmp[2] = GETU32(ciphertext + 8);
tmp[3] = GETU32(ciphertext + 12);
kll = GETU32(key );
klr = GETU32(key + 4);
krl = GETU32(key + 8);
krr = GETU32(key + 12);
kll = GETU32(key );
klr = GETU32(key + 4);
krl = GETU32(key + 8);
krr = GETU32(key + 12);
krll = GETU32(key + 16);
krlr = GETU32(key + 20);
krrl = GETU32(key + 24);
krrr = GETU32(key + 28);
s0 = GETU32(ct ) ^ rk[0];
s1 = GETU32(ct + 4) ^ rk[1];
s2 = GETU32(ct + 8) ^ rk[2];
s3 = GETU32(ct + 12) ^ rk[3];
rk[0] = GETU32(cipherKey );
rk[1] = GETU32(cipherKey + 4);
rk[2] = GETU32(cipherKey + 8);
rk[3] = GETU32(cipherKey + 12);
rk[4] = GETU32(cipherKey + 16);
rk[5] = GETU32(cipherKey + 20);
rk[6] = GETU32(cipherKey + 24);
rk[7] = GETU32(cipherKey + 28);
s0 = GETU32(pt ) ^ rk[0];
s1 = GETU32(pt + 4) ^ rk[1];
s2 = GETU32(pt + 8) ^ rk[2];
s3 = GETU32(pt + 12) ^ rk[3];