rc4_step
chunk |= (uint64_t)rc4_step(d, x, y) << (i * 8);
out[i] = rc4_step(d, &x, &y) ^ in[i];
chunk = chunk << 8 | (uint64_t)rc4_step(d, x, y);