load_4
/*
 * Pull selected 21-bit fields out of the byte buffer `s`.
 *
 * Each line reads through load_4() at a byte offset, shifts the result
 * right, and (except for s23) masks it with 2097151, which is 2^21 - 1.
 * For every variable sK below, (byte offset * 8 + shift) equals 21 * K,
 * e.g. s1: 2*8 + 5 = 21, s3: 7*8 + 7 = 63, s23: 60*8 + 3 = 483.
 *
 * NOTE(review): load_4 is defined outside this excerpt; presumably it
 * assembles 4 bytes in little-endian order, which would make sK the K-th
 * 21-bit limb of `s` -- confirm against its definition.
 * Indices not listed here (s0, s2, s5, ...) do not appear in this excerpt.
 */
int64_t s1 = 2097151 & (load_4(s + 2) >> 5);
int64_t s3 = 2097151 & (load_4(s + 7) >> 7);
int64_t s4 = 2097151 & (load_4(s + 10) >> 4);
int64_t s6 = 2097151 & (load_4(s + 15) >> 6);
int64_t s9 = 2097151 & (load_4(s + 23) >> 5);
int64_t s11 = 2097151 & (load_4(s + 28) >> 7);
int64_t s12 = 2097151 & (load_4(s + 31) >> 4);
int64_t s14 = 2097151 & (load_4(s + 36) >> 6);
int64_t s17 = 2097151 & (load_4(s + 44) >> 5);
int64_t s19 = 2097151 & (load_4(s + 49) >> 7);
int64_t s20 = 2097151 & (load_4(s + 52) >> 4);
int64_t s22 = 2097151 & (load_4(s + 57) >> 6);
/* Last field: shifted only, not masked, so every bit left after >> 3 is kept. */
int64_t s23 = (load_4(s + 60) >> 3);
/*
 * Same offsets and shifts as the literal-mask declarations of s1..s23 that
 * precede these lines, but masking with the named constant kBottom21Bits
 * instead of 2097151.
 *
 * For every variable sK, (byte offset * 8 + shift) equals 21 * K.
 *
 * NOTE(review): kBottom21Bits and load_4 are defined outside this excerpt;
 * presumably kBottom21Bits == 2^21 - 1 and load_4 is a little-endian 4-byte
 * load -- confirm. These names repeat earlier declarations, so this group
 * presumably lives in a different function or scope -- confirm.
 */
int64_t s1 = kBottom21Bits & (load_4(s + 2) >> 5);
int64_t s3 = kBottom21Bits & (load_4(s + 7) >> 7);
int64_t s4 = kBottom21Bits & (load_4(s + 10) >> 4);
int64_t s6 = kBottom21Bits & (load_4(s + 15) >> 6);
int64_t s9 = kBottom21Bits & (load_4(s + 23) >> 5);
int64_t s11 = kBottom21Bits & (load_4(s + 28) >> 7);
int64_t s12 = kBottom21Bits & (load_4(s + 31) >> 4);
int64_t s14 = kBottom21Bits & (load_4(s + 36) >> 6);
int64_t s17 = kBottom21Bits & (load_4(s + 44) >> 5);
int64_t s19 = kBottom21Bits & (load_4(s + 49) >> 7);
int64_t s20 = kBottom21Bits & (load_4(s + 52) >> 4);
int64_t s22 = kBottom21Bits & (load_4(s + 57) >> 6);
/* Last field: shifted only, not masked, so every bit left after >> 3 is kept. */
int64_t s23 = (load_4(s + 60) >> 3);
/*
 * Fields read from the byte buffer `a` via load_4(): shift right, then mask
 * with kBottom21Bits (a11 is shifted only). For every aK,
 * (byte offset * 8 + shift) equals 21 * K, e.g. a1: 2*8 + 5 = 21,
 * a11: 28*8 + 7 = 231.
 *
 * NOTE(review): load_4 and kBottom21Bits are defined outside this excerpt;
 * presumably a little-endian 4-byte load and 2^21 - 1 -- confirm.
 * Indices not listed (a0, a2, a5, ...) do not appear in this excerpt.
 */
int64_t a1 = kBottom21Bits & (load_4(a + 2) >> 5);
int64_t a3 = kBottom21Bits & (load_4(a + 7) >> 7);
int64_t a4 = kBottom21Bits & (load_4(a + 10) >> 4);
int64_t a6 = kBottom21Bits & (load_4(a + 15) >> 6);
int64_t a9 = kBottom21Bits & (load_4(a + 23) >> 5);
/* Last field of `a`: no mask, keeps every bit left after >> 7. */
int64_t a11 = (load_4(a + 28) >> 7);
/*
 * Fields read from the byte buffer `b` via load_4(): shift right, then mask
 * with kBottom21Bits (b11 is shifted only). For every bK,
 * (byte offset * 8 + shift) equals 21 * K, e.g. b3: 7*8 + 7 = 63,
 * b11: 28*8 + 7 = 231.
 *
 * NOTE(review): load_4 and kBottom21Bits are defined outside this excerpt;
 * presumably a little-endian 4-byte load and 2^21 - 1 -- confirm.
 * Indices not listed (b0, b2, b5, ...) do not appear in this excerpt.
 */
int64_t b1 = kBottom21Bits & (load_4(b + 2) >> 5);
int64_t b3 = kBottom21Bits & (load_4(b + 7) >> 7);
int64_t b4 = kBottom21Bits & (load_4(b + 10) >> 4);
int64_t b6 = kBottom21Bits & (load_4(b + 15) >> 6);
int64_t b9 = kBottom21Bits & (load_4(b + 23) >> 5);
/* Last field of `b`: no mask, keeps every bit left after >> 7. */
int64_t b11 = (load_4(b + 28) >> 7);
/*
 * Fields read from the byte buffer `c` via load_4(): shift right, then mask
 * with kBottom21Bits (c11 is shifted only). For every cK,
 * (byte offset * 8 + shift) equals 21 * K, e.g. c4: 10*8 + 4 = 84,
 * c11: 28*8 + 7 = 231.
 *
 * NOTE(review): load_4 and kBottom21Bits are defined outside this excerpt;
 * presumably a little-endian 4-byte load and 2^21 - 1 -- confirm.
 * Indices not listed (c0, c2, c5, ...) do not appear in this excerpt.
 */
int64_t c1 = kBottom21Bits & (load_4(c + 2) >> 5);
int64_t c3 = kBottom21Bits & (load_4(c + 7) >> 7);
int64_t c4 = kBottom21Bits & (load_4(c + 10) >> 4);
int64_t c6 = kBottom21Bits & (load_4(c + 15) >> 6);
int64_t c9 = kBottom21Bits & (load_4(c + 23) >> 5);
/* Last field of `c`: no mask, keeps every bit left after >> 7. */
int64_t c11 = (load_4(c + 28) >> 7);
/*
 * Unshifted, unmasked reads from `s`: h0 takes load_4() at byte offset 0 and
 * h5 takes load_4() at byte offset 16, each stored in an int64_t.
 *
 * NOTE(review): load_4's return type and byte order are not visible in this
 * excerpt; any later shifting or masking of h0/h5 is also outside it.
 */
int64_t h0 = load_4(s);
int64_t h5 = load_4(s + 16);