ossl_gcm_ghash_4bit
void ossl_gcm_ghash_4bit(u64 Xi[2], const u128 Htable[16],
ossl_gcm_ghash_4bit((u64 *)out, Htable, (uint8_t *)tmp, 16);