big_sqr_vec_umul
/*
 * Store the address of big_sqr_vec_umul in big_sqr_vec_impl.
 * NOTE(review): presumably big_sqr_vec_impl is a function pointer used to
 * pick the active implementation; its declaration and the enclosing scope
 * are not visible here -- confirm.
 */
big_sqr_vec_impl = &big_sqr_vec_umul;
/*
 * Declaration of big_sqr_vec_umul: returns nothing and takes two uint32_t
 * pointers followed by an int. The definition is not visible in this chunk.
 * NOTE(review): the parameters are unnamed, so the roles of the two pointers
 * (presumably destination and source) and of the int (presumably an element
 * count) cannot be confirmed here -- TODO verify against the definition.
 */
extern void big_sqr_vec_umul(uint32_t *, uint32_t *, int);