FPR_ALIGN
/*
 * Raw byte storage for one kfpu_t, over-allocated by FPR_ALIGN bytes so
 * that an aligned kfpu_t can be carved out of it no matter where the
 * array itself happens to start.
 */
uint8_t fpua[sizeof (kfpu_t) + FPR_ALIGN];
/*
 * Point fpu at the rounded-up address inside fpua.
 * NOTE(review): assumes P2ROUNDUP(x, a) rounds x up to the next multiple
 * of a and that FPR_ALIGN is a power of two -- confirm against the macro
 * definitions. Under that assumption at most FPR_ALIGN - 1 bytes are
 * skipped, so the kfpu_t stays within fpua.
 */
fpu = (kfpu_t *)P2ROUNDUP((uintptr_t)fpua, FPR_ALIGN);