WT
for (; n>=WS; n-=WS, d+=WS, s+=WS) *(WT *)d = *(WT *)s;
while (n>=WS) n-=WS, *(WT *)(d+n) = *(WT *)(s+n);
#define WS (sizeof(WT))