replace_u32
changed |= replace_u32(&dst[i], mask ? ~mask[i] : 0, data[i]);
replace_u32(&dst[i], 0, 0);