shift_rows
.macro shift_rows, x0, x1, x2, x3, x4, x5, x6, x7, \
.macro shift_rows, x0, x1, x2, x3, x4, x5, x6, x7, mask