TMPL_RET_IDX
/*
 * Difference between the address (buff + TMPL_RET_IDX), converted to
 * unsigned long, and nip.
 * NOTE(review): presumably this is the displacement that gets checked
 * against the reach of a relative branch before patching; that check is
 * not visible here -- confirm. Note the operand order is (slot - nip),
 * not (nip - slot); verify the consumer of b_offset expects that sign.
 */
b_offset = (unsigned long)(buff + TMPL_RET_IDX) - nip;
/*
 * Call patch_branch() on the same slot (buff + TMPL_RET_IDX) with nip and
 * a third argument of 0.
 * NOTE(review): presumably this writes a branch at that slot targeting
 * nip, with 0 meaning "no flags" -- confirm against patch_branch()'s
 * declaration. Any result of the call is discarded on this line; verify
 * whether a failure needs to be handled.
 */
patch_branch(buff + TMPL_RET_IDX, nip, 0);