# Run the top-down pass once.
#   * First argument: `x_mask` inverted element-wise and summed over its last
#     axis (presumably a boolean padding mask, giving per-row counts of
#     unmasked positions -- TODO confirm against the caller).
#   * Second argument: the entries of bup['features'] in reverse order,
#     materialised as a new list so the original sequence is left untouched.
# NOTE(review): this statement used to be issued twice in a row with identical
# arguments; the first result was overwritten immediately, so a single call is
# kept. If `top_down` is intentionally stateful and relied on the double
# invocation, confirm before merging.
tdn = self.top_down((~x_mask).sum(-1), list(reversed(bup['features'])))