[core] use swap_tensors in group offloading where possible
#29104
pr_dependency_test.yml
on: pull_request
check_dependencies
25s