from typing import Literal

import torch
from torch import Tensor

from ._dual_cone_utils import _project_weights
from ._gramian_utils import _compute_regularized_normalized_gramian
from ._pref_vector_utils import _pref_vector_to_str_suffix, _pref_vector_to_weighting
from .bases import _WeightedAggregator, _Weighting
from .mean import _MeanWeighting


class UPGrad(_WeightedAggregator):
    """
    :class:`~torchjd.aggregation.bases.Aggregator` that projects each row of the input matrix onto
    the dual cone of all rows of this matrix, and that combines the results, as proposed in
    `Jacobian Descent For Multi-Objective Optimization <https://arxiv.org/pdf/2406.16232>`_.

    :param pref_vector: The preference vector used to combine the projected rows. If not provided,
        defaults to the simple averaging of the projected rows.
    :param norm_eps: A small value to avoid division by zero when normalizing.
    :param reg_eps: A small value to add to the diagonal of the gramian of the matrix. Due to
        numerical errors when computing the gramian, it might not be exactly positive definite.
        This issue can make the optimization fail. Adding ``reg_eps`` to the diagonal of the
        gramian ensures that it is positive definite.
    :param solver: The solver used to solve the underlying optimization problem.

    .. admonition::
        Example

        Use UPGrad to aggregate a matrix.

        >>> from torch import tensor
        >>> from torchjd.aggregation import UPGrad
        >>>
        >>> A = UPGrad()
        >>> J = tensor([[-4., 1., 1.], [6., 1., 1.]])
        >>>
        >>> A(J)
        tensor([0.2929, 1.9004, 1.9004])
    """

    def __init__(
        self,
        pref_vector: Tensor | None = None,
        norm_eps: float = 0.0001,
        reg_eps: float = 0.0001,
        solver: Literal["quadprog"] = "quadprog",
    ):
        weighting = _pref_vector_to_weighting(pref_vector, default=_MeanWeighting())
        self._pref_vector = pref_vector

        super().__init__(
            weighting=_UPGradWrapper(
                weighting=weighting, norm_eps=norm_eps, reg_eps=reg_eps, solver=solver
            )
        )

    def __repr__(self) -> str:
        return (
            f"{self.__class__.__name__}(pref_vector={repr(self._pref_vector)}, norm_eps="
            f"{self.weighting.norm_eps}, reg_eps={self.weighting.reg_eps}, "
            f"solver={repr(self.weighting.solver)})"
        )

    def __str__(self) -> str:
        return f"UPGrad{_pref_vector_to_str_suffix(self._pref_vector)}"


class _UPGradWrapper(_Weighting):
    """
    Wrapper of :class:`~torchjd.aggregation.bases._Weighting` that changes the weights vector such
    that each weighted row is projected onto the dual cone of all rows.

    :param weighting: The wrapped weighting.
    :param norm_eps: A small value to avoid division by zero when normalizing.
    :param reg_eps: A small value to add to the diagonal of the gramian of the matrix. Due to
        numerical errors when computing the gramian, it might not be exactly positive definite.
        This issue can make the optimization fail. Adding ``reg_eps`` to the diagonal of the
        gramian ensures that it is positive definite.
    :param solver: The solver used to solve the underlying optimization problem.
    """

    def __init__(
        self,
        weighting: _Weighting,
        norm_eps: float,
        reg_eps: float,
        solver: Literal["quadprog"],
    ):
        super().__init__()
        self.weighting = weighting
        self.norm_eps = norm_eps
        self.reg_eps = reg_eps
        self.solver = solver

    def forward(self, matrix: Tensor) -> Tensor:
        # Weights of the wrapped weighting, one per row, as a diagonal matrix.
        U = torch.diag(self.weighting(matrix))
        # Normalized gramian of `matrix`, regularized to be positive definite.
        G = _compute_regularized_normalized_gramian(matrix, self.norm_eps, self.reg_eps)
        # Each row of W projects the corresponding weighted row onto the dual
        # cone of the rows of `matrix`; summing gives the combined weights.
        W = _project_weights(U, G, self.solver)
        return torch.sum(W, dim=0)
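

# Usage sketch (added; not part of the original module). A minimal example of
# combining projected rows with a custom preference vector instead of the
# default mean weighting. It assumes this file is run as part of the torchjd
# package (e.g. `python -m torchjd.aggregation.upgrad`) so that the relative
# imports above resolve; the pref_vector values are arbitrary.
if __name__ == "__main__":
    from torch import tensor

    aggregator = UPGrad(pref_vector=tensor([0.75, 0.25]))  # hypothetical weights
    J = tensor([[-4.0, 1.0, 1.0], [6.0, 1.0, 1.0]])
    print(aggregator)  # str form, via __str__: class name plus pref_vector suffix
    print(aggregator(J))  # one aggregated gradient row of shape (3,)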