-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathlosses.py
112 lines (91 loc) · 3.75 KB
/
losses.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
"""Definition of loss functions."""
from abc import ABC, abstractmethod
import torch
import torch.nn.functional as F
import numpy as np
from typing import List, Tuple
from torch import nn
class CLLoss(ABC):
"""Abstract class to define losses in the CL framework that use one
positive pair and one negative pair"""
@abstractmethod
def loss(self, z1, z2_con_z1, z3, z1_rec, z2_con_z1_rec, z3_rec):
"""
z1_t = h(z1)
z2_t = h(z2)
z3_t = h(z3)
and z1 ~ p(z1), z3 ~ p(z3)
and z2 ~ p(z2 | z1)
returns the total loss and componentwise contributions
"""
pass
def __call__(self, z1, z2_con_z1, z3, z1_rec, z2_con_z1_rec, z3_rec):
return self.loss(z1, z2_con_z1, z3, z1_rec, z2_con_z1_rec, z3_rec)
class LpSimCLRLoss(CLLoss):
"""Extended InfoNCE objective for non-normalized representations based on an Lp norm.
Args:
p: Exponent of the norm to use.
tau: Rescaling parameter of exponent.
alpha: Weighting factor between the two summands.
simclr_compatibility_mode: Use logsumexp (as used in SimCLR loss) instead of logmeanexp
pow: Use p-th power of Lp norm instead of Lp norm.
"""
def __init__(
self,
p: int = 2,
tau: float = 1.0,
alpha: float = 0.5,
simclr_compatibility_mode: bool = False,
simclr_denominator: bool = True,
pow: bool = True,
):
self.p = p
self.tau = tau
self.alpha = alpha
self.simclr_compatibility_mode = simclr_compatibility_mode
self.simclr_denominator = simclr_denominator
self.pow = pow
def loss(self, z1, z2_con_z1, z3, z1_rec, z2_con_z1_rec, z3_rec):
del z1, z2_con_z1, z3
if self.p < 1.0:
# add small epsilon to make calculation of norm numerically more stable
neg = torch.norm(
torch.abs(z1_rec.unsqueeze(0) - z3_rec.unsqueeze(1) + 1e-12),
p=self.p,
dim=-1,
)
pos = torch.norm(
torch.abs(z1_rec - z2_con_z1_rec) + 1e-12, p=self.p, dim=-1
)
else:
# TODO: verify this
# neg = torch.norm(z1_rec.unsqueeze(0) - z3_rec.unsqueeze(1), p=self.p, dim=-1)
# pos = torch.norm(z1_rec - z2_con_z1_rec, p=self.p, dim=-1)
neg = torch.pow(z1_rec.unsqueeze(1) - z3_rec.unsqueeze(0), float(self.p)).sum(dim=-1)
pos = torch.pow(z1_rec - z2_con_z1_rec, float(self.p)).sum(dim=-1)
if not self.pow:
neg = neg.pow(1.0 / self.p)
pos = pos.pow(1.0 / self.p)
# all = torch.cat((neg, pos.unsqueeze(1)), dim=1)
if self.simclr_compatibility_mode:
neg_and_pos = torch.cat((neg, pos.unsqueeze(1)), dim=1)
loss_pos = pos / self.tau
loss_neg = torch.logsumexp(-neg_and_pos / self.tau, dim=1)
else:
if self.simclr_denominator:
neg_and_pos = torch.cat((neg, pos.unsqueeze(1)), dim=1)
else:
neg_and_pos = neg
loss_pos = pos / self.tau
loss_neg = _logmeanexp(-neg_and_pos / self.tau, dim=1)
loss = 2 * (self.alpha * loss_pos + (1.0 - self.alpha) * loss_neg)
loss_mean = torch.mean(loss)
loss_std = torch.std(loss)
loss_pos_mean = torch.mean(loss_pos)
loss_neg_mean = torch.mean(loss_neg)
return loss_mean, loss, [loss_pos_mean, loss_neg_mean]
def _logmeanexp(x, dim):
# do the -log thing to use logsumexp to calculate the mean and not the sum
# as log sum_j exp(x_j - log N) = log sim_j exp(x_j)/N = log mean(exp(x_j)
N = torch.tensor(x.shape[dim], dtype=x.dtype, device=x.device)
return torch.logsumexp(x, dim=dim) - torch.log(N)