test1.py
from collections import OrderedDict
import torch
import torch.nn as nn
import torch.nn.functional as F
from mlp import MLP, mse_loss, bce_loss, cross_entropy_loss
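
# Assumed interface of the hand-written modules imported from mlp.py
# (inferred from their usage below, not from mlp.py itself):
#   MLP(...)                   - two-layer perceptron whose parameters live in
#                                net.parameters['W1'|'b1'|'W2'|'b2'] and whose
#                                gradients accumulate in net.grads['dJdW1'|'dJdb1'|'dJdW2'|'dJdb2']
#   net.clear_grad_and_cache() - resets cached activations and gradients
#   net.forward(x), net.backward(dJdy_hat)
#   mse_loss(y, y_hat)         - returns the scalar loss J and dJ/dy_hat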

# Build the hand-written two-layer MLP: 2 -> 20 (ReLU) -> 5 (identity).
net = MLP(
    linear_1_in_features=2,
    linear_1_out_features=20,
    f_function='relu',
    linear_2_in_features=20,
    linear_2_out_features=5,
    g_function='identity'
)

# Random input batch (10 samples, 2 features) and random targets (10 samples, 5 outputs).
x = torch.randn(10, 2)
y = torch.randn(10, 5)

# Forward pass, MSE loss, and hand-written backward pass.
net.clear_grad_and_cache()
y_hat = net.forward(x)
J, dJdy_hat = mse_loss(y, y_hat)
net.backward(dJdy_hat)

# ------------------------------------------------
# Compare the result with autograd
net_autograd = nn.Sequential(
    OrderedDict([
        ('linear1', nn.Linear(2, 20)),
        ('relu', nn.ReLU()),
        ('linear2', nn.Linear(20, 5)),
    ])
)

# Copy the hand-written network's parameters into the autograd reference network.
net_autograd.linear1.weight.data = net.parameters['W1']
net_autograd.linear1.bias.data = net.parameters['b1']
net_autograd.linear2.weight.data = net.parameters['W2']
net_autograd.linear2.bias.data = net.parameters['b2']

# Forward pass, MSE loss, and backward pass through the autograd reference network.
y_hat_autograd = net_autograd(x)
J_autograd = F.mse_loss(y_hat_autograd, y)

net_autograd.zero_grad()
J_autograd.backward()

# Compare each hand-written gradient against autograd's; the difference norm
# should fall below the 1e-3 tolerance.
print((net_autograd.linear1.weight.grad.data - net.grads['dJdW1']).norm() < 1e-3)
print((net_autograd.linear1.bias.grad.data - net.grads['dJdb1']).norm() < 1e-3)
print((net_autograd.linear2.weight.grad.data - net.grads['dJdW2']).norm() < 1e-3)
print((net_autograd.linear2.bias.grad.data - net.grads['dJdb2']).norm() < 1e-3)
# ------------------------------------------------
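
# Expected behaviour: if the hand-written backward pass in mlp.py is correct,
# all four prints above output tensor(True).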