PyTorch 60-Minute Blitz Flashcards

1
Q

create an empty matrix with dim 5,3

A

torch.empty(5,3)

2
Q

create random matrix with dim 5,3

A

torch.rand(5, 3)

3
Q

create a zeros matrix with a given dtype

A

torch.zeros(5,3,dtype=torch.long)

4
Q

construct a tensor directly from data

A

torch.tensor([5.5, 3])

5
Q

create a tensor based on an existing tensor

A
x = x.new_ones(5, 3, dtype=torch.double)
x = torch.randn_like(x, dtype=torch.float)
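For context, a minimal sketch assuming some tensor x already exists (created any way you like):

x = torch.tensor([5.5, 3])                  # any existing tensor
x = x.new_ones(5, 3, dtype=torch.double)    # new_* methods reuse properties of x unless overridden
x = torch.randn_like(x, dtype=torch.float)  # same size as x, overrides the dtype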
6
Q

get size of matrix

A

x.size()

torch.Size([5, 3])

7
Q

addition operations (several syntaxes)

A

x + y

torch.add(x, y, out=result)
y.add_(x)   # in-place: adds x to y

8
Q

resize/reshape tensor

A
y = x.view(16)
z = x.view(-1, 8)  # the size -1 is inferred from the other dimensions
9
Q

get the value of a one-element tensor as a Python number

A

x.item()
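A small illustrative example (the printed value is hypothetical):

x = torch.randn(1)
print(x)         # e.g. tensor([0.4550])
print(x.item())  # 0.4550 as a plain Python number; works only for one-element tensors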

10
Q

convert a torch tensor to a numpy array and vice versa

A

b = a.numpy()            # torch tensor -> numpy array

import numpy as np
a = np.ones(5)
b = torch.from_numpy(a)  # numpy array -> torch tensor

11
Q

move tensors in and out of GPU

A

if torch.cuda.is_available():
    device = torch.device("cuda")          # a CUDA device object
    y = torch.ones_like(x, device=device)  # directly create a tensor on GPU
    x = x.to(device)                       # or just use strings: .to("cuda")
    z = x + y

12
Q

package that provides automatic differentiation for all operations on Tensors

A

autograd

13
Q

track all operations on a torch.Tensor

A

set its attribute .requires_grad as True
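For example (a minimal sketch):

x = torch.ones(2, 2, requires_grad=True)  # operations on x are now tracked
y = x + 2                                 # y was created by an operation, so it has a grad_fn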

14
Q

compute all the gradients automatically

A

call .backward()
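A minimal sketch of a full forward/backward pass:

x = torch.ones(2, 2, requires_grad=True)
out = (x * x).sum()   # a scalar built from x
out.backward()        # computes d(out)/dx
print(x.grad)         # tensor([[2., 2.], [2., 2.]])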

15
Q

attribute which has the gradient

A

.grad

16
Q

stop a tensor from tracking history

A

call .detach()
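For example, assuming x was created with requires_grad=True:

y = x.detach()           # same values as x, but detached from the computation history
print(y.requires_grad)   # False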

17
Q

when is wrapping a code block in with torch.no_grad(): helpful?

A

when evaluating a model: it may have trainable parameters with requires_grad=True, but the gradients are not needed
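A minimal sketch, where net and inputs are placeholder names:

with torch.no_grad():
    outputs = net(inputs)   # no graph is built, which saves memory during evaluation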

18
Q

attribute that references the Function that created the Tensor

A

.grad_fn
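For example:

x = torch.ones(2, 2, requires_grad=True)
y = x + 2
print(y.grad_fn)   # something like <AddBackward0 object at 0x...>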

19
Q

example conv network

A
input 32x32
C1 : feature maps 6@28x28
S2: 6@14x14
C3: 16@10x10
S4: 16@5x5
C5: 120
F6: 84
output 10
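A minimal PyTorch sketch of this LeNet-style architecture, assuming a single-channel 32x32 input (class and variable names are illustrative):

import torch
import torch.nn as nn
import torch.nn.functional as F

class LeNet(nn.Module):
    def __init__(self):
        super(LeNet, self).__init__()
        self.conv1 = nn.Conv2d(1, 6, 5)        # C1: 6 feature maps of 28x28
        self.conv2 = nn.Conv2d(6, 16, 5)       # C3: 16 feature maps of 10x10
        self.fc1 = nn.Linear(16 * 5 * 5, 120)  # C5: 120
        self.fc2 = nn.Linear(120, 84)          # F6: 84
        self.fc3 = nn.Linear(84, 10)           # output: 10
    def forward(self, x):                      # x: (N, 1, 32, 32)
        x = F.max_pool2d(F.relu(self.conv1(x)), 2)  # S2: 6@14x14
        x = F.max_pool2d(F.relu(self.conv2(x)), 2)  # S4: 16@5x5
        x = x.view(-1, 16 * 5 * 5)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        return self.fc3(x)

out = LeNet()(torch.randn(1, 1, 32, 32))   # out.shape == (1, 10)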
20
Q

typical training procedure

A
  • Define the neural network that has some learnable parameters (or weights)
  • Iterate over a dataset of inputs
  • Process input through the network
  • Compute the loss (how far is the output from being correct)
  • Propagate gradients back into the network’s parameters
  • Update the weights of the network, typically using a simple update rule: weight = weight - learning_rate * gradient
21
Q

does torch.nn support a single sample

A

no, it only supports a mini-batch of samples

22
Q

input of nn.Conv2d

A

a 4D Tensor of nSamples x nChannels x Height x Width

23
Q

add a fake batch dimension to a single sample

A

input.unsqueeze(0)
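A minimal sketch combining cards 22 and 23 (names are illustrative):

import torch
import torch.nn as nn

img = torch.randn(3, 32, 32)     # a single 3-channel image, no batch dimension
batch = img.unsqueeze(0)         # shape becomes (1, 3, 32, 32): nSamples x nChannels x Height x Width
out = nn.Conv2d(3, 6, 5)(batch)  # nn.Conv2d now accepts it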

24
Q

calculate simple mean squared error between input and target

A
target = torch.randn(10)  # a dummy target, for example
target = target.view(1, -1)  # make it the same shape as output
criterion = nn.MSELoss()

loss = criterion(output, target)
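A self-contained version, where output stands in for the network output (a hypothetical 1x10 tensor):

import torch
import torch.nn as nn

output = torch.randn(1, 10)           # stand-in for net(input)
target = torch.randn(10).view(1, -1)  # dummy target with the same shape as output
criterion = nn.MSELoss()
loss = criterion(output, target)
print(loss)                           # a scalar tensor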

25
Q

which Tensors will have their .grad Tensor accumulated with the gradient

A

Tensors with requires_grad=True

26
Q

follow loss backwards through the graph using its .grad_fn attribute

A

print(loss.grad_fn)  # MSELoss
print(loss.grad_fn.next_functions[0][0])  # Linear
print(loss.grad_fn.next_functions[0][0].next_functions[0][0])  # ReLU
27
Q

backpropagate the errors

A

loss.backward()

# example output:
# conv1.bias.grad before backward: tensor([0., 0., 0., 0., 0., 0.])
# conv1.bias.grad after backward:  tensor([-0.0205,  0.0088,  0.0135,  0.0123,  0.0098, -0.0036])

28
Q

Stochastic Gradient Descent (SGD)

A

weight = weight - learning_rate * gradient

29
Q

implement SGD

A

learning_rate = 0.01
for f in net.parameters():
    f.data.sub_(f.grad.data * learning_rate)

30
Q

implement various update rules such as SGD, Nesterov-SGD, Adam, RMSProp

A

torch.optim

31
Q

create an optimizer

A

optimizer = optim.SGD(net.parameters(), lr=0.01)

32
Q

boilerplate code in the training loop:

  • zero the gradient buffers
  • calculate the loss
  • backpropagate the loss
  • step the optimizer
A
optimizer.zero_grad()   # zero the gradient buffers
output = net(input)
loss = criterion(output, target)
loss.backward()
optimizer.step()    # Does the update
33
Q

load image data and iterate over it in mini-batches

A

torchvision.datasets and torch.utils.data.DataLoader
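A minimal sketch of loading CIFAR-10 this way, as in the blitz tutorial (path and batch size are illustrative):

import torch
import torchvision
import torchvision.transforms as transforms

transform = transforms.Compose(
    [transforms.ToTensor(),
     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])
trainset = torchvision.datasets.CIFAR10(root='./data', train=True,
                                        download=True, transform=transform)
trainloader = torch.utils.data.DataLoader(trainset, batch_size=4,
                                          shuffle=True, num_workers=2)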

34
Q

get some random training images

A

dataiter = iter(trainloader)

images, labels = next(dataiter)

35
Q

define a convolutional nn

A
import torch.nn as nn
import torch.nn.functional as F

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, 6, 5)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(6, 16, 5)
        self.fc1 = nn.Linear(16 * 5 * 5, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)
    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = x.view(-1, 16 * 5 * 5)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = self.fc3(x)
        return x

net = Net()

36
Q

define loss function and optimizer

A
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(net.parameters(), lr=0.001, momentum=0.9)
37
Q

train the network

A

for epoch in range(2):  # loop over the dataset multiple times

    running_loss = 0.0
    for i, data in enumerate(trainloader, 0):
        # get the inputs
        inputs, labels = data
        # zero the parameter gradients
        optimizer.zero_grad()
        # forward + backward + optimize
        outputs = net(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()
        # print statistics
        running_loss += loss.item()
        if i % 2000 == 1999:    # print every 2000 mini-batches
            print('[%d, %5d] loss: %.3f' %
                  (epoch + 1, i + 1, running_loss / 2000))
            running_loss = 0.0

print('Finished Training')

38
Q

evaluate performance

A
correct = 0
total = 0
with torch.no_grad():
    for data in testloader:
        images, labels = data
        outputs = net(images)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print('Accuracy of the network on the 10000 test images: %d %%' % (
    100 * correct / total))

39
Q

training on GPU

A

device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
print(device)
net.to(device)
inputs, labels = inputs.to(device), labels.to(device)

40
Q

tutorial for data parallelism

A

https://pytorch.org/tutorials/beginner/blitz/data_parallel_tutorial.html

41
Q

rnn embedding

A

https://github.com/hunkim/PyTorchZeroToAll/blob/master/12_4_hello_rnn_emb.py

42
Q

seq2seq

A

https://github.com/hunkim/PyTorchZeroToAll/blob/master/14_1_seq2seq.py

43
Q

seq2seq_att

A

https://github.com/hunkim/PyTorchZeroToAll/blob/master/14_2_seq2seq_att.py