@@ -59,7 +59,7 @@ def __init__(self):
         self.conv1 = nn.Conv2d(1, 4, 3, 1)
         self.conv2 = nn.Conv2d(4, 4, 3, 1)
         self.fc1 = nn.Linear(12 * 12 * 4, 32)
-        self.fc2 = nn.Linear(32, 9)
+        self.fc2 = nn.Linear(32, 10)
 
     def forward(self, x):
         x = self.conv1(x)
@@ -81,7 +81,7 @@ def forward(self, x):
 SUB_TARGET = 9
 
 #hyperparameters
-learning_rate = 5e-6
+learning_rate = 5e-4
 
 #DO NOT CHANGE
 batch_size = 1
@@ -117,7 +117,6 @@ def forward(self, x):
 test_mask = test_only_to_learn.targets == SUB_TARGET
 test_only_to_learn.data = test_only_to_learn.data[test_mask]
 test_only_to_learn.targets = test_only_to_learn.targets[test_mask]
-test_only_to_learn.targets[test_only_to_learn.targets == SUB_TARGET] = FORGET_TARGET
 test_only_to_learn_dataloader = DataLoader(test_only_to_learn, batch_size=batch_size)
 
 #this will contain only the data about the forgotten class
@@ -144,8 +143,6 @@ def forward(self, x):
 train_mask = training_to_learn.targets != FORGET_TARGET
 training_to_learn.data = training_to_learn.data[train_mask]
 training_to_learn.targets = training_to_learn.targets[train_mask]
-training_to_learn.targets[training_to_learn.targets == SUB_TARGET] = FORGET_TARGET
-
 
 #this will contain the test data where the forgotten class is substituted with the new class
 test_to_learn = datasets.MNIST(
@@ -157,14 +154,30 @@ def forward(self, x):
 test_mask = test_to_learn.targets != FORGET_TARGET
 test_to_learn.data = test_to_learn.data[test_mask]
 test_to_learn.targets = test_to_learn.targets[test_mask]
-test_to_learn.targets[test_to_learn.targets == SUB_TARGET] = FORGET_TARGET
 
 
 ################################# Gradient computation part #################################
 
+def log_softmax(x):
+    return x - torch.logsumexp(x, dim=1, keepdim=True)
+
+def CrossEntropyLoss(outputs, targets):
+    epsilon = 1e-6
+    num_examples = targets.shape[0]
+    batch_size = outputs.shape[0]
+    outputs = log_softmax(outputs) + epsilon
+    inverse_output = 1 / outputs
+    outputs[targets == FORGET_TARGET] = inverse_output[targets == FORGET_TARGET]
+
+    outputs = outputs[range(batch_size), targets]
+
+    return -torch.sum(outputs) / num_examples
+
+
+
 # Load the model
 model = CNN()
-model.load_state_dict(torch.load("modelNo9.pth"))
+model.load_state_dict(torch.load("modelNo9.pth", map_location=torch.device(device)))
 
 
 #create the gradient holders
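The added CrossEntropyLoss keeps the ordinary negative log-likelihood term for every class except FORGET_TARGET, where the log-probability is replaced by its reciprocal, so the term grows as the model becomes confident in the forgotten class. A minimal numeric sketch of that behaviour, using illustrative logits and a hypothetical forgotten-class index (the real FORGET_TARGET is set elsewhere in the script):

import torch

FORGET_TARGET = 5                                    # assumption for this sketch only
logits = torch.tensor([[0.1, 0.2, 0.1, 0.1, 0.1, 3.0, 0.1, 0.1, 0.1, 0.1]])
log_p = logits - torch.logsumexp(logits, dim=1, keepdim=True)

kept_term = -log_p[0, 1]                             # usual NLL term for a kept class
forget_term = -1.0 / log_p[0, FORGET_TARGET]         # reciprocal term used for the forgotten class
print(kept_term.item(), forget_term.item())
# as p(FORGET_TARGET) -> 1 its log tends to 0 from below and the reciprocal term blows up,
# so minimising this loss pushes probability mass away from the forgotten class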
@@ -221,8 +234,12 @@ def train(dataloader, model, loss_fn, optimizer,scheduler):
         X, y = X.to(device), y.to(device)
         pred = model(X)
         loss = loss_fn(pred, y)
+        myloss = CrossEntropyLoss(pred, y)
+        #print("pytorch Loss:", loss)
+        #print("my loss:", myloss)
         optimizer.zero_grad()
-        loss.backward()
+        #loss
+        myloss.backward()
         #remove the gradients from fc1 and fc2 using the mask
         #model.fc1.weight.grad[fc1_map == 0] = 0
         #model.fc2.weight.grad[fc2_map == 0] = 0
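On batches that contain no FORGET_TARGET samples, the handwritten loss reduces to standard cross entropy up to the added epsilon, which appears to be what the commented-out print calls were comparing. A quick, hypothetical check that could be run inside this script (the targets below are illustrative and assumed to differ from FORGET_TARGET):

logits = torch.randn(4, 10)                       # hypothetical batch of four samples
targets = torch.tensor([0, 1, 2, 3])              # assumed not to include FORGET_TARGET
print(CrossEntropyLoss(logits, targets))          # handwritten version defined above
print(nn.CrossEntropyLoss()(logits, targets))     # PyTorch reference; should agree to within ~1e-6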
@@ -267,7 +284,8 @@ def forward(self, input, target):
         return loss
 
 
-loss_fn = MyCustomLoss()
+#loss_fn = MyCustomLoss()
+loss_fn = nn.CrossEntropyLoss()
 optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)
 #scheduler
 scheduler = torch.optim.lr_scheduler.StepLR(optimizer, step_size=1, gamma=0.1)
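With step_size=1 and gamma=0.1, StepLR multiplies the learning rate by 0.1 each time scheduler.step() is called, so the new 5e-4 starting rate decays quickly. A small sketch of the resulting values, assuming one scheduler.step() per epoch (the epoch loop is outside this diff):

lr = learning_rate            # 5e-4 at epoch 0
for epoch in range(3):
    print(epoch, lr)          # approximately 5e-4, 5e-5, 5e-6
    lr *= 0.1                 # gamma = 0.1 applied every step_size = 1 epochs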