Changed to use the same data loaders as train.py and added saving of the student model

2024-12-01 15:33:03 -07:00 · 2024-12-01 15:33:03 -07:00 · 5be312bf18
commit 5be312bf18
parent 7208c16efc
1 changed files with 24 additions and 45 deletions
--- a/wresnet-pytorch/src/distillation_train.py
+++ b/wresnet-pytorch/src/distillation_train.py
@ -1,3 +1,6 @@
 from datetime import datetime
 import time
 from utils import json_file_to_pyobj, get_loaders
 from WideResNet import WideResNet
 from opacus.validators import ModuleValidator
@ -18,21 +21,8 @@ import warnings
 warnings.filterwarnings("ignore")
-def train_knowledge_distillation(teacher, student, epochs, learning_rate, T, soft_target_loss_weight, ce_loss_weight, device):
+def train_knowledge_distillation(teacher, student, train_dl, epochs, learning_rate, T, soft_target_loss_weight, ce_loss_weight, device):
    # Dataset
    transform = transforms.Compose(
        [
            transforms.RandomHorizontalFlip(),
            transforms.RandomCrop(32, padding=4),
            transforms.ToTensor(),
            transforms.Normalize([0.4914, 0.4822, 0.4465], [0.2470, 0.2435, 0.2616]),
        ]
    )
    datadir = Path().home() / "opt/data/cifar"
    train_ds = CIFAR10(root=datadir, train=True, download=True, transform=transform)
    train_dl = DataLoader(train_ds, batch_size=128, shuffle=False, num_workers=4)
    ce_loss = nn.CrossEntropyLoss()
    optimizer = optim.Adam(student.parameters(), lr=learning_rate)
@ -72,44 +62,29 @@ def train_knowledge_distillation(teacher, student, epochs, learning_rate, T, sof
        print(f"Epoch {epoch+1}/{epochs}, Loss: {running_loss / len(train_dl)}")
-
+@torch.no_grad()
-
+def test(model, device, test_dl, teacher=False):
 def test(model, device, teacher=False):
    transform = transforms.Compose(
        [
            transforms.RandomHorizontalFlip(),
            transforms.RandomCrop(32, padding=4),
            transforms.ToTensor(),
            transforms.Normalize([0.4914, 0.4822, 0.4465], [0.2470, 0.2435, 0.2616]),
        ]
    )
    datadir = Path().home() / "opt/data/cifar"
    test_ds = CIFAR10(root=datadir, train=True, download=False, transform=transform)     
    test_dl = DataLoader(test_ds, batch_size=128, shuffle=False, num_workers=4
            )
    model.to(device)
    model.eval()
    correct = 0
    total = 0
-    with torch.no_grad():
+    for inputs, labels in test_dl:
-        for inputs, labels in test_dl:
+        inputs, labels = inputs.to(device), labels.to(device)
-            inputs, labels = inputs.to(device), labels.to(device)
+        if teacher:
-            if teacher:
+            outputs, _, _, _ = model(inputs)
-                outputs, _, _, _ = model(inputs)
+        else:
-            else:
+            outputs = model(inputs)
-                outputs = model(inputs)
+        _, predicted = torch.max(outputs.data, 1)
            _, predicted = torch.max(outputs.data, 1)
-            total += labels.size(0)
+        total += labels.size(0)
-            correct += (predicted == labels).sum().item()
+        correct += (predicted == labels).sum().item()
    accuracy = 100 * correct / total
    print(f"Test Accuracy: {accuracy:.2f}%")
    return accuracy
 def main():
    json_options = json_file_to_pyobj("wresnet16-audit-cifar10.json")
    training_configurations = json_options.training
@ -156,13 +131,17 @@ def main():
    print("Training student")
-    #train_knowledge_distillation(teacher=teacher, student=student, epochs=100, learning_rate=0.001, T=2, soft_target_loss_weight=0.25, ce_loss_weight=0.75, device=device)
+    train_knowledge_distillation(teacher=teacher, student=student, train_dl=train_loader, epochs=100, learning_rate=0.001, T=2, soft_target_loss_weight=0.25, ce_loss_weight=0.75, device=device)
-    #test_student = test(student, device)
+    print("Saving student")
-    test_teacher = test(teacher, device, True)
+    current_datetime = datetime.now()
    filename = f"students/studentmodel{current_datetime.strftime('%Y%m%d_%H%M%S')}.pt"
    torch.save(student.state_dict(), filename)
    print("Testing student and teacher")
    test_student = test(student, device, test_loader,)
    test_teacher = test(teacher, device, test_loader, True)
    print(f"Teacher accuracy: {test_teacher:.2f}%")
-    #print(f"Student accuracy: {test_student:.2f}%")
+    print(f"Student accuracy: {test_student:.2f}%")
 if __name__ == "__main__":
    main()