Wres: wresnet with audit settings

This commit is contained in:
Akemi Izuko 2024-11-30 15:41:11 -07:00
parent c163e3062c
commit c1561c7d55
Signed by: akemi
GPG key ID: 8DE0764E1809E9FC
4 changed files with 25 additions and 20 deletions

View file

@ -45,7 +45,6 @@ class IndividualBlock1(nn.Module):
class IndividualBlockN(nn.Module): class IndividualBlockN(nn.Module):
def __init__(self, input_features, output_features, stride): def __init__(self, input_features, output_features, stride):
super(IndividualBlockN, self).__init__() super(IndividualBlockN, self).__init__()
@ -117,7 +116,6 @@ class WideResNet(nn.Module):
m.bias.data.zero_() m.bias.data.zero_()
def forward(self, x): def forward(self, x):
x = self.conv1(x) x = self.conv1(x)
attention1 = self.block1(x) attention1 = self.block1(x)
attention2 = self.block2(attention1) attention2 = self.block2(attention1)
@ -143,4 +141,4 @@ if __name__ == '__main__':
net(sample_input) net(sample_input)
# Summarize model # Summarize model
summary(net, input_size=(3, 32, 32)) summary(net, input_size=(3, 32, 32))

View file

@ -7,6 +7,7 @@ import numpy as np
import random import random
from utils import json_file_to_pyobj, get_loaders from utils import json_file_to_pyobj, get_loaders
from WideResNet import WideResNet from WideResNet import WideResNet
from tqdm import tqdm
def set_seed(seed=42): def set_seed(seed=42):
@ -17,25 +18,19 @@ def set_seed(seed=42):
torch.cuda.manual_seed(seed) torch.cuda.manual_seed(seed)
def _train_seed(net, loaders, device, dataset, log=False, checkpoint=False, logfile='', checkpointFile=''): def _train_seed(net, loaders, device, dataset, log=False, checkpoint=False, logfile='', checkpointFile='', epochs=200):
train_loader, test_loader = loaders train_loader, test_loader = loaders
if dataset == 'svhn':
epochs = 100
else:
epochs = 200
criterion = nn.CrossEntropyLoss() criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(net.parameters(), lr=0.1, momentum=0.9, nesterov=True, weight_decay=5e-4) optimizer = optim.SGD(net.parameters(), lr=0.1, momentum=0.9, nesterov=True, weight_decay=5e-4)
scheduler = MultiStepLR(optimizer, milestones=[int(elem*epochs) for elem in [0.3, 0.6, 0.8]], gamma=0.2) scheduler = MultiStepLR(optimizer, milestones=[int(elem*epochs) for elem in [0.3, 0.6, 0.8]], gamma=0.2)
best_test_set_accuracy = 0 best_test_set_accuracy = 0
for epoch in range(epochs): print(f"Training with {epochs} epochs")
for epoch in tqdm(range(epochs)):
net.train() net.train()
for i, data in enumerate(train_loader, 0): for i, data in tqdm(enumerate(train_loader, 0), leave=False):
inputs, labels = data inputs, labels = data
inputs = inputs.to(device) inputs = inputs.to(device)
labels = labels.to(device) labels = labels.to(device)
@ -89,18 +84,19 @@ def train(args):
wrn_depth = training_configurations.wrn_depth wrn_depth = training_configurations.wrn_depth
wrn_width = training_configurations.wrn_width wrn_width = training_configurations.wrn_width
dataset = training_configurations.dataset.lower() dataset = training_configurations.dataset.lower()
seeds = [int(seed) for seed in training_configurations.seeds] #seeds = [int(seed) for seed in training_configurations.seeds]
seeds = [int.from_bytes(os.urandom(8), byteorder='big')]
log = True if training_configurations.log.lower() == 'true' else False log = True if training_configurations.log.lower() == 'true' else False
if log: if log:
logfile = 'WideResNet-{}-{}-{}.txt'.format(wrn_depth, wrn_width, training_configurations.dataset) logfile = 'WideResNet-{}-{}-{}-{}-{}.txt'.format(wrn_depth, wrn_width, training_configurations.dataset, training_configurations.batch_size, training_configurations.epochs)
with open(logfile, 'w') as temp: with open(logfile, 'w') as temp:
temp.write('WideResNet-{}-{} on {}\n'.format(wrn_depth, wrn_width, training_configurations.dataset)) temp.write('WideResNet-{}-{} on {} {}batch for {} epochs\n'.format(wrn_depth, wrn_width, training_configurations.dataset, training_configurations.batch_size, training_configurations.epochs))
else: else:
logfile = '' logfile = ''
checkpoint = True if training_configurations.checkpoint.lower() == 'true' else False checkpoint = True if training_configurations.checkpoint.lower() == 'true' else False
loaders = get_loaders(dataset) loaders = get_loaders(dataset, training_configurations.batch_size)
if torch.cuda.is_available(): if torch.cuda.is_available():
device = torch.device('cuda:0') device = torch.device('cuda:0')
@ -121,7 +117,8 @@ def train(args):
net = net.to(device) net = net.to(device)
checkpointFile = 'wrn-{}-{}-seed-{}-{}-dict.pth'.format(wrn_depth, wrn_width, dataset, seed) if checkpoint else '' checkpointFile = 'wrn-{}-{}-seed-{}-{}-dict.pth'.format(wrn_depth, wrn_width, dataset, seed) if checkpoint else ''
best_test_set_accuracy = _train_seed(net, loaders, device, dataset, log, checkpoint, logfile, checkpointFile) epochs = training_configurations.epochs
best_test_set_accuracy = _train_seed(net, loaders, device, dataset, log, checkpoint, logfile, checkpointFile, epochs)
if log: if log:
with open(logfile, 'a') as temp: with open(logfile, 'a') as temp:

View file

@ -16,9 +16,9 @@ def json_file_to_pyobj(filename):
def get_loaders(dataset, train_batch_size=128, test_batch_size=10): def get_loaders(dataset, train_batch_size=128, test_batch_size=10):
print(f"Train batch size: {train_batch_size}")
if dataset == 'cifar10': if dataset == 'cifar10':
normalize = transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)) normalize = transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010))
train_transform = transforms.Compose([ train_transform = transforms.Compose([
@ -44,7 +44,6 @@ def get_loaders(dataset, train_batch_size=128, test_batch_size=10):
testloader = DataLoader(testset, batch_size=test_batch_size, shuffle=True, num_workers=4) testloader = DataLoader(testset, batch_size=test_batch_size, shuffle=True, num_workers=4)
elif dataset == 'svhn': elif dataset == 'svhn':
normalize = transforms.Normalize((0.4377, 0.4438, 0.4728), (0.1980, 0.2010, 0.1970)) normalize = transforms.Normalize((0.4377, 0.4438, 0.4728), (0.1980, 0.2010, 0.1970))
transform = transforms.Compose([ transform = transforms.Compose([

View file

@ -0,0 +1,11 @@
{
"training":{
"dataset": "CIFAR10",
"wrn_depth": 16,
"wrn_width": 1,
"checkpoint": "True",
"log": "True",
"batch_size": 4096,
"epochs": 200
}
}