# Local Hyperparameter Optimization

This notebook is similar to the `classifier_hyp` notebook, but it runs the hyperparameter optimization locally instead of on Google Colab. The definitive version is the Google Colab one because we run many more iterations and parameter combinations there due to GPU availability.

In [1]:
import wandb

wandb.login()

[34m[1mwandb[0m: Currently logged in as: [33me1527193[0m ([33mflower-classification[0m). Use [1m`wandb login --relogin`[0m to force relogin


True

In [2]:
import torch
import torch.optim as optim
import torch.nn.functional as F
import torch.nn as nn
from torchvision import datasets, transforms
from torchvision.models import resnet50, ResNet50_Weights
from torch.utils.data import Dataset, DataLoader, random_split, SubsetRandomSampler
import numpy as np
import os
import time
import copy
import random
from sklearn import metrics

torch.manual_seed(42)
np.random.seed(42)

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

In [3]:
def build_dataset(batch_size):    
    data_transforms = {
        'train': transforms.Compose([
            transforms.RandomResizedCrop(224),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
        ]),
        'test': transforms.Compose([
            transforms.Resize(256),
            transforms.CenterCrop(224),
            transforms.ToTensor(),
            transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
        ]),
    }

    data_dir = 'plantsdata'
    dataset = datasets.ImageFolder(os.path.join(data_dir))

    # 90/10 split
    train_dataset, test_dataset = random_split(dataset, [0.9, 0.1])

    train_dataset.dataset.transform = data_transforms['train']
    test_dataset.dataset.transform = data_transforms['test']

    train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=batch_size,
                                               shuffle=True, num_workers=4)
    test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=batch_size,
                                             shuffle=True, num_workers=4)

    dataloaders = {'train': train_loader, 'test': test_loader}
    dataset_size = len(dataset)
    dataset_sizes = {'train': len(train_dataset), 'test': len(test_dataset)}
    class_names = dataset.classes

    return (dataloaders, dataset_sizes)

def build_network():
    network = resnet50(weights=ResNet50_Weights.DEFAULT)
    num_ftrs = network.fc.in_features

    # Add linear layer with number of classes
    network.fc = nn.Linear(num_ftrs, 2)

    return network.to(device)

def build_optimizer(network, optimizer, learning_rate, beta_one, beta_two, eps):
    if optimizer == "sgd":
        optimizer = optim.SGD(network.parameters(),
                              lr=learning_rate, momentum=0.9)
    elif optimizer == "adam":
        optimizer = optim.Adam(network.parameters(),
                               lr=learning_rate,
                               betas=(beta_one, beta_two),
                               eps=eps)
    return optimizer

def train_epoch(network, loader, optimizer, criterion, scheduler, dataset_sizes):
    network.train()
    running_loss = 0.0
    running_corrects = 0
    for _, (data, target) in enumerate(loader):
        data, target = data.to(device), target.to(device)
        optimizer.zero_grad()

        # ➡ Forward pass
        #loss = F.nll_loss(network(data), target)
        with torch.set_grad_enabled(True):
            outputs = network(data)
            _, preds = torch.max(outputs, 1)
            loss = criterion(outputs, target)
        
        #cumu_loss += loss.item()
        
        running_loss += loss.item() * data.size(0)
        running_corrects += torch.sum(preds == target.data)

        # ⬅ Backward pass + weight update
        loss.backward()
        optimizer.step()

        wandb.log({'train/batch_loss': loss.item()})

    scheduler.step()

    epoch_loss = running_loss / dataset_sizes['train']
    epoch_acc = running_corrects.double() / dataset_sizes['train']
    
    return (epoch_loss, epoch_acc)

def test(network, loader, optimizer, criterion, dataset_sizes):
    network.eval()
    confusion = torch.empty([0, 1])
    confusion = confusion.to(device)
    running_loss = 0.0
    test_corrects = 0
    for _, (data, target) in enumerate(loader):
        data, target = data.to(device), target.to(device)
        optimizer.zero_grad()

        # ➡ Forward pass
        with torch.set_grad_enabled(False):
            outputs = network(data)
            _, preds = torch.max(outputs, 1)
            loss = criterion(outputs, target)

        running_loss += loss.item() * data.size(0)
        test_corrects += torch.sum(preds == target.data)
        
        confusion = torch.cat((confusion, preds[:, None] / target.data[:, None]))

    tp = torch.sum(confusion == 1).item()
    fp = torch.sum(confusion == float('inf')).item()
    tn = torch.sum(torch.isnan(confusion)).item()
    fn = torch.sum(confusion == 0).item()
    
    precision = tp / (tp + fp)
    recall = tp / (tp + fn)
    f = 2 * ((precision * recall) / (precision + recall))
    
    epoch_loss = running_loss / dataset_sizes['test']
    epoch_acc = test_corrects.double() / dataset_sizes['test']
    
    return (epoch_loss, epoch_acc, precision, recall, f)

In [4]:
def train(config=None):
    # Initialize a new wandb run
    with wandb.init(config=config):
        # If called by wandb.agent, as below,
        # this config will be set by Sweep Controller
        config = wandb.config

        (dataloaders, dataset_sizes) = build_dataset(config.batch_size)
        network = build_network()
        optimizer = build_optimizer(network, config.optimizer, config.learning_rate, config.beta_one,
                                    config.beta_two, config.eps)
        criterion = nn.CrossEntropyLoss()
        # Decay LR by a factor of 0.1 every 7 epochs
        exp_lr_scheduler = optim.lr_scheduler.StepLR(optimizer, config.step_size, config.gamma)

        for epoch in range(config.epochs):            
            (epoch_loss, epoch_acc) = train_epoch(network, dataloaders['train'], optimizer,
                                                  criterion, exp_lr_scheduler,
                                                  dataset_sizes)
            wandb.log({"epoch": epoch, 'train/epoch_loss': epoch_loss, 'train/epoch_acc': epoch_acc})
            
            (test_loss, test_acc, test_precision, test_recall, test_f) = test(network, dataloaders['test'],
                                                                              optimizer, criterion,
                                                                              dataset_sizes)
            wandb.log({'test/epoch_loss': test_loss, 'test/epoch_acc': test_acc,
                       'test/precision': test_precision, 'test/recall': test_recall,
                       'test/f1-score': test_f})

In [5]:
sweep_config = {
    'method': 'random'
}

metric = {
    'name': 'test/epoch_acc',
    'goal': 'maximize'   
}

sweep_config['metric'] = metric

parameters_dict = {
    'optimizer': {
        'values': ['adam', 'sgd']
    },
}

sweep_config['parameters'] = parameters_dict

parameters_dict.update({
    'epochs': {
        'value': 10},
    'batch_size': {
        'values': [4, 8]},
    'learning_rate': {
        'values': [0.1, 0.01, 0.003, 0.001, 0.0003, 0.0001]},
    'step_size': {
        'values': [2, 3, 5, 7]},
    'gamma': {
        'values': [0.1, 0.5]},
    'beta_one': {
        'values': [0.9, 0.99]},
    'beta_two': {
        'values': [0.5, 0.9, 0.99, 0.999]},
    'eps': {
        'values': [1e-08, 0.1, 1]}
})

In [6]:
sweep_id = wandb.sweep(sweep_config, project="pytorch-sweeps-demo")

Create sweep with ID: eqwnoagh
Sweep URL: https://wandb.ai/flower-classification/pytorch-sweeps-demo/sweeps/eqwnoagh


In [7]:
wandb.agent(sweep_id, train, count=30)

[34m[1mwandb[0m: Agent Starting Run: znahtehx with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	step_size: 2


VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.127552…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▁▂▅▆▅▇▄▇▃█
test/epoch_loss,█▃▂▂▃▂▂▁▂▂
test/f1-score,▁▃▅▆▄▆▄▇▃█
test/precision,▁▁▃▅▆▇▄█▃▇
test/recall,▁▆▇▆▁▄▃▄▃█
train/batch_loss,█▇▆▆▆▆▅▄▄▃▅▅█▆▃█▆▇▂▆▅▅▁▃▆▄▃██▅▆▄▆▅▄▂▂▇▇▆
train/epoch_acc,▁▆▇▇▇███▇█
train/epoch_loss,█▄▂▂▂▁▁▁▂▁

0,1
epoch,9.0
test/epoch_acc,0.85556
test/epoch_loss,0.6166
test/f1-score,0.86022
test/precision,0.81633
test/recall,0.90909
train/batch_loss,0.66533
train/epoch_acc,0.75676
train/epoch_loss,0.61072


[34m[1mwandb[0m: Agent Starting Run: qutqx8ux with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.9
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1e-08
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	step_size: 2


VBox(children=(Label(value='0.004 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.129798…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▁▂▁▆▆█▇▆▃▅
test/epoch_loss,█▅▃▁▁▁▁▂▂▂
test/f1-score,▄▁▆█▇███▆▇
test/precision,▁▃▁▅▆█▆▅▃▄
test/recall,▅▁██▆▆██▆█
train/batch_loss,▄▁▃█▃▇▅▁▄▄▅▃▃▂▂▅▅▂▂▅▃▃▅▄▂▃▃▂▄▃▃▆▅▂▂▄▅▁▂▂
train/epoch_acc,▁▃▄▇▆▇█▇▇█
train/epoch_loss,█▄▃▂▂▁▁▁▁▁

0,1
epoch,9.0
test/epoch_acc,0.7
test/epoch_loss,0.55412
test/f1-score,0.71579
test/precision,0.59649
test/recall,0.89474
train/batch_loss,0.78966
train/epoch_acc,0.66585
train/epoch_loss,0.61866


[34m[1mwandb[0m: Agent Starting Run: 9j8etw77 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 0.1
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	step_size: 2


VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.127348…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▁█▇▇▇▆▆▆▆▆
test/epoch_loss,█▂▃▁▂▂▂▁▁▁
test/f1-score,▁█▆▇▇▅▆▅▅▅
test/precision,▁█▇█▇▆▆▇▇▇
test/recall,▄█▄▁█▁▄▁▁▁
train/batch_loss,▄▆██▄▃▃▅▂▃▄▅▃▄▂▃▁▁▁▄▂▃▄▁▄▂▂▁▁▃▃▄▂▂▂▅▂▃▃▄
train/epoch_acc,▁▅█▇▇███▇▇
train/epoch_loss,█▄▂▂▁▁▁▁▂▂

0,1
epoch,9.0
test/epoch_acc,0.75556
test/epoch_loss,0.6144
test/f1-score,0.76087
test/precision,0.67308
test/recall,0.875
train/batch_loss,0.65108
train/epoch_acc,0.7543
train/epoch_loss,0.62678


[34m[1mwandb[0m: Agent Starting Run: k23a02gb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1e-08
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	step_size: 5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▅▁▂▅▇▄▅▇█▇
test/epoch_loss,█▆▄▂▁▂▂▁▁▁
test/f1-score,▆▁▂▅▇▃▅▇█▇
test/precision,▁▁▄▅▇▆█▇█▆
test/recall,█▁▁▅▆▂▃▆▆▅
train/batch_loss,█▇▇▇▇▇▇▆▆▄▆▇▆▆▅▆▄▃▃▃▁▄▃▃▄▃▂▄▂▁▂▃▇▁▃▄▃▄▆▄
train/epoch_acc,▁▅▆▆▇█▇█▇█
train/epoch_loss,█▆▄▃▂▁▂▁▂▁

0,1
epoch,9.0
test/epoch_acc,0.88889
test/epoch_loss,0.30289
test/f1-score,0.86486
test/precision,0.91429
test/recall,0.82051
train/batch_loss,0.27111
train/epoch_acc,0.89681
train/epoch_loss,0.28549


[34m[1mwandb[0m: Agent Starting Run: 265qnj0c with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1e-08
[34m[1mwandb[0m: 	gamma: 0.5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	step_size: 3


VBox(children=(Label(value='0.010 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.369539…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▁▅▄▆▇█▇▇▆▆
test/epoch_loss,█▅▄▃▃▁▂▃▂▁
test/f1-score,▁▅▄▆▇██▇▆▇
test/precision,███▄▁▂▁▅▁▁
test/recall,▁▄▄▅▇██▇▆▇
train/batch_loss,██▇▇▅▅▃▆▂▃▂▂▂▂▄▄▂▂▂▂▄▁▂▅▃▁▁▁▂▆▂▃▃▁▁▁▂▂▁▂
train/epoch_acc,▁▅▆▇▇█████
train/epoch_loss,█▅▄▂▂▁▁▁▁▁

0,1
epoch,9.0
test/epoch_acc,0.88889
test/epoch_loss,0.26007
test/f1-score,0.8913
test/precision,0.95349
test/recall,0.83673
train/batch_loss,0.01167
train/epoch_acc,0.98034
train/epoch_loss,0.08153


[34m[1mwandb[0m: Agent Starting Run: eg199ue9 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.9
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1
[34m[1mwandb[0m: 	gamma: 0.5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	step_size: 3


VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.127718…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▇▆▆▁▅▆▃▃▃█
test/epoch_loss,█▄▃▄▄▅▂▄▃▁
test/f1-score,▇▆▆▁▅▆▄▃▄█
test/precision,▅▂█▃▁▂▁▄▁▅
test/recall,▇▇▅▁▆▇▅▃▅█
train/batch_loss,▆▆▆▆▃▂▂▄▂▂▁▃▂█▂▁▂▅▄▁▁▂▁▁▅▁▁▃▂▂▄▁▁▁▁▁▁▁▁▁
train/epoch_acc,▁▄▆▇▇▇████
train/epoch_loss,█▅▄▃▂▂▁▁▁▁

0,1
epoch,9.0
test/epoch_acc,0.9
test/epoch_loss,0.22746
test/f1-score,0.89655
test/precision,0.92857
test/recall,0.86667
train/batch_loss,0.13858
train/epoch_acc,0.98403
train/epoch_loss,0.07075


[34m[1mwandb[0m: Agent Starting Run: vdaaitvt with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	step_size: 7


VBox(children=(Label(value='0.003 MB of 0.003 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▁▄▆██▇▇▇▇▆
test/epoch_loss,█▇▆▄▃▂▁▁▁▁
test/f1-score,▁▄▆█▇▆▆▆▆▃
test/precision,▁▃▄▆▇▇▇███
test/recall,▇▇██▆▅▅▄▄▁
train/batch_loss,▇▇▇▆▇▆▆▆▆▅▆▅▆▆▆▇▅▅▄▅█▅▃▄▅▃▅▇▃▅▅▅▅▂▄▁▅▄▄▅
train/epoch_acc,▁▄▆▇▇███▇█
train/epoch_loss,█▇▆▅▄▃▂▁▂▁

0,1
epoch,9.0
test/epoch_acc,0.77778
test/epoch_loss,0.47685
test/f1-score,0.72222
test/precision,0.83871
test/recall,0.63415
train/batch_loss,0.37919
train/epoch_acc,0.82924
train/epoch_loss,0.45283


[34m[1mwandb[0m: Agent Starting Run: 16v61zix with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.003
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	step_size: 5


VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.127347…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▅▅▅██▁▅▅▁▁
test/epoch_loss,█▁▂▅▃▅▄▄▄▂
test/f1-score,▄▄▄█▇▁▄▄▁▁
test/precision,▃▅▃▁█▃▃▃▁▁
test/recall,▃▁▃█▁▁▃▃▃▃
train/batch_loss,█▆▇▇▂▂▅▆▄▆▂▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▂▁▁▁▂▁▁▁
train/epoch_acc,▁▅▇▇▇█████
train/epoch_loss,█▅▂▂▂▁▁▁▁▁

0,1
epoch,9.0
test/epoch_acc,0.92222
test/epoch_loss,0.16872
test/f1-score,0.92135
test/precision,0.91111
test/recall,0.93182
train/batch_loss,0.00228
train/epoch_acc,0.99877
train/epoch_loss,0.02303


[34m[1mwandb[0m: Agent Starting Run: gy76rrgz with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.999
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1
[34m[1mwandb[0m: 	gamma: 0.5
[34m[1mwandb[0m: 	learning_rate: 0.003
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	step_size: 3


VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.127052…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▃▃▁▃▃▆▆█▆▃
test/epoch_loss,█▆▄▃▂▂▁▁▁▁
test/f1-score,▄▃▁▃▃▆▆█▆▃
test/precision,▁█▇███████
test/recall,▆▃▁▃▃▆▆█▆▃
train/batch_loss,█▇██▇▆▇▃▅▃▇▄▄▄▃▆▃▅▃▅▃▁▇▅▃▄▄▆▂▅▂▂▃▁▁▂▂▁▃▁
train/epoch_acc,▁▅▅▆▇▇▇▇██
train/epoch_loss,█▆▅▃▃▂▂▂▁▁

0,1
epoch,9.0
test/epoch_acc,0.88889
test/epoch_loss,0.26282
test/f1-score,0.87179
test/precision,0.97143
test/recall,0.7907
train/batch_loss,0.1486
train/epoch_acc,0.88698
train/epoch_loss,0.31064


[34m[1mwandb[0m: Agent Starting Run: 4dx2f0j8 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1e-08
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	step_size: 5


VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.129230…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▁█▅▇▇▇▇▇▇█
test/epoch_loss,█▁▄▃▆▅▆▅▅▄
test/f1-score,▁█▅▇▇▇▇▇▇█
test/precision,▆▅▇▄█▄█▄▁▅
test/recall,▁█▅▇▇▇▇▇▇█
train/batch_loss,▅▅▆▃▄▃▃▂▂▂▂▂▁▃█▁▅▁▂▂▂▁▁▂▃▁▁▁▁▃▁▁▁▁▁▂▁▁▄▁
train/epoch_acc,▁▄▆▆▇█████
train/epoch_loss,█▆▄▃▂▂▂▁▁▁

0,1
epoch,9.0
test/epoch_acc,0.86667
test/epoch_loss,0.37958
test/f1-score,0.875
test/precision,0.95455
test/recall,0.80769
train/batch_loss,0.077
train/epoch_acc,0.9656
train/epoch_loss,0.09797


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: j93p9uxm with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1e-08
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	step_size: 7


VBox(children=(Label(value='0.010 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.369874…

0,1
epoch,▁▅█
test/epoch_acc,▁█
test/epoch_loss,█▁
test/f1-score,▁█
test/precision,▁█
test/recall,█▁
train/batch_loss,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▁█▁▁▆▅▁▁
train/epoch_acc,█▃▁
train/epoch_loss,▁▁█

0,1
epoch,2.0
test/epoch_acc,0.56667
test/epoch_loss,92431672.3021
test/f1-score,0.62136
test/precision,0.47761
test/recall,0.88889
train/batch_loss,7666.14648
train/epoch_acc,0.46929
train/epoch_loss,4618.08651


Run j93p9uxm errored: ZeroDivisionError('division by zero')
[34m[1mwandb[0m: [32m[41mERROR[0m Run j93p9uxm errored: ZeroDivisionError('division by zero')
[34m[1mwandb[0m: Agent Starting Run: pb5m44k2 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.999
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 1e-08
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	step_size: 5


VBox(children=(Label(value='0.003 MB of 0.003 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▃▃▄▅▆▆▇█
test/epoch_acc,▅▁▆▃▆▆▇▇▇█
test/epoch_loss,▅█▄▅▃▃▂▁▁▁
test/f1-score,▄▄▄▁▅▆▇▇▇█
test/precision,▆▁█▃▆▆█▇██
test/recall,▃█▂▁▄▆▅▆▅▇
train/batch_loss,▆▄▂▅▅▄▃▆█▃▂▄▂▁▃▂▄▁▂▂▄▃▅▂▂▅▂▂▃▄▁▄▃▁▂▄▂▂▃▄
train/epoch_acc,▁▁▃▃▄▄▆▆▇█
train/epoch_loss,█▇▇▆▅▅▃▃▂▁

0,1
epoch,9.0
test/epoch_acc,0.78889
test/epoch_loss,0.51027
test/f1-score,0.78161
test/precision,0.7234
test/recall,0.85
train/batch_loss,0.42048
train/epoch_acc,0.82555
train/epoch_loss,0.40512


[34m[1mwandb[0m: Agent Starting Run: q8m1yt6d with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	eps: 0.1
[34m[1mwandb[0m: 	gamma: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	step_size: 7


0,1
train/batch_loss,▁

0,1
train/batch_loss,0.67379


Run q8m1yt6d errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 20.00 MiB (GPU 0; 1.95 GiB total capacity; 1.30 GiB already allocated; 11.31 MiB free; 1.32 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run q8m1yt6d errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 20.00 MiB (GPU 0; 1.95 GiB total capacity; 1.30 GiB already allocated; 11.31 MiB free; 1.32 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: f3kiw40d with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99


VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

Run f3kiw40d errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 20.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 3.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run f3kiw40d errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 20.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 3.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: i0xsie8j with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 

Run i0xsie8j errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run i0xsie8j errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: bi477kch with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m

Run bi477kch errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run bi477kch errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: 7jmkpkmh with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	

Run 7jmkpkmh errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run 7jmkpkmh errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: pc0kaw45 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	e

VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

Run pc0kaw45 errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run pc0kaw45 errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: o04kggii with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.999
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 

VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.129182…

Run o04kggii errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run o04kggii errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: mr7zxx8m with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.9
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	e

VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.129362…

Run mr7zxx8m errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run mr7zxx8m errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: 292ds63r with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	e

VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.129560…

Run 292ds63r errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run 292ds63r errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: fdlwffsj with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.99
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	e

VBox(children=(Label(value='0.003 MB of 0.026 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.132928…

Run fdlwffsj errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run fdlwffsj errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: 3s4wltdw with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m[1mwandb[0m: 	beta_two: 0.9
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	e

Run 3s4wltdw errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run 3s4wltdw errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: kv0nxhmk with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.9
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	ep

VBox(children=(Label(value='0.010 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.375132…

Run kv0nxhmk errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run kv0nxhmk errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: ixbulpc8 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	ep

VBox(children=(Label(value='0.003 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.129490…

Run ixbulpc8 errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run ixbulpc8 errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: lfi2onyo with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.9
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	ep

Run lfi2onyo errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run lfi2onyo errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: 4uvn2tnq with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	ep

VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

Run 4uvn2tnq errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run 4uvn2tnq errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: y4niwbym with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	ep

VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

Run y4niwbym errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run y4niwbym errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Agent Starting Run: hxampiva with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.9
[34m[1mwandb[0m: 	beta_two: 0.5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	ep

VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

Run hxampiva errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run hxampiva errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: q1v8qruc with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	beta_one: 0.99
[34m

VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

Run q1v8qruc errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
[34m[1mwandb[0m: [32m[41mERROR[0m Run q1v8qruc errored: OutOfMemoryError('CUDA out of memory. Tried to allocate 2.00 MiB (GPU 0; 1.95 GiB total capacity; 1.32 GiB already allocated; 1.31 MiB free; 1.33 GiB reserved in total by PyTorch) If reserved memory is >> allocated memory try setting max_split_size_mb to avoid fragmentation.  See documentation for Memory Management and PYTORCH_CUDA_ALLOC_CONF')
