From 54e84ffa903181d09d0002b8bd30e16de281728b Mon Sep 17 00:00:00 2001 From: Avik Pal Date: Thu, 7 Nov 2024 20:35:53 -0500 Subject: [PATCH] chore: update ConvMixer to latest deps --- examples/ConvMixer/Project.toml | 2 +- examples/ConvMixer/README.md | 2 +- examples/ConvMixer/main.jl | 6 +++--- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/examples/ConvMixer/Project.toml b/examples/ConvMixer/Project.toml index 3dc33ee4d..d1ffac2cd 100644 --- a/examples/ConvMixer/Project.toml +++ b/examples/ConvMixer/Project.toml @@ -31,7 +31,7 @@ LuxCUDA = "0.3.2" MLDatasets = "0.7.14" MLUtils = "0.4.4" OneHotArrays = "0.2.5" -Optimisers = "0.3.3, 0.4" +Optimisers = "0.4" PreferenceTools = "0.1.2" Printf = "1.10" ProgressBars = "1.5.1" diff --git a/examples/ConvMixer/README.md b/examples/ConvMixer/README.md index f7003505a..f072c1074 100644 --- a/examples/ConvMixer/README.md +++ b/examples/ConvMixer/README.md @@ -17,7 +17,7 @@ julia --startup-file=no \ --threads=auto \ main.jl \ --lr-max=0.05 \ - --weight-decay=0.000005 + --weight-decay=0.0001 ``` Here's an example of the output of the above command (on a V100 32GB GPU): diff --git a/examples/ConvMixer/main.jl b/examples/ConvMixer/main.jl index 56ca4115f..03ddc63a5 100644 --- a/examples/ConvMixer/main.jl +++ b/examples/ConvMixer/main.jl @@ -22,17 +22,17 @@ function get_dataloaders(batchsize) cifar10_std = (0.2471, 0.2435, 0.2616) train_transform = RandomResizeCrop((32, 32)) |> - Maybe(FlipX()) |> + Maybe(FlipX{2}()) |> ImageToTensor() |> Normalize(cifar10_mean, cifar10_std) test_transform = ImageToTensor() |> Normalize(cifar10_mean, cifar10_std) trainset = TensorDataset(CIFAR10(:train), train_transform) - trainloader = DataLoader(trainset; batchsize, shuffle=true, buffer=true, parallel=true) + trainloader = DataLoader(trainset; batchsize, shuffle=true, parallel=true) testset = TensorDataset(CIFAR10(:test), test_transform) - testloader = DataLoader(testset; batchsize, shuffle=false, buffer=true, parallel=true) + testloader = DataLoader(testset; batchsize, shuffle=false, parallel=true) return trainloader, testloader end