# SkyPilot task definition: ResNet-50 training with RandAugment using timm.
name: resnet50-randaug

# Candidate accelerator configurations for this task (4 GPUs each).
# NOTE(review): presumably these are the alternatives compared by SkyPilot's
# benchmarking flow - confirm against the SkyPilot benchmark documentation.
resources:
  candidates:
    - {accelerators: T4:4}
    - {accelerators: V100:4}

# Local directory used as the task's working directory.
# NOTE(review): the setup step applies ../callback.patch and
# ../dummy_dataset.patch from inside the cloned repo, so both patch files are
# expected to live in this directory - confirm.
workdir: ./examples/benchmark/timm

# Environment preparation: create the conda env, install SkyCallback, fetch
# timm at a pinned tag, and apply the two local patches.
setup: |
  conda create -n timm python=3.8 -y
  conda activate timm

  # Install SkyCallback
  pip install "git+https://github.com/skypilot-org/skypilot.git#egg=sky-callback&subdirectory=sky/callbacks/"

  # User setup
  git clone https://github.com/rwightman/pytorch-image-models.git timm
  # Stop here if the clone is missing so the commands below never run in the
  # wrong directory.
  cd timm || exit 1
  git checkout v0.5.4
  pip install -r requirements.txt

  # Apply the patch to enable SkyCallback
  git apply ../callback.patch

  # Apply the patch to use a dummy ImageNet dataset to avoid data downloading
  git apply ../dummy_dataset.patch

# Training command: launches train.py with 4 processes per node
# (--nproc_per_node=4), matching the 4-accelerator resource candidates.
run: |
  conda activate timm
  # Abort if the repo directory is missing rather than launching from the
  # wrong location.
  cd timm || exit 1
  python3 -m torch.distributed.launch --nproc_per_node=4 train.py \
    -b 64 --model resnet50 --sched cosine --epochs 200 --lr 0.05 \
    --amp --remode pixel --reprob 0.6 --aug-splits 3 \
    --aa rand-m9-mstd0.5-inc1 --resplit --split-bn --jsd \
    --dist-bn reduce
