"""SkyPilot example: define a single 'train' task that requests a TPU and launch it.

The script builds a ``sky.Dag`` containing one ``sky.Task`` (working directory,
setup command, run command), attaches a ``tpu-v3-8`` resource request to it,
and hands the DAG to ``sky.launch``.
"""
import sky

# NOTE(review): tasks created inside the `with` block are presumably
# registered on `dag` by the context manager -- confirm against the SkyPilot
# API docs.
with sky.Dag() as dag:
    # The working directory contains all code and will be synced to remote.
    workdir = './examples/tpu/tpu_app_code'

    # The setup command. Will be run under the working directory.
    # Built from adjacent string literals (instead of backslash-newline
    # continuations inside one literal) so that source indentation can never
    # leak into the shell command.
    # Shell logic: upgrade pip and activate the 'huggingface' conda env; if
    # either step fails, create the env, activate it and install requirements.
    setup = ('pip install --upgrade pip && '
             'conda activate huggingface || '
             '(conda create -n huggingface python=3.8 -y && '
             'conda activate huggingface && '
             'pip install -r requirements.txt)')

    # The command to run. Will be run under the working directory.
    run = 'conda activate huggingface && python -u run_tpu.py'

    train = sky.Task(
        'train',
        workdir=workdir,
        setup=setup,
        run=run,
    )
    # Resources are passed as a set containing a single candidate.
    train.set_resources({
        sky.Resources(
            accelerators='tpu-v3-8',
            accelerator_args={
                'runtime_version': '2.12.0',
                # NOTE(review): this looks like a user-specific TPU name --
                # presumably it should be changed per user/project; confirm.
                'tpu_name': 'weilin-bert-test-big',
            },
        ),
    })

# NOTE(review): indentation was lost in the pasted source; launching after the
# `with` block has closed is assumed to be the intended placement -- confirm.
sky.launch(dag)