Skip to content

Commit 42ac877

Browse files
committed Mar 11, 2025 ·
fix axolotl example
1 parent fc199fe commit 42ac877

File tree

2 files changed

+24
-1
lines changed

2 files changed

+24
-1
lines changed
 

‎example/axolotl_example/start_job.py

+1 -1
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,6 @@
7 7
job = ow.axolotl.create(
8 8
local_config_dir=os.path.dirname(__file__),
9 9
command='axolotl train llama_3_70b_fft.yaml',
10-
allowed_hardware=['8x H100']
10+
allowed_hardware=['8x H100', '8x A100', '8x H100S', '8x H100N', '8x A100S']
11 11
)
12 12
print(job)

‎example/axolotl_example/zero1.json

+23
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
{
2+
"zero_optimization": {
3+
"stage": 1,
4+
"overlap_comm": true
5+
},
6+
"bf16": {
7+
"enabled": "auto"
8+
},
9+
"fp16": {
10+
"enabled": "auto",
11+
"auto_cast": false,
12+
"loss_scale": 0,
13+
"initial_scale_power": 32,
14+
"loss_scale_window": 1000,
15+
"hysteresis": 2,
16+
"min_loss_scale": 1
17+
},
18+
"gradient_accumulation_steps": "auto",
19+
"gradient_clipping": "auto",
20+
"train_batch_size": "auto",
21+
"train_micro_batch_size_per_gpu": "auto",
22+
"wall_clock_breakdown": false
23+
}

0 commit comments

Comments
 (0)
Please sign in to comment.