Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
{
  "train_micro_batch_size_per_gpu": 1,
  "fp16": {
    "enabled": true,
    "loss_scale": 0,
    "loss_scale_window": 2000,
    "initial_scale_power": 15,
    "min_loss_scale": 0.0
  },
  "zero_optimization": {
    "stage": 2,
    "allgather_partitions": true,
    "allgather_bucket_size": 2e7,
    "reduce_scatter": true,
    "contiguous_gradients": true,
    "cpu_offload": true,
    "reduce_bucket_size": 2e7,
    "overlap_comm": true
  },
  "sparse_attention": {
    "mode": "fixed",
    "block": 16,
    "different_layout_per_head": true,
    "num_local_blocks": 8,
    "num_global_blocks": 1,
    "attention": "unidirectional",
    "horizontal_global_attention": false,
    "num_different_global_patterns": 8
  }
}
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement