Advertisement
Guest User

gpt3_large_2048_off.json

a guest
Aug 21st, 2021
164
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
JSON 0.74 KB | None | 0 0
  1. {
  2.   "train_micro_batch_size_per_gpu": 1,
  3.   "fp16": {
  4.     "enabled": true,
  5.     "loss_scale": 0,
  6.     "loss_scale_window": 2000,
  7.     "initial_scale_power": 15,
  8.     "min_loss_scale": 0.0
  9.   },
  10.   "zero_optimization": {
  11.     "stage": 2,
  12.     "allgather_partitions": true,
  13.     "allgather_bucket_size": 2e7,
  14.     "reduce_scatter": true,
  15.     "contiguous_gradients": true,
  16.     "cpu_offload": true,
  17.     "reduce_bucket_size": 2e7,
  18.     "overlap_comm": true
  19.   },
  20.   "sparse_attention": {
  21.     "mode": "fixed",
  22.     "block": 16,
  23.     "different_layout_per_head": true,
  24.     "num_local_blocks": 8,
  25.     "num_global_blocks": 1,
  26.     "attention": "unidirectional",
  27.     "horizontal_global_attention": false,
  28.     "num_different_global_patterns": 8
  29.   }
  30. }
  31.  
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement