4 lines
98 B
JSON
4 lines
98 B
JSON
{
    "fsdp_transformer_layer_cls_to_wrap": ["LlamaDecoderLayer"],
    "limit_all_gathers": true
}