4 lines
101 B
JSON
4 lines
101 B
JSON
{
    "fsdp_transformer_layer_cls_to_wrap": ["InternLMDecoderLayer"],
    "limit_all_gathers": true
}