{ "fsdp_transformer_layer_cls_to_wrap": ["InternLMDecoderLayer"], "limit_all_gathers": true }