diff --git a/docs/source/usage_guides/fsdp.md b/docs/source/usage_guides/fsdp.md index 1a3eb51c8e4..58a6d0b6d4f 100644 --- a/docs/source/usage_guides/fsdp.md +++ b/docs/source/usage_guides/fsdp.md @@ -49,7 +49,7 @@ fsdp_config: fsdp_offload_params: false fsdp_sharding_strategy: 1 fsdp_state_dict_type: FULL_STATE_DICT - fsdp_transformer_layer_cls_to_wrap: GPT2Block + fsdp_transformer_layer_cls_to_wrap: BertLayer machine_rank: 0 main_process_ip: null main_process_port: null