Skip to content

Commit

Permalink
logs
Browse files: browse the repository at this point in the history
  • Loading branch information
dakinggg committed Apr 12, 2024
1 parent e7ac0a9 commit b9a5abc
Showing 1 changed file with 6 additions and 0 deletions.
6 changes: 6 additions & 0 deletions scripts/train/train.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -102,12 +102,18 @@ def validate_config(cfg: DictConfig):
'`load_in_8bit` is only supported for evaluation rather than training.'
)

print('in validate')
print(cfg.model.get('ffn_config', {}).get('ffn_type', 'mptmlp'))
print(cfg.model.get('ffn_config', {}).get('ffn_type', 'mptmlp') in ffns_with_megablocks)
if cfg.model.get('ffn_config', {}).get('ffn_type',
'mptmlp') in ffns_with_megablocks:
print('inside')
moe_world_size = cfg.model.get('ffn_config',
{}).get('moe_world_size', 1)
print(moe_world_size)
use_orig_params = cfg.get('fsdp_config',
{}).get('use_orig_params', True)
print(use_orig_params)
if moe_world_size > 1 and not use_orig_params:
raise ValueError(
f'MoEs with expert parallelism (moe_world_size {moe_world_size} > 1) require `use_orig_params=True`.'
Expand Down

0 comments on commit b9a5abc

Please sign in to comment.