# Hydra experiment config: starts from the gpt2m-flash OWT experiment, then
# overrides the model config group with gpt2-large and the optimizer with
# adamw-zero.
# NOTE(review): this file was recovered from a rendered listing (line-number
# gutter, table pipes, and a "- " prefix on every line). The nesting below is
# reconstructed; original comments and any leading Hydra package header
# (e.g. "@package _global_") may have been lost -- confirm against the repo.
defaults:
  - /experiment/owt/gpt2m-flash.yaml
  - override /model/gpt2model: gpt2-large
  - override /optimizer: adamw-zero

datamodule:
  # Batch size is derived from train.gpu_mem: 4 when it is below 24,
  # 8 when below 40, 16 when below 80, otherwise 32.
  # Assumes the project registers an `eval` resolver with OmegaConf and that
  # train.gpu_mem is expressed in GB -- TODO confirm.
  batch_size: ${eval:"4 if ${train.gpu_mem} < 24 else (8 if ${train.gpu_mem} < 40 else (16 if ${train.gpu_mem} < 80 else 32))"}

trainer:
  # `_target_` names the class to build; the sibling keys are its keyword
  # arguments. Presumably these are forwarded to the underlying DDP wrapper --
  # verify against src/utils/ddp_zero1.py.
  strategy:
    _target_: src.utils.ddp_zero1.DDPStrategyZero1
    find_unused_parameters: false
    gradient_as_bucket_view: true