# @package _global_
# NOTE: keep the package directive above as the first line of the file (no
# `---` marker or other comment before it) so Hydra reads it from the header.
#
# gpt3l-hf.yaml: overrides layered on top of the gpt3s-hf experiment config.
# NOTE(review): the nesting below was reconstructed from a listing that had
# lost its indentation; confirm the key paths against the base config.
defaults:
  - /experiment/pile/gpt3s-hf.yaml

# Model-shape overrides (presumably hidden width, attention heads and layer
# count of the model config; verify against the consumer of `model.config`).
model:
  config:
    n_embd: 1536
    n_head: 16
    n_layer: 24

# NOTE(review): whether this is a per-device or global batch size is not
# visible from this file; confirm in the datamodule.
datamodule:
  batch_size: 2

# Learning-rate override for the optimizer configured by the base experiment.
train:
  optimizer:
    lr: 2.5e-4