# @package _global_
# ^ Keep the package directive as the very first line of the file: Hydra reads
#   it from the leading header comments only.
#
# gpt3-2.7B-hf.yaml
# Experiment overrides layered on top of the config listed under `defaults`.
# This file sets only the model shape, the datamodule batch size and the
# optimizer learning rate; everything else comes from the base config.
defaults:
  - /experiment/pile/gpt3xl-hf.yaml

model:
  config:
    # Embedding width, attention head count and layer count.
    # 2560 / 32 heads = 80 dimensions per head.
    # NOTE(review): presumably the ~2.7B-parameter shape implied by the file
    # name -- confirm against the model definition.
    n_embd: 2560
    n_head: 32
    n_layer: 32

datamodule:
  # NOTE(review): presumably a per-device batch size, with the effective batch
  # size governed by settings in the base config -- confirm.
  batch_size: 1

train:
  optimizer:
    # Written with a decimal point and a signed exponent so that YAML 1.1
    # loaders also resolve it as a float rather than a string.
    lr: 1.6e-4