# @package _global_
# NOTE: the package directive above must stay the first line of this file;
# Hydra only reads it from the leading header comments.
#
# gpt3s-hf.yaml: experiment config that builds on
# /experiment/pile/base.yaml and swaps the model config group to gpt2-hf,
# with the nested gpt2model group set to gpt2-small.
defaults:
  - /experiment/pile/base.yaml
  - override /model: gpt2-hf
  - override /model/gpt2model: gpt2-small

datamodule:
  batch_size: 8

train:
  # Use the standard torch.nn.CrossEntropyLoss
  # (explicit null overrides whatever loss_fn the base config sets).
  loss_fn: null