gpt3s-flash-8k.yaml 224 B

12345678910
  1. # @package _global_
  2. defaults:
  3. - /experiment/pile/gpt3s-flash.yaml
  4. datamodule:
  5. max_length: 8192
  6. batch_size: ${eval:"2 if ${train.gpu_mem} < 24 else (4 if ${train.gpu_mem} < 40 else 8)"}
  7. train:
  8. global_batch_size: 64