1
0

gpt3l-flash-8k.yaml 224 B

12345678910
  1. # @package _global_
  2. defaults:
  3. - /experiment/pile/gpt3l-flash.yaml
  4. datamodule:
  5. max_length: 8192
  6. batch_size: ${eval:"1 if ${train.gpu_mem} < 40 else (2 if ${train.gpu_mem} < 80 else 4)"}
  7. train:
  8. global_batch_size: 64