# @package _global_
# gpt3l-flash-rotary.yaml
# Experiment override layered on top of the gpt3l-flash experiment config:
# it turns off absolute position embeddings and sets the rotary embedding
# fraction instead.
# NOTE: keep the `@package` directive as the first line of this file.
defaults:
  # Base experiment whose settings this file overrides.
  - /experiment/pile/gpt3l-flash.yaml

model:
  config:
    max_position_embeddings: 0  # Disable absolute position embedding
    # NOTE(review): presumably the fraction of each head's dimension that
    # receives rotary embeddings; confirm against the model implementation.
    rotary_emb_fraction: 0.5