.. |
__init__.py
|
c2aaaefd57
allow out-of-tree model registry
|
9 сар өмнө |
baichuan.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
bloom.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
chatglm.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
cohere.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
dbrx.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
decilm.py
|
e31c6f0b45
feat: refactor modeling logic and support more models (#274)
|
10 сар өмнө |
deepseek.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
falcon.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
gemma.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
gpt2.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
gpt_bigcode.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
gpt_j.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
gpt_neox.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
internlm2.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
llama.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
llava.py
|
4d33ce60da
feat: Triton flash attention backend for ROCm (#407)
|
9 сар өмнө |
mixtral.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
mpt.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
olmo.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
opt.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
phi.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
qwen.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
qwen2.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
qwen2moe.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |
stablelm.py
|
50c2434267
move megatron to a top-level directory
|
9 сар өмнө |