.. |
__init__.py
|
bbde979ecd
DeepSeek-V2 (#579)
|
7 bulan lalu |
arctic.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
baichuan.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |
bloom.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
chatglm.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |
clip.py
|
3a0fdf7b9b
chore: remove `image_input_type` from VLM config
|
7 bulan lalu |
commandr.py
|
da6765c084
feat: lora support for commandr models
|
7 bulan lalu |
dbrx.py
|
b2cb5a92e9
fix: missing cache_config for dbrx
|
7 bulan lalu |
decilm.py
|
56e0b8223c
chore: add base class for LoRA-supported models
|
7 bulan lalu |
deepseek.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
deepseek_v2.py
|
bbde979ecd
DeepSeek-V2 (#579)
|
7 bulan lalu |
falcon.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
gemma.py
|
b6ff0623a6
chore: clean up branding
|
7 bulan lalu |
gpt2.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
gpt_bigcode.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
gpt_j.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
gpt_neox.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
interfaces.py
|
85ef2fe8b1
chore: clean up placeholder symbols
|
7 bulan lalu |
internlm2.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
jais.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
llama.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |
llama_embedding.py
|
50b7c13db0
refactor: attention selector (#552)
|
7 bulan lalu |
llava.py
|
3a0fdf7b9b
chore: remove `image_input_type` from VLM config
|
7 bulan lalu |
llava_next.py
|
3a0fdf7b9b
chore: remove `image_input_type` from VLM config
|
7 bulan lalu |
minicpm.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |
mixtral.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |
mixtral_quant.py
|
b6ff0623a6
chore: clean up branding
|
7 bulan lalu |
mlp_speculator.py
|
de7e6919c0
feat: support tied weights and input scale for MLPSpeculator
|
7 bulan lalu |
mpt.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
olmo.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
opt.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
orion.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
phi.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |
phi3_small.py
|
696f2cd59c
add phi3_small support with blocksparse attention
|
7 bulan lalu |
phi3v.py
|
3a0fdf7b9b
chore: remove `image_input_type` from VLM config
|
7 bulan lalu |
qwen.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
qwen2.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |
qwen2_moe.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
stablelm.py
|
656459fd84
make fp8_e4m3 work on nvidia
|
7 bulan lalu |
starcoder2.py
|
ac79d115b3
add guards for prefix caching, fp8, chunked, etc
|
7 bulan lalu |
xverse.py
|
c5d8028668
fix: no need to redefine supports_vision and supports_lora in model class
|
7 bulan lalu |