.. |
__init__.py
|
89a2c6dee1
chore: refactor `MultiModalConfig` initialization and profiling (#745)
|
3 miesięcy temu |
arctic.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
baichuan.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
bart.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
blip.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
blip2.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
bloom.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
chameleon.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
chatglm.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
clip.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
commandr.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
dbrx.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
decilm.py
|
3f712cd287
feat: add progress bar for loading individual weight modules (#640)
|
4 miesięcy temu |
deepseek.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
deepseek_v2.py
|
4ec08af18b
chore: update fused MoE weight loading (#700)
|
4 miesięcy temu |
exaone.py
|
08711d2ac9
feat: add Exaone model support (#743)
|
3 miesięcy temu |
falcon.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
fuyu.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
gemma.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
gemma2.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
gpt2.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
gpt_bigcode.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
gpt_j.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
gpt_neox.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
idefics2_vision_model.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 miesięcy temu |
interfaces.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
intern_vit.py
|
3f712cd287
feat: add progress bar for loading individual weight modules (#640)
|
4 miesięcy temu |
internlm2.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
internvl.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
jais.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
jamba.py
|
d34e083c48
feat: add experts_int8 support (#730)
|
3 miesięcy temu |
llama.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
llama_embedding.py
|
3f712cd287
feat: add progress bar for loading individual weight modules (#640)
|
4 miesięcy temu |
llava.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
llava_next.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
mamba.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
mamba_cache.py
|
bf88c8567e
feat: mamba model support (#674)
|
4 miesięcy temu |
medusa.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
minicpm.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
minicpmv.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
mixtral.py
|
4ec08af18b
chore: update fused MoE weight loading (#700)
|
4 miesięcy temu |
mixtral_quant.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
mlp_speculator.py
|
3f712cd287
feat: add progress bar for loading individual weight modules (#640)
|
4 miesięcy temu |
mpt.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
na_vit.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 miesięcy temu |
nemotron.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
olmo.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
opt.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
orion.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
paligemma.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
persimmon.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
phi.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
phi3_small.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
phi3v.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
qwen.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
qwen2.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
qwen2_moe.py
|
4ec08af18b
chore: update fused MoE weight loading (#700)
|
4 miesięcy temu |
siglip.py
|
0b8b407b6d
feat: support profiling with multiple multi-modal inputs per prompt (#712)
|
4 miesięcy temu |
solar.py
|
0c6f03b7e4
feat: add Solar model support (#701)
|
4 miesięcy temu |
stablelm.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
starcoder2.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |
utils.py
|
3693028340
feat: support for Audio modality (#698)
|
4 miesięcy temu |
xverse.py
|
0e558e9b2f
fix: loading chameleon model with TP>1 (#695)
|
4 miesięcy temu |