.. |
__init__.py
|
9d81716bfd
[v0.5.3] Release Candidate (#388)
|
пре 8 месеци |
batch_expansion.py
|
d8a51d05a7
fix: seeded gens with pipeline parallel
|
пре 4 месеци |
draft_model_runner.py
|
4d4e767838
ci: take one of fixing lint issues
|
пре 4 месеци |
interfaces.py
|
3a53ff1e01
fix: raise an error for no draft token case when draft_tp>1
|
пре 5 месеци |
medusa_worker.py
|
d8a51d05a7
fix: seeded gens with pipeline parallel
|
пре 4 месеци |
metrics.py
|
4d4e767838
ci: take one of fixing lint issues
|
пре 4 месеци |
mlp_speculator_worker.py
|
d8a51d05a7
fix: seeded gens with pipeline parallel
|
пре 4 месеци |
multi_step_worker.py
|
84a9cd25c9
fix: some naming issues
|
пре 4 месеци |
ngram_worker.py
|
6b1fdd07bd
chore: add isort and refactor formatting script and utils
|
пре 4 месеци |
proposer_worker_base.py
|
d638dc592d
fix: some minor typing issues in spec decode
|
пре 5 месеци |
smaller_tp_proposer_worker.py
|
16dff9babc
chore: enable bonus token in spec decoding for KV cache based models
|
пре 5 месеци |
spec_decode_worker.py
|
4d4e767838
ci: take one of fixing lint issues
|
пре 4 месеци |
target_model_runner.py
|
a4cbcfe59f
feat: disable logprob serialization to CPU for spec decode
|
пре 5 месеци |
top1_proposer.py
|
3a53ff1e01
fix: raise an error for no draft token case when draft_tp>1
|
пре 5 месеци |
util.py
|
edffcecc67
chore: add proper logging for spec decoding verification
|
пре 4 месеци |