.. |
__init__.py
|
9d81716bfd
[v0.5.3] Release Candidate (#388)
|
8 months ago |
batch_expansion.py
|
3bb0f07461
chore: rename `task_handler` to `worker` (#985)
|
2 weeks ago |
draft_model_runner.py
|
5c3b94de45
spec decode: move ops.advane_step to flash attention backend (#1005)
|
1 week ago |
interfaces.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 months ago |
medusa_worker.py
|
3bb0f07461
chore: rename `task_handler` to `worker` (#985)
|
2 weeks ago |
metrics.py
|
2f61644f6e
SPMD optimizations (#824)
|
1 month ago |
mlp_speculator_worker.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 weeks ago |
multi_step_worker.py
|
3bb0f07461
chore: rename `task_handler` to `worker` (#985)
|
2 weeks ago |
ngram_worker.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 weeks ago |
proposer_worker_base.py
|
3bb0f07461
chore: rename `task_handler` to `worker` (#985)
|
2 weeks ago |
smaller_tp_proposer_worker.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 weeks ago |
spec_decode_worker.py
|
3bb0f07461
chore: rename `task_handler` to `worker` (#985)
|
2 weeks ago |
target_model_runner.py
|
3bb0f07461
chore: rename `task_handler` to `worker` (#985)
|
2 weeks ago |
top1_proposer.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 weeks ago |
util.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 weeks ago |