.. |
__init__.py
|
f8dfac6372
chore: attention refactor and upstream sync apr01 (#365)
|
11 months ago |
cpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
distributed_gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
executor_base.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
msgspec_utils.py
|
2f61644f6e
SPMD optimizations (#824)
|
3 months ago |
multiproc_gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
multiproc_worker_utils.py
|
22a4cd4595
core: fix spec decode metrics and envs circular import (#889)
|
2 months ago |
multiproc_xpu_executor.py
|
15cb8d5c26
xpu: support pipeline parallel (#932)
|
2 months ago |
neuron_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
openvino_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
ray_gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
ray_tpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
ray_utils.py
|
9f3e7c86e2
feat: add fused Marlin MoE kernel (#934)
|
2 months ago |
ray_xpu_executor.py
|
673621a3d2
xpu: refactor the model runner for tensor parallelism (#910)
|
2 months ago |
tpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |
xpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
2 months ago |