.. |
__init__.py
|
f8dfac6372
chore: attention refactor and upstream sync apr01 (#365)
|
vor 9 Monaten |
cpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
distributed_gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
executor_base.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
msgspec_utils.py
|
2f61644f6e
SPMD optimizations (#824)
|
vor 2 Monaten |
multiproc_gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
multiproc_worker_utils.py
|
22a4cd4595
core: fix spec decode metrics and envs circular import (#889)
|
vor 1 Monat |
multiproc_xpu_executor.py
|
15cb8d5c26
xpu: support pipeline parallel (#932)
|
vor 1 Monat |
neuron_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
openvino_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
ray_gpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
ray_tpu_executor.py
|
61103b92d4
tpu: support single and multi-host TPUs on GKE and RayServe (#970)
|
vor 1 Monat |
ray_utils.py
|
61103b92d4
tpu: support single and multi-host TPUs on GKE and RayServe (#970)
|
vor 1 Monat |
ray_xpu_executor.py
|
673621a3d2
xpu: refactor the model runner for tensor parallelism (#910)
|
vor 1 Monat |
tpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |
xpu_executor.py
|
0dfa6b60ec
core: support logprobs with multi-step scheduling (#963)
|
vor 1 Monat |