.. |
__init__.py
|
9d81716bfd
[v0.5.3] Release Candidate (#388)
|
8 kuukautta sitten |
abstract.py
|
7a313483f1
chore: move update_flash_attn_metadata to attn backend (#731)
|
3 kuukautta sitten |
blocksparse_attn.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 kuukautta sitten |
flash_attn.py
|
7a313483f1
chore: move update_flash_attn_metadata to attn backend (#731)
|
3 kuukautta sitten |
flashinfer.py
|
60b702a827
chore: register custom torch ops for flash-attn and flashinfer (#724)
|
3 kuukautta sitten |
ipex_attn.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 kuukautta sitten |
openvino.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 kuukautta sitten |
pallas.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 kuukautta sitten |
placeholder_attn.py
|
bf88c8567e
feat: mamba model support (#674)
|
4 kuukautta sitten |
rocm_flash_attn.py
|
e200775863
feat: enable using fp8 kv and prefix caching with chunked prefill (#668)
|
4 kuukautta sitten |
torch_sdpa.py
|
f1d0b77c92
[0.6.0] Release Candidate (#481)
|
4 kuukautta sitten |
utils.py
|
3bbb3f2086
feat: add numpy implementation of `compute_slot_mapping` (#678)
|
4 kuukautta sitten |
xformers.py
|
e200775863
feat: enable using fp8 kv and prefix caching with chunked prefill (#668)
|
4 kuukautta sitten |