dev-python/llmlingua
LLMLingua compresses the prompt and KV-cache to speed up LLM inference and enhance the model's perception of key information, achieving up to 20x compression with minimal performance loss.
Runtime Dependencies
llmlingua-0.2.1
dev-python/transformers[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
]
dev-python/accelerate[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
]
dev-python/torch[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
]
dev-python/tiktoken[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
]
dev-python/nltk[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
]
dev-python/numpy[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
]
dev?
( dev-python/transformers[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/accelerate[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/torch[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/tiktoken[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/nltk[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/numpy[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( ~dev-python/black-21.4_beta0[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( >=dev-python/flake8-3.8.3[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( >=dev-python/isort-5.5.4[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/pre-commit[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/pytest[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
dev?
( dev-python/pytest-xdist[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
quality?
( ~dev-python/black-21.4_beta0[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
quality?
( >=dev-python/flake8-3.8.3[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
quality?
( >=dev-python/isort-5.5.4[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
quality?
( dev-python/pre-commit[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
quality?
( dev-python/pytest[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
quality?
( dev-python/pytest-xdist[python_targets_python3_11
(-)
?
,python_targets_python3_12
(-)
?
,python_targets_python3_13
(-)
?
,python_targets_python3_14
(-)
?
] )
python_targets_python3_11?
( dev-lang/python:3.11 )
python_targets_python3_12?
( dev-lang/python:3.12 )
python_targets_python3_13?
( dev-lang/python:3.13 )
python_targets_python3_14?
( dev-lang/python:3.14 )


View
Download
Browse