Skip to content

Commit

Permalink
address pr feedback
Browse files Browse the repository at this point in the history
  • Loading branch information
maxjeblick committed Dec 11, 2024
1 parent 8eb3b3d commit 519222b
Show file tree
Hide file tree
Showing 3 changed files with 12 additions and 3 deletions.
1 change: 1 addition & 0 deletions kvpress/presses/composed_press.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
from dataclasses import dataclass

from kvpress.presses.base_press import BasePress


Expand Down
12 changes: 10 additions & 2 deletions tests/integration/test_ruler.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,15 @@
from transformers import DynamicCache, QuantizedCacheConfig, QuantoQuantizedCache
from transformers.utils import is_flash_attn_2_available, is_optimum_quanto_available

-from kvpress import ExpectedAttentionPress, KnormPress, SnapKVPress, StreamingLLMPress, ThinKPress, TOVAPress
+from kvpress import (
+    ExpectedAttentionPress,
+    KnormPress,
+    SimLayerKVPress,
+    SnapKVPress,
+    StreamingLLMPress,
+    ThinKPress,
+    TOVAPress,
+)
from tests.fixtures import kv_press_llama3_1_flash_attn_pipeline # noqa: F401


Expand All @@ -18,7 +26,7 @@ def df_ruler():
@pytest.mark.skipif(not torch.cuda.is_available(), reason="GPU is not available")
@pytest.mark.skipif(not is_flash_attn_2_available(), reason="flash_attn is not installed")
 @pytest.mark.parametrize(
-    "cls", [KnormPress, ExpectedAttentionPress, StreamingLLMPress, SnapKVPress, TOVAPress, ThinKPress]
+    "cls", [KnormPress, ExpectedAttentionPress, StreamingLLMPress, SnapKVPress, TOVAPress, ThinKPress, SimLayerKVPress]
 )
@pytest.mark.parametrize("compression_ratio", [0.1, 0.2])
@pytest.mark.parametrize("cache", ["dynamic", "quantized"])
Expand Down
2 changes: 1 addition & 1 deletion tests/presses/test_presses.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,8 +12,8 @@
KnormPress,
ObservedAttentionPress,
RandomPress,
-    SnapKVPress,
     SimLayerKVPress,
+    SnapKVPress,
StreamingLLMPress,
TOVAPress,
)
Expand Down

0 comments on commit 519222b

Please sign in to comment.