Skip to content

Commit

Permalink
[CI/Build]Reduce the time consumption for LoRA tests (vllm-project#7396)
Browse files Browse the repository at this point in the history
  • Loading branch information
jeejeelee authored Aug 14, 2024
1 parent 59edd0f commit 9799280
Show file tree
Hide file tree
Showing 3 changed files with 3 additions and 128 deletions.
106 changes: 0 additions & 106 deletions tests/lora/test_layer_variation.py

This file was deleted.

2 changes: 1 addition & 1 deletion tests/lora/test_punica_sizes.py
Original file line number Diff line number Diff line change
Expand Up @@ -98,7 +98,7 @@
128256,
]
#The size of TP
-divisibility = [1, 2, 4, 8, 16, 32, 64]
+divisibility = [1, 2, 8, 16, 64]

all_hidden_size = []
for div in divisibility:
Expand Down
23 changes: 2 additions & 21 deletions tests/lora/test_punica_variation.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,10 +20,10 @@
from .utils import (generate_data, generate_data_for_expand_nslices,
ref_torch_groupgemm)

-HIDDEN_SIZES = [3424, 4096, 4097]
+HIDDEN_SIZES = [4097]

BATCHES = [1, 4, 16, 32]
-NUM_LORA = [1, 4, 8, 16, 32, 64, 128]
+NUM_LORA = [1, 8, 32, 128]
DTYPES = [torch.float16, torch.bfloat16]
MAX_RANKS = [1, 4, 8, 16, 32, 64, 128, 256]
SCALES = [0.5]
Expand Down Expand Up @@ -321,22 +321,3 @@ def test_punica_expand_nslices(

slice_offset += hidden_size
assert_close(our_outputs, ref_outputs)


-if __name__ == "__main__":
-    from itertools import product
-
-    lst = list(
-        product(
-            BATCHES,
-            NUM_LORA,
-            MAX_RANKS,
-            [1.0],
-            [torch.float16],
-            ["expand"],
-            SEED,
-            CUDA_DEVICES,
-        ))
-    for ele in lst:
-        test_punica_bgmv(*ele)
-        print(f"{ele},pass")

0 comments on commit 9799280

Please sign in to comment.