Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
01bfb22b
Unverified
Commit
01bfb22b
authored
Mar 25, 2024
by
SangBin Cho
Committed by
GitHub
Mar 25, 2024
Browse files
[CI] Try introducing isort. (#3495)
parent
e67c295b
Changes
144
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
70 additions
and
59 deletions
+70
-59
tests/lora/test_tokenizer_group.py
tests/lora/test_tokenizer_group.py
+3
-1
tests/lora/test_utils.py
tests/lora/test_utils.py
+1
-1
tests/lora/test_worker.py
tests/lora/test_worker.py
+2
-2
tests/models/test_marlin.py
tests/models/test_marlin.py
+3
-1
tests/samplers/test_logprobs.py
tests/samplers/test_logprobs.py
+1
-1
tests/samplers/test_rejection_sampler.py
tests/samplers/test_rejection_sampler.py
+2
-3
tests/samplers/test_sampler.py
tests/samplers/test_sampler.py
+1
-2
tests/samplers/test_seeded_generate.py
tests/samplers/test_seeded_generate.py
+1
-1
tests/spec_decode/test_batch_expansion.py
tests/spec_decode/test_batch_expansion.py
+2
-2
tests/spec_decode/test_metrics.py
tests/spec_decode/test_metrics.py
+3
-3
tests/spec_decode/test_multi_step_worker.py
tests/spec_decode/test_multi_step_worker.py
+10
-9
tests/spec_decode/test_spec_decode_worker.py
tests/spec_decode/test_spec_decode_worker.py
+11
-9
tests/spec_decode/test_utils.py
tests/spec_decode/test_utils.py
+4
-4
tests/spec_decode/utils.py
tests/spec_decode/utils.py
+11
-9
tests/test_cache_block_hashing.py
tests/test_cache_block_hashing.py
+1
-1
tests/test_sequence.py
tests/test_sequence.py
+1
-1
tests/tokenization/test_cached_tokenizer.py
tests/tokenization/test_cached_tokenizer.py
+3
-1
tests/tokenization/test_detokenize.py
tests/tokenization/test_detokenize.py
+5
-5
tests/tokenization/test_tokenizer_group.py
tests/tokenization/test_tokenizer_group.py
+4
-2
tests/worker/test_swap.py
tests/worker/test_swap.py
+1
-1
No files found.
tests/lora/test_tokenizer_group.py
View file @
01bfb22b
import
pytest
import
pytest
from
transformers
import
AutoTokenizer
,
PreTrainedTokenizerBase
from
transformers
import
AutoTokenizer
,
PreTrainedTokenizerBase
from
vllm.lora.request
import
LoRARequest
from
vllm.lora.request
import
LoRARequest
from
vllm.transformers_utils.tokenizer_group
import
get_tokenizer_group
from
vllm.transformers_utils.tokenizer
import
get_lora_tokenizer
from
vllm.transformers_utils.tokenizer
import
get_lora_tokenizer
from
vllm.transformers_utils.tokenizer_group
import
get_tokenizer_group
from
..conftest
import
get_tokenizer_pool_config
from
..conftest
import
get_tokenizer_pool_config
...
...
tests/lora/test_utils.py
View file @
01bfb22b
...
@@ -2,8 +2,8 @@ from collections import OrderedDict
...
@@ -2,8 +2,8 @@ from collections import OrderedDict
from
torch
import
nn
from
torch
import
nn
from
vllm.lora.utils
import
parse_fine_tuned_lora_name
,
replace_submodule
from
vllm.utils
import
LRUCache
from
vllm.utils
import
LRUCache
from
vllm.lora.utils
import
(
parse_fine_tuned_lora_name
,
replace_submodule
)
def
test_parse_fine_tuned_lora_name
():
def
test_parse_fine_tuned_lora_name
():
...
...
tests/lora/test_worker.py
View file @
01bfb22b
...
@@ -3,10 +3,10 @@ import random
...
@@ -3,10 +3,10 @@ import random
import
tempfile
import
tempfile
from
unittest.mock
import
patch
from
unittest.mock
import
patch
from
vllm.config
import
(
DeviceConfig
,
LoRAConfig
,
ModelConfig
,
ParallelConfig
,
SchedulerConfig
)
from
vllm.lora.models
import
LoRAMapping
from
vllm.lora.models
import
LoRAMapping
from
vllm.lora.request
import
LoRARequest
from
vllm.lora.request
import
LoRARequest
from
vllm.config
import
(
ModelConfig
,
ParallelConfig
,
SchedulerConfig
,
DeviceConfig
,
LoRAConfig
)
from
vllm.worker.worker
import
Worker
from
vllm.worker.worker
import
Worker
...
...
tests/models/test_marlin.py
View file @
01bfb22b
...
@@ -11,9 +11,11 @@ up to 3 times to see if we pass.
...
@@ -11,9 +11,11 @@ up to 3 times to see if we pass.
Run `pytest tests/models/test_marlin.py --forked`.
Run `pytest tests/models/test_marlin.py --forked`.
"""
"""
from
dataclasses
import
dataclass
import
pytest
import
pytest
import
torch
import
torch
from
dataclasses
import
dataclass
from
vllm.model_executor.layers.quantization
import
(
from
vllm.model_executor.layers.quantization
import
(
_QUANTIZATION_CONFIG_REGISTRY
)
_QUANTIZATION_CONFIG_REGISTRY
)
...
...
tests/samplers/test_logprobs.py
View file @
01bfb22b
import
pytest
import
pytest
import
torch
import
torch
from
tests.conftest
import
VllmRunner
from
tests.conftest
import
VllmRunner
from
vllm
import
SamplingParams
from
vllm
import
SamplingParams
MODELS
=
[
"facebook/opt-125m"
]
MODELS
=
[
"facebook/opt-125m"
]
...
...
tests/samplers/test_rejection_sampler.py
View file @
01bfb22b
"""Tests for rejection sampling."""
"""Tests for rejection sampling."""
import
pytest
from
typing
import
List
,
Tuple
from
typing
import
List
,
Tuple
import
pytest
import
torch
import
torch
import
torch.nn.functional
as
F
import
torch.nn.functional
as
F
from
vllm.model_executor.utils
import
set_random_seed
from
vllm.model_executor.layers.rejection_sampler
import
RejectionSampler
from
vllm.model_executor.layers.rejection_sampler
import
RejectionSampler
from
vllm.model_executor.utils
import
set_random_seed
CUDA_DEVICES
=
[
CUDA_DEVICES
=
[
f
"cuda:
{
i
}
"
for
i
in
range
(
1
if
torch
.
cuda
.
device_count
()
==
1
else
2
)
f
"cuda:
{
i
}
"
for
i
in
range
(
1
if
torch
.
cuda
.
device_count
()
==
1
else
2
)
...
...
tests/samplers/test_sampler.py
View file @
01bfb22b
import
random
import
random
from
typing
import
Tuple
,
List
from
typing
import
List
,
Optional
,
Tuple
from
unittest.mock
import
patch
from
unittest.mock
import
patch
import
pytest
import
pytest
import
torch
import
torch
from
transformers
import
GenerationConfig
,
GenerationMixin
from
transformers
import
GenerationConfig
,
GenerationMixin
from
typing
import
Optional
from
vllm.model_executor.layers.sampler
import
Sampler
from
vllm.model_executor.layers.sampler
import
Sampler
from
vllm.model_executor.utils
import
set_random_seed
from
vllm.model_executor.utils
import
set_random_seed
...
...
tests/samplers/test_seeded_generate.py
View file @
01bfb22b
...
@@ -8,8 +8,8 @@ from itertools import combinations
...
@@ -8,8 +8,8 @@ from itertools import combinations
import
pytest
import
pytest
from
vllm.model_executor.utils
import
set_random_seed
from
vllm
import
SamplingParams
from
vllm
import
SamplingParams
from
vllm.model_executor.utils
import
set_random_seed
MODEL
=
"facebook/opt-125m"
MODEL
=
"facebook/opt-125m"
RANDOM_SEEDS
=
list
(
range
(
5
))
RANDOM_SEEDS
=
list
(
range
(
5
))
...
...
tests/spec_decode/test_batch_expansion.py
View file @
01bfb22b
import
torch
import
pytest
import
pytest
import
torch
from
vllm.spec_decode.batch_expansion
import
BatchExpansionTop1Scorer
from
vllm.spec_decode.batch_expansion
import
BatchExpansionTop1Scorer
from
.utils
import
mock_worker
,
create_seq_group_metadata_from_prompts
from
.utils
import
create_seq_group_metadata_from_prompts
,
mock_worker
@
pytest
.
mark
.
parametrize
(
'num_target_seq_ids'
,
[
100
])
@
pytest
.
mark
.
parametrize
(
'num_target_seq_ids'
,
[
100
])
...
...
tests/spec_decode/test_metrics.py
View file @
01bfb22b
import
torch
import
math
import
math
import
pytest
from
unittest.mock
import
MagicMock
from
unittest.mock
import
MagicMock
import
pytest
import
torch
from
vllm.spec_decode.metrics
import
AsyncMetricsCollector
from
vllm.spec_decode.metrics
import
AsyncMetricsCollector
...
...
tests/spec_decode/test_multi_step_worker.py
View file @
01bfb22b
import
torch
import
random
import
random
import
pytest
from
unittest.mock
import
MagicMock
from
unittest.mock
import
MagicMock
from
vllm.spec_decode.multi_step_worker
import
(
MultiStepWorker
,
import
pytest
DraftModelTop1Proposer
)
import
torch
from
vllm.worker.worker
import
Worker
from
vllm.model_executor.utils
import
set_random_seed
from
vllm.model_executor.utils
import
set_random_seed
from
vllm.sequence
import
SamplerOutput
from
vllm.sequence
import
SamplerOutput
from
vllm.spec_decode.multi_step_worker
import
(
DraftModelTop1Proposer
,
MultiStepWorker
)
from
vllm.worker.worker
import
Worker
from
.utils
import
(
create_execute_model_data
,
create_
worker
,
from
.utils
import
(
assert_logprobs_dict_allclose
,
create_
batch
,
create_
seq_group_metadata_from_prompts
,
zero_kv_cache
,
create_
execute_model_data
,
patch_execute_model_with_seeds
,
create_seq_group_metadata_from_prompts
,
create_worker
,
assert_logprobs_dict_allclose
,
create_bat
ch
)
patch_execute_model_with_seeds
,
zero_kv_ca
ch
e
)
@
pytest
.
mark
.
parametrize
(
'num_steps'
,
list
(
range
(
1
,
17
)))
@
pytest
.
mark
.
parametrize
(
'num_steps'
,
list
(
range
(
1
,
17
)))
...
...
tests/spec_decode/test_spec_decode_worker.py
View file @
01bfb22b
import
torch
import
random
import
random
import
pytest
from
unittest.mock
import
MagicMock
from
unittest.mock
import
MagicMock
import
pytest
import
torch
from
vllm.model_executor.layers.rejection_sampler
import
RejectionSampler
from
vllm.model_executor.utils
import
set_random_seed
from
vllm.spec_decode.interfaces
import
SpeculativeProposals
from
vllm.spec_decode.metrics
import
(
AsyncMetricsCollector
,
SpecDecodeWorkerMetrics
)
from
vllm.spec_decode.multi_step_worker
import
MultiStepWorker
from
vllm.spec_decode.multi_step_worker
import
MultiStepWorker
from
vllm.spec_decode.spec_decode_worker
import
(
SpecDecodeWorker
,
from
vllm.spec_decode.spec_decode_worker
import
(
SpecDecodeWorker
,
split_num_cache_blocks_evenly
)
split_num_cache_blocks_evenly
)
from
vllm.spec_decode.interfaces
import
SpeculativeProposals
from
vllm.model_executor.utils
import
set_random_seed
from
.utils
import
(
ExecuteModelData
,
create_batch
,
create_sampler_output_list
,
from
vllm.model_executor.layers.rejection_sampler
import
RejectionSampler
mock_worker
)
from
.utils
import
(
mock_worker
,
create_batch
,
ExecuteModelData
,
create_sampler_output_list
)
from
vllm.spec_decode.metrics
import
(
SpecDecodeWorkerMetrics
,
AsyncMetricsCollector
)
@
pytest
.
mark
.
parametrize
(
'k'
,
[
1
,
2
,
6
])
@
pytest
.
mark
.
parametrize
(
'k'
,
[
1
,
2
,
6
])
...
...
tests/spec_decode/test_utils.py
View file @
01bfb22b
from
vllm.spec_decode.util
import
get_all_seq_ids
from
unittest.mock
import
MagicMock
from
vllm.sequence
import
SequenceGroupMetadata
from
vllm.spec_decode.util
import
split_batch_by_proposal_len
import
pytest
import
pytest
from
unittest.mock
import
MagicMock
from
vllm.sequence
import
SequenceGroupMetadata
from
vllm.spec_decode.util
import
get_all_seq_ids
,
split_batch_by_proposal_len
def
test_get_all_seq_ids
():
def
test_get_all_seq_ids
():
...
...
tests/spec_decode/utils.py
View file @
01bfb22b
import
torch
from
dataclasses
import
dataclass
,
fields
from
typing
import
List
,
Optional
,
Dict
,
Iterable
,
Union
from
itertools
import
count
from
typing
import
Dict
,
Iterable
,
List
,
Optional
,
Union
from
unittest.mock
import
MagicMock
from
unittest.mock
import
MagicMock
from
vllm.worker.worker
import
W
or
ker
import
t
or
ch
from
vllm.utils
import
get_distributed_init_method
,
get_ip
,
get_open_port
from
vllm.engine.arg_utils
import
EngineArgs
from
vllm.engine.arg_utils
import
EngineArgs
from
vllm.sequence
import
(
Logprob
,
SequenceGroupMetadata
,
SequenceData
,
from
vllm.model_executor.utils
import
set_random_seed
SamplerOutput
,
SequenceGroupOutput
,
SequenceOutput
)
from
vllm.sampling_params
import
SamplingParams
from
vllm.sampling_params
import
SamplingParams
from
vllm.sequence
import
(
Logprob
,
SamplerOutput
,
SequenceData
,
SequenceGroupMetadata
,
SequenceGroupOutput
,
SequenceOutput
)
from
vllm.utils
import
get_distributed_init_method
,
get_ip
,
get_open_port
from
vllm.worker.cache_engine
import
CacheEngine
from
vllm.worker.cache_engine
import
CacheEngine
from
vllm.model_executor.utils
import
set_random_seed
from
vllm.worker.worker
import
Worker
from
itertools
import
count
from
dataclasses
import
dataclass
,
fields
@
dataclass
@
dataclass
...
...
tests/test_cache_block_hashing.py
View file @
01bfb22b
...
@@ -7,8 +7,8 @@ from typing import List, Optional
...
@@ -7,8 +7,8 @@ from typing import List, Optional
import
pytest
import
pytest
from
vllm.lora.request
import
LoRARequest
from
vllm.lora.request
import
LoRARequest
from
vllm.transformers_utils.tokenizer_group
import
TokenizerGroup
from
vllm.sequence
import
Sequence
from
vllm.sequence
import
Sequence
from
vllm.transformers_utils.tokenizer_group
import
TokenizerGroup
# Make two prefixes with different first blocks.
# Make two prefixes with different first blocks.
prefix_start
=
[(
"You are an expert"
),
(
"You are a"
)]
prefix_start
=
[(
"You are an expert"
),
(
"You are a"
)]
...
...
tests/test_sequence.py
View file @
01bfb22b
import
pytest
import
pytest
from
vllm.sequence
import
S
equenceGroupOutput
,
Sampler
Output
,
SequenceOutput
from
vllm.sequence
import
S
amplerOutput
,
SequenceGroup
Output
,
SequenceOutput
@
pytest
.
fixture
@
pytest
.
fixture
...
...
tests/tokenization/test_cached_tokenizer.py
View file @
01bfb22b
from
copy
import
deepcopy
from
copy
import
deepcopy
from
vllm.transformers_utils.tokenizer
import
get_cached_tokenizer
from
transformers
import
AutoTokenizer
from
transformers
import
AutoTokenizer
from
vllm.transformers_utils.tokenizer
import
get_cached_tokenizer
def
test_cached_tokenizer
():
def
test_cached_tokenizer
():
reference_tokenizer
=
AutoTokenizer
.
from_pretrained
(
"gpt2"
)
reference_tokenizer
=
AutoTokenizer
.
from_pretrained
(
"gpt2"
)
...
...
tests/tokenization/test_detokenize.py
View file @
01bfb22b
import
pyte
st
from
typing
import
Dict
,
Li
st
import
pytest
from
transformers
import
AutoTokenizer
from
transformers
import
AutoTokenizer
from
typing
import
List
,
Dict
from
vllm.sequence
import
Sequence
,
Logprob
,
SamplingParams
,
SequenceGroup
from
vllm.sequence
import
Logprob
,
SamplingParams
,
Sequence
,
SequenceGroup
from
vllm.transformers_utils.tokenizer_group
import
get_tokenizer_group
from
vllm.transformers_utils.tokenizer
import
detokenize_incrementally
from
vllm.transformers_utils.detokenizer
import
Detokenizer
from
vllm.transformers_utils.detokenizer
import
Detokenizer
from
vllm.transformers_utils.tokenizer
import
detokenize_incrementally
from
vllm.transformers_utils.tokenizer_group
import
get_tokenizer_group
TRUTH
=
[
TRUTH
=
[
"Hello here, this is a simple test"
,
"Hello here, this is a simple test"
,
...
...
tests/tokenization/test_tokenizer_group.py
View file @
01bfb22b
import
os
import
pytest
import
asyncio
import
asyncio
import
os
from
unittest.mock
import
patch
from
unittest.mock
import
patch
import
pytest
from
transformers
import
AutoTokenizer
,
PreTrainedTokenizerBase
from
transformers
import
AutoTokenizer
,
PreTrainedTokenizerBase
from
vllm.transformers_utils.tokenizer_group
import
get_tokenizer_group
from
vllm.transformers_utils.tokenizer_group
import
get_tokenizer_group
from
vllm.transformers_utils.tokenizer_group.ray_tokenizer_group
import
(
from
vllm.transformers_utils.tokenizer_group.ray_tokenizer_group
import
(
RayTokenizerGroupPool
)
RayTokenizerGroupPool
)
from
vllm.transformers_utils.tokenizer_group.tokenizer_group
import
(
from
vllm.transformers_utils.tokenizer_group.tokenizer_group
import
(
TokenizerGroup
)
TokenizerGroup
)
from
..conftest
import
get_tokenizer_pool_config
from
..conftest
import
get_tokenizer_pool_config
...
...
tests/worker/test_swap.py
View file @
01bfb22b
import
torch
import
torch
from
vllm.engine.arg_utils
import
EngineArgs
from
vllm.engine.arg_utils
import
EngineArgs
from
vllm.worker.worker
import
Worker
from
vllm.utils
import
get_distributed_init_method
,
get_ip
,
get_open_port
from
vllm.utils
import
get_distributed_init_method
,
get_ip
,
get_open_port
from
vllm.worker.worker
import
Worker
def
test_swap
()
->
None
:
def
test_swap
()
->
None
:
...
...
Prev
1
2
3
4
5
6
7
8
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment