File tree Expand file tree Collapse file tree 1 file changed +16
-17
lines changed Expand file tree Collapse file tree 1 file changed +16
-17
lines changed Original file line number Diff line number Diff line change @@ -132,23 +132,22 @@ def test_models_distributed_DeepSeek_dbo():
132
132
def test_models_distributed_DeepSeek_w8a8_ep_dbo ():
133
133
example_prompts = ["The president of the United States is" ] * 100
134
134
sampling_params = SamplingParams (max_tokens = 100 , temperature = 0.0 )
135
- with VllmRunner (
136
- snapshot_download ("vllm-ascend/DeepSeek-V2-Lite-W8A8" ),
137
- dtype = "auto" ,
138
- quantization = "ascend" ,
139
- tensor_parallel_size = 4 ,
140
- enforce_eager = True ,
141
- enable_expert_parallel = True ,
142
- distributed_executor_backend = "mp" ,
143
- additional_config = {
144
- "ascend_scheduler_config" : {
145
- "enabled" : True ,
146
- },
147
- "torchair_graph_config" : {
148
- "enable" : True ,
149
- "enable_multistream_moe" : True
150
- }
151
- }) as vllm_model :
135
+ with VllmRunner (snapshot_download ("vllm-ascend/DeepSeek-V2-Lite-W8A8" ),
136
+ dtype = "auto" ,
137
+ quantization = "ascend" ,
138
+ tensor_parallel_size = 4 ,
139
+ enforce_eager = True ,
140
+ enable_expert_parallel = True ,
141
+ distributed_executor_backend = "mp" ,
142
+ additional_config = {
143
+ "ascend_scheduler_config" : {
144
+ "enabled" : True ,
145
+ },
146
+ "torchair_graph_config" : {
147
+ "enable" : True ,
148
+ "enable_multistream_moe" : True
149
+ }
150
+ }) as vllm_model :
152
151
model_arch = 'DeepseekV2ForCausalLM'
153
152
registed_models = ModelRegistry .models
154
153
assert registed_models [
You can’t perform that action at this time.
0 commit comments