We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c90a6d3, commit 7ada9aa (Copy full SHA for 7ada9aa)
vllm_ascend/worker/model_runner_v1.py
@@ -2525,10 +2525,7 @@ def load_model(self) -> None:
2525
self.model.get_eagle3_aux_hidden_state_layers())
2526
2527
if self.lora_config:
2528
- self.model = self.load_lora_model(self.model,
2529
- self.model_config,
2530
- self.scheduler_config,
2531
- self.lora_config,
+ self.model = self.load_lora_model(self.model, self.vllm_config,
2532
self.device)
2533
logger.info("Loading model weights took %.4f GB",
2534
m.consumed_memory / float(2**30))
0 commit comments