|
50 | 50 | from vllm.sequence import IntermediateTensors, PoolerOutput |
51 | 51 |
|
52 | 52 | from .interfaces import SupportsLoRA, SupportsPP |
53 | | -from .utils import (AutoWeightsLoader, PPMissingLayer, is_pp_missing_parameter, |
| 53 | +from .utils import (AutoWeightsLoader, PPMissingLayer, WeightsMapper, |
| 54 | + is_pp_missing_parameter, |
54 | 55 | make_empty_intermediate_tensors_factory, make_layers, |
55 | 56 | maybe_prefix) |
56 | 57 |
|
@@ -585,8 +586,7 @@ def pooler( |
585 | 586 | ) -> Optional[PoolerOutput]: |
586 | 587 | return self._pooler(hidden_states, pooling_metadata) |
587 | 588 |
|
588 | | - def load_weights(self, weights: Iterable[Tuple[str, |
589 | | - torch.Tensor]]) -> Set[str]: |
590 | | - loader = AutoWeightsLoader(self, |
591 | | - ignore_unexpected_prefixes=["lm_head."]) |
592 | | - return loader.load_weights(weights) |
| 589 | + def load_weights(self, weights: Iterable[Tuple[str, torch.Tensor]]): |
| 590 | + hf_to_vllm_mapper = WeightsMapper(orig_to_new_prefix={"model.": ""}) |
| 591 | + weights = hf_to_vllm_mapper.apply(weights) |
| 592 | + self.model.load_weights(weights) |
0 commit comments