From 7cb2892bb441aaddbc88e90ff8314e5e6c2d8f8c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Szymon=20O=C5=BC=C3=B3g?= <58388001+SzymonOzog@users.noreply.github.com> Date: Thu, 6 Feb 2025 16:29:53 +0100 Subject: [PATCH 1/2] Missing quant_config in deepseek embedding layer Signed-off-by: SzymonOzog --- vllm/model_executor/models/deepseek_v2.py | 1 + 1 file changed, 1 insertion(+) diff --git a/vllm/model_executor/models/deepseek_v2.py b/vllm/model_executor/models/deepseek_v2.py index 773f5abe71da..fb49c91cef7e 100644 --- a/vllm/model_executor/models/deepseek_v2.py +++ b/vllm/model_executor/models/deepseek_v2.py @@ -592,6 +592,7 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""): self.embed_tokens = VocabParallelEmbedding( config.vocab_size, config.hidden_size, + quant_config=quant_config, ) else: self.embed_tokens = PPMissingLayer() From 27b8c884ea01b639af4222327ef643afe2902133 Mon Sep 17 00:00:00 2001 From: SzymonOzog Date: Thu, 6 Feb 2025 19:04:10 +0100 Subject: [PATCH 2/2] Accept changes Signed-off-by: SzymonOzog --- vllm/model_executor/models/deepseek_v2.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/vllm/model_executor/models/deepseek_v2.py b/vllm/model_executor/models/deepseek_v2.py index fb49c91cef7e..fb6725c9abc3 100644 --- a/vllm/model_executor/models/deepseek_v2.py +++ b/vllm/model_executor/models/deepseek_v2.py @@ -593,7 +593,7 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""): config.vocab_size, config.hidden_size, quant_config=quant_config, - ) + prefix=f"{prefix}.embed_tokens") else: self.embed_tokens = PPMissingLayer()