diff --git a/vllm/model_executor/models/minicpm.py b/vllm/model_executor/models/minicpm.py index d99ae81468a9..0397b552ce9f 100644 --- a/vllm/model_executor/models/minicpm.py +++ b/vllm/model_executor/models/minicpm.py @@ -242,9 +242,6 @@ def __init__( base=rope_theta, rope_scaling=rope_scaling, ) - # set rope as fp32 instead of bf16 - self.rotary_emb.cos_sin_cache = self.rotary_emb._compute_cos_sin_cache( - ) self.attn = Attention(self.num_heads, self.head_dim, self.scaling,