We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 376fba3 + 5ded17e, commit cdf12f3 (Copy full SHA for cdf12f3)
support_materials/1-inference/generate.py
@@ -122,7 +122,9 @@ def main(
122
print("load model")
123
load_model(
124
model,
125
- os.path.join(ckpt_path, f"model{rank}-mp{world_size}.safetensors"))
+ os.path.join(ckpt_path, f"model{rank}-mp{world_size}.safetensors"),
126
+ # use strict=False to fix the lm head dtype mismatch
127
+ strict=False)
128
print("I'm DeepSeek 👋")
129
130
if interactive:
0 commit comments