remove copying mixtral weights to CLANG first (#3792)

Loading the weights directly to the target device seems fine without the intermediate CLANG copy now.
This commit is contained in:
chenyu
2024-03-17 23:33:17 -04:00
committed by GitHub
parent bf3e1c4df2
commit dccefab23f

View File

@@ -42,8 +42,7 @@ if __name__ == "__main__":
else:
device = Device.DEFAULT
t.set_description(f"ram used: {GlobalCounters.mem_used/1e9:5.2f} GB, loading {k} to {device}")
# NOTE: we have to copy through CLANG to avoid the HIP hang bug when copying directly from the DISK
model_state_dict[k].replace(state[k].to("CLANG").contiguous().to(device).half()).realize()
model_state_dict[k].replace(state[k].to(device).half()).realize()
if CI: print(f"ram used: {GlobalCounters.mem_used/1e9:5.2f} GB")
from sentencepiece import SentencePieceProcessor