mirror of
https://github.com/OpenBMB/MiniCPM-V.git
synced 2026-02-05 02:09:20 +08:00
Combine the dtype and device settings into the from_pretrained call to save CPU memory
This commit is contained in:
@@ -31,8 +31,7 @@ if 'int4' in model_path:
|
||||
exit()
|
||||
model = AutoModel.from_pretrained(model_path, trust_remote_code=True)
|
||||
else:
|
||||
model = AutoModel.from_pretrained(model_path, trust_remote_code=True).to(dtype=torch.float16)
|
||||
model = model.to(device=device)
|
||||
model = AutoModel.from_pretrained(model_path, trust_remote_code=True, torch_dtype=torch.float16, device_map=device)
|
||||
tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
|
||||
model.eval()
|
||||
|
||||
|
||||
Reference in New Issue
Block a user