diff --git a/quantize/bnb_quantize.py b/quantize/bnb_quantize.py index 643f213..205cd28 100644 --- a/quantize/bnb_quantize.py +++ b/quantize/bnb_quantize.py @@ -19,9 +19,9 @@ import GPUtil import os model_path = '/root/ld/ld_model_pretrained/MiniCPM-Llama3-V-2_5' # Model download path -device = 'cpu' # # Select GPU if available, otherwise CPU +device = 'cuda' # Select GPU if available, otherwise CPU save_path = '/root/ld/ld_model_pretrain/MiniCPM-Llama3-V-2_5_int4' # Quantized model save path -image_path = '/root/ld/ld_project/pull_request/MiniCPM-V/assets/airplane.jpeg' +image_path = './assets/airplane.jpeg' # Create a configuration object to specify quantization parameters quantization_config = BitsAndBytesConfig(