Merge pull request #206 from ByeongkiJeong/patch-1

Update inference_on_multiple_gpus.md
Cui Junbo
2024-06-04 22:27:15 +08:00
committed by GitHub


@@ -43,7 +43,7 @@ gpu_device_ids = [0, 1] # Define which gpu to use (now we have two GPUs, each ha
 no_split_module_classes = ["LlamaDecoderLayer"]
 max_memory = {
-    device_id: memory for device_id in gpu_device_ids
+    device_id: max_memory_each_gpu for device_id in gpu_device_ids
 }
 config = AutoConfig.from_pretrained(
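
The patch corrects the dictionary comprehension so that each GPU id is mapped to the previously defined `max_memory_each_gpu` variable; the old line referenced an undefined name `memory`. Below is a minimal sketch of how the corrected `max_memory` mapping is typically used with Hugging Face Accelerate to build a device map. The model repo name and the per-GPU memory budget are illustrative assumptions, not values taken from the patched document.

```python
from accelerate import infer_auto_device_map, init_empty_weights
from transformers import AutoConfig, AutoModel

gpu_device_ids = [0, 1]            # GPUs to shard the model across
max_memory_each_gpu = "20GiB"      # per-GPU memory budget (assumed value)
no_split_module_classes = ["LlamaDecoderLayer"]

# The fix: map each device id to max_memory_each_gpu
# (the old code referenced an undefined variable named `memory`).
max_memory = {
    device_id: max_memory_each_gpu for device_id in gpu_device_ids
}

# Model name is a hypothetical placeholder for this sketch.
config = AutoConfig.from_pretrained(
    "openbmb/MiniCPM-Llama3-V-2_5", trust_remote_code=True
)

# Instantiate the model skeleton on the meta device (no memory allocated),
# then let Accelerate infer how to split it across the listed GPUs.
with init_empty_weights():
    model = AutoModel.from_config(config, trust_remote_code=True)

device_map = infer_auto_device_map(
    model,
    max_memory=max_memory,
    no_split_module_classes=no_split_module_classes,
)
```

With the fix, every entry in `device_map` respects the same per-GPU memory cap instead of failing with a `NameError` on the undefined `memory` variable.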