Update README: the example code now uses bfloat16 to reduce GPU memory usage
Browse files
README.md
CHANGED
@@ -124,7 +124,8 @@ import torch
|
|
124 |
from PIL import Image
|
125 |
from transformers import AutoModel, AutoTokenizer
|
126 |
|
127 |
-
model = AutoModel.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
|
|
128 |
tokenizer = AutoTokenizer.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
129 |
model.eval().cuda()
|
130 |
|
|
|
124 |
from PIL import Image
|
125 |
from transformers import AutoModel, AutoTokenizer
|
126 |
|
127 |
+
model = AutoModel.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
128 |
+
model = model.to(dtype=torch.bfloat16)
|
129 |
tokenizer = AutoTokenizer.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
130 |
model.eval().cuda()
|
131 |
|