Update README: example code now uses bfloat16 to reduce GPU memory usage
Browse files
README.md
CHANGED
|
@@ -124,7 +124,8 @@ import torch
|
|
| 124 |
from PIL import Image
|
| 125 |
from transformers import AutoModel, AutoTokenizer
|
| 126 |
|
| 127 |
-
model = AutoModel.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
|
|
|
| 128 |
tokenizer = AutoTokenizer.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
| 129 |
model.eval().cuda()
|
| 130 |
|
|
|
|
| 124 |
from PIL import Image
|
| 125 |
from transformers import AutoModel, AutoTokenizer
|
| 126 |
|
| 127 |
+
model = AutoModel.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
| 128 |
+
model = model.to(dtype=torch.bfloat16)
|
| 129 |
tokenizer = AutoTokenizer.from_pretrained('openbmb/MiniCPM-V', trust_remote_code=True)
|
| 130 |
model.eval().cuda()
|
| 131 |
|