Set use_cache to false
Files changed:
- README.md (+2 -10)
- config.json (+1 -1)
README.md

````diff
@@ -44,7 +44,7 @@ pip install -r requirements.txt
 
 Then you can enter the directory to run the following command.
 ```python
-from transformers import MllamaForConditionalGeneration, AutoProcessor, AutoConfig
+from transformers import MllamaForConditionalGeneration, AutoProcessor
 import torch
 from PIL import Image
 
@@ -64,17 +64,9 @@ model_name = "intfloat/mmE5-mllama-11b-instruct"
 
 # Load Processor and Model
 processor = AutoProcessor.from_pretrained(model_name)
-processor.tokenizer.padding_side = "right"
-
-config = AutoConfig.from_pretrained(model_name)
-if hasattr(config, 'use_cache'):
-    config.use_cache = False
-config.padding_side = "right"
 model = MllamaForConditionalGeneration.from_pretrained(
-    model_name,
-    torch_dtype=torch.bfloat16
+    model_name, torch_dtype=torch.bfloat16
 ).to("cuda")
-model.padding_side = "right"
 model.eval()
 
 # Image + Text -> Text
````
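For reference, the simplified loading code after this change, assembled from the two hunks above (the README lines between the hunks are unchanged and not repeated here):

```python
from transformers import MllamaForConditionalGeneration, AutoProcessor
import torch
from PIL import Image

model_name = "intfloat/mmE5-mllama-11b-instruct"

# Load Processor and Model; use_cache now comes from the shipped config.json,
# so the manual AutoConfig override and padding_side tweaks are no longer needed.
processor = AutoProcessor.from_pretrained(model_name)
model = MllamaForConditionalGeneration.from_pretrained(
    model_name, torch_dtype=torch.bfloat16
).to("cuda")
model.eval()
```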
config.json

```diff
@@ -96,7 +96,7 @@
     "torchscript": false,
     "typical_p": 1.0,
     "use_bfloat16": false,
-    "use_cache": true,
+    "use_cache": false,
     "vocab_size": 128256
   },
   "torch_dtype": "bfloat16",
```