Update README.md
README.md (CHANGED)
````diff
@@ -30,16 +30,18 @@ cd unicom/mlcd
 
 ```python
 from vit_rope2d_hf import MLCDVisionModel
-from transformers import
+from transformers import CLIPImageProcessor
 from PIL import Image
+import requests
 import torch
 
 # Load model and processor
 model = MLCDVisionModel.from_pretrained("DeepGlint-AI/mlcd-vit-bigG-patch14-336")
-processor =
+processor = CLIPImageProcessor.from_pretrained("DeepGlint-AI/mlcd-vit-bigG-patch14-336")
 
 # Process single image
-
+url = "http://images.cocodataset.org/val2017/000000039769.jpg"
+image = Image.open(requests.get(url, stream=True).raw)
 inputs = processor(images=image, return_tensors="pt")
 
 # Get visual features
@@ -48,4 +50,5 @@ with torch.no_grad():
 features = outputs.last_hidden_state
 
 print(f"Extracted features shape: {features.shape}")
+# Extracted features shape: torch.Size([1, 577, 1664])
 ```
````
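
For convenience, here is the updated snippet assembled into one self-contained script. The `with torch.no_grad():` line is confirmed by the second hunk's context header, but the `outputs = model(**inputs)` call is an inferred reconstruction of unchanged lines the diff does not show, so treat it as a sketch rather than a verbatim copy of the README.

```python
from vit_rope2d_hf import MLCDVisionModel
from transformers import CLIPImageProcessor
from PIL import Image
import requests
import torch

# Load model and processor
model = MLCDVisionModel.from_pretrained("DeepGlint-AI/mlcd-vit-bigG-patch14-336")
processor = CLIPImageProcessor.from_pretrained("DeepGlint-AI/mlcd-vit-bigG-patch14-336")

# Process single image
url = "http://images.cocodataset.org/val2017/000000039769.jpg"
image = Image.open(requests.get(url, stream=True).raw)
inputs = processor(images=image, return_tensors="pt")

# Get visual features (forward pass inferred from the diff's unchanged context)
with torch.no_grad():
    outputs = model(**inputs)
features = outputs.last_hidden_state

print(f"Extracted features shape: {features.shape}")
# Extracted features shape: torch.Size([1, 577, 1664])
```

The printed shape is consistent with the model name: a 336×336 input at patch size 14 gives 24×24 = 576 patch tokens plus one class token (577 in total), each with the ViT-bigG hidden size of 1664.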