Sync with C-RADIOv2-VLM-H-RC3 (#2)
Browse files
- Sync with nvidia/C-RADIOv2-VLM-H-RC3 (a1fc2a754c7ce39bee9f0f1ebdf1ea32dc0f5ff8)
- Update README for release (581f0a8268fb26143fe249849e3f61b53c33a695)
- Remove custom load_state_dict (fe079c89a3bc7b68fb3ede1163d3c90c8679fef9)
- README.md +4 -2
- config.json +12 -2
- model.safetensors +1 -1
README.md
CHANGED
|
@@ -6,6 +6,8 @@ license_link: https://developer.download.nvidia.com/licenses/nvidia-open-model-l
|
|
| 6 |
|
| 7 |
# Model Overview
|
| 8 |
|
|
|
|
|
|
|
| 9 |
## Description
|
| 10 |
|
| 11 |
This model performs visual feature extraction.
|
|
@@ -78,7 +80,7 @@ import torch
|
|
| 78 |
from PIL import Image
|
| 79 |
from transformers import AutoModel, CLIPImageProcessor
|
| 80 |
|
| 81 |
-
hf_repo = "nvidia/C-RADIOv2-H"
|
| 82 |
|
| 83 |
image_processor = CLIPImageProcessor.from_pretrained(hf_repo)
|
| 84 |
model = AutoModel.from_pretrained(hf_repo, trust_remote_code=True)
|
|
@@ -224,4 +226,4 @@ Field | Response
|
|
| 224 |
Model Application(s): | Generation of visual embeddings
|
| 225 |
Describe the life critical impact (if present). | Not Applicable
|
| 226 |
Use Case Restrictions: | Abide by NVIDIA Open Model License Agreement
|
| 227 |
-
Model and dataset restrictions: | The Principle of least privilege (PoLP) is applied, limiting access for dataset generation and model development. Restrictions enforce dataset access during training, and dataset license constraints are adhered to.
|
|
|
|
| 6 |
|
| 7 |
# Model Overview
|
| 8 |
|
| 9 |
+
[[**Github**](https://github.com/NVlabs/RADIO)] [[**CVPR 2025**](https://arxiv.org/abs/2412.07679)] [[**CVPR 2024**](https://arxiv.org/abs/2312.06709)]
|
| 10 |
+
|
| 11 |
## Description
|
| 12 |
|
| 13 |
This model performs visual feature extraction.
|
|
|
|
| 80 |
from PIL import Image
|
| 81 |
from transformers import AutoModel, CLIPImageProcessor
|
| 82 |
|
| 83 |
+
hf_repo = "nvidia/C-RADIOv2-VLM-H"
|
| 84 |
|
| 85 |
image_processor = CLIPImageProcessor.from_pretrained(hf_repo)
|
| 86 |
model = AutoModel.from_pretrained(hf_repo, trust_remote_code=True)
|
|
|
|
| 226 |
Model Application(s): | Generation of visual embeddings
|
| 227 |
Describe the life critical impact (if present). | Not Applicable
|
| 228 |
Use Case Restrictions: | Abide by NVIDIA Open Model License Agreement
|
| 229 |
+
Model and dataset restrictions: | The Principle of least privilege (PoLP) is applied, limiting access for dataset generation and model development. Restrictions enforce dataset access during training, and dataset license constraints are adhered to.
|
config.json
CHANGED
|
@@ -16,7 +16,7 @@
|
|
| 16 |
"cache_dir": null,
|
| 17 |
"channels_last": false,
|
| 18 |
"checkpoint_hist": 10,
|
| 19 |
-
"chk_keep_forever":
|
| 20 |
"class_map": "",
|
| 21 |
"clip_grad": null,
|
| 22 |
"clip_mode": "norm",
|
|
@@ -31,6 +31,7 @@
|
|
| 31 |
"crop_pct": null,
|
| 32 |
"cutmix": 0.0,
|
| 33 |
"cutmix_minmax": null,
|
|
|
|
| 34 |
"dataset_download": false,
|
| 35 |
"debug_full_knn": false,
|
| 36 |
"decay_epochs": 90,
|
|
@@ -64,7 +65,7 @@
|
|
| 64 |
"force_new_wandb_id": false,
|
| 65 |
"force_spectral_reparam": true,
|
| 66 |
"freeze_bn": false,
|
| 67 |
-
"fsdp":
|
| 68 |
"full_equivariance": false,
|
| 69 |
"fuser": "",
|
| 70 |
"gp": null,
|
|
@@ -169,6 +170,15 @@
|
|
| 169 |
"name": "siglip2-g",
|
| 170 |
"type": "siglip2",
|
| 171 |
"use_summary": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 172 |
}
|
| 173 |
],
|
| 174 |
"torchcompile": null,
|
|
|
|
| 16 |
"cache_dir": null,
|
| 17 |
"channels_last": false,
|
| 18 |
"checkpoint_hist": 10,
|
| 19 |
+
"chk_keep_forever": 100,
|
| 20 |
"class_map": "",
|
| 21 |
"clip_grad": null,
|
| 22 |
"clip_mode": "norm",
|
|
|
|
| 31 |
"crop_pct": null,
|
| 32 |
"cutmix": 0.0,
|
| 33 |
"cutmix_minmax": null,
|
| 34 |
+
"damp": null,
|
| 35 |
"dataset_download": false,
|
| 36 |
"debug_full_knn": false,
|
| 37 |
"decay_epochs": 90,
|
|
|
|
| 65 |
"force_new_wandb_id": false,
|
| 66 |
"force_spectral_reparam": true,
|
| 67 |
"freeze_bn": false,
|
| 68 |
+
"fsdp": false,
|
| 69 |
"full_equivariance": false,
|
| 70 |
"fuser": "",
|
| 71 |
"gp": null,
|
|
|
|
| 170 |
"name": "siglip2-g",
|
| 171 |
"type": "siglip2",
|
| 172 |
"use_summary": true
|
| 173 |
+
},
|
| 174 |
+
{
|
| 175 |
+
"fd_normalize": false,
|
| 176 |
+
"feature_distillation": true,
|
| 177 |
+
"input_size": 384,
|
| 178 |
+
"model": "siglip2-g-384",
|
| 179 |
+
"name": "siglip2-g-dirty",
|
| 180 |
+
"type": "siglip2",
|
| 181 |
+
"use_summary": false
|
| 182 |
}
|
| 183 |
],
|
| 184 |
"torchcompile": null,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2606616120
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96ff3bfec4f732d68a0c38c41a49de043abd2503df24481526ea87d26dd6a4f5
|
| 3 |
size 2606616120
|