Skip to content

Commit 466acdc

Browse files
register dino v3 presets (#2463)
1 parent 5d0c852 commit 466acdc

File tree

2 files changed

+91
-2
lines changed

2 files changed

+91
-2
lines changed
Lines changed: 90 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,93 @@
11
"""DINOV3 model preset configurations."""
22

33
# Metadata for loading pretrained model weights.
4-
backbone_presets = {}
4+
backbone_presets = {
5+
"dinov3_vit_small_lvd1689m": {
6+
"metadata": {
7+
"description": (
8+
"Vision Transformer (small-sized model) trained on LVD-1689M "
9+
"using DINOv3."
10+
),
11+
"params": 21_600_000,
12+
"path": "dinov3",
13+
},
14+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_small_lvd1689m/1",
15+
},
16+
"dinov3_vit_small_plus_lvd1689m": {
17+
"metadata": {
18+
"description": (
19+
"Vision Transformer (small-plus-sized model) trained on "
20+
"LVD-1689M using DINOv3."
21+
),
22+
"params": 29_000_000,
23+
"path": "dinov3",
24+
},
25+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_small_plus_lvd1689m/1",
26+
},
27+
"dinov3_vit_base_lvd1689m": {
28+
"metadata": {
29+
"description": (
30+
"Vision Transformer (base-sized model) trained on LVD-1689M "
31+
"using DINOv3."
32+
),
33+
"params": 86_000_000,
34+
"path": "dinov3",
35+
},
36+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_base_lvd1689m/1",
37+
},
38+
"dinov3_vit_large_lvd1689m": {
39+
"metadata": {
40+
"description": (
41+
"Vision Transformer (large-sized model) trained on LVD-1689M "
42+
"using DINOv3."
43+
),
44+
"params": 300_000_000,
45+
"path": "dinov3",
46+
},
47+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_large_lvd1689m/1",
48+
},
49+
"dinov3_vit_huge_plus_lvd1689m": {
50+
"metadata": {
51+
"description": (
52+
"Vision Transformer (huge-plus-sized model) trained on "
53+
"LVD-1689M using DINOv3."
54+
),
55+
"params": 840_000_000,
56+
"path": "dinov3",
57+
},
58+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_huge_plus_lvd1689m/1",
59+
},
60+
"dinov3_vit_7b_lvd1689m": {
61+
"metadata": {
62+
"description": (
63+
"Vision Transformer (7B-sized model) trained on LVD-1689M "
64+
"using DINOv3."
65+
),
66+
"params": 6_700_000_000,
67+
"path": "dinov3",
68+
},
69+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_7b_lvd1689m/1",
70+
},
71+
"dinov3_vit_large_sat493m": {
72+
"metadata": {
73+
"description": (
74+
"Vision Transformer (large-sized model) trained on SAT-493M "
75+
"using DINOv3."
76+
),
77+
"params": 300_000_000,
78+
"path": "dinov3",
79+
},
80+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_large_sat493m/1",
81+
},
82+
"dinov3_vit_7b_sat493m": {
83+
"metadata": {
84+
"description": (
85+
"Vision Transformer (7B-sized model) trained on SAT-493M "
86+
"using DINOv3."
87+
),
88+
"params": 6_700_000_000,
89+
"path": "dinov3",
90+
},
91+
"kaggle_handle": "kaggle://keras/dinov3/keras/dinov3_vit_7b_sat493m/1",
92+
},
93+
}

tools/checkpoint_conversion/convert_dinov3_checkpoints.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -115,7 +115,7 @@ def validate_output(
115115
hf_outputs = hf_outputs[0].detach().cpu().numpy()
116116

117117
# Call with keras.
118-
keras_outputs = keras_hub_model.predict({"images": images}, verbose=0)
118+
keras_outputs = keras_hub_model.predict({"pixel_values": images}, verbose=0)
119119
keras_outputs = keras.ops.convert_to_numpy(keras_outputs)
120120

121121
print("🔶 Keras output:", keras_outputs[0, 0, :10])

0 commit comments

Comments
 (0)