@@ -19,22 +19,26 @@ def setUp(self):
19
19
"layer_scale_init_value" : 1.0 ,
20
20
"num_register_tokens" : 0 ,
21
21
"use_swiglu_ffn" : False ,
22
- "image_shape" : (64 , 64 , 3 ),
22
+ "image_shape" : (70 , 70 , 3 ),
23
+ "name" : "dinov2_backbone" ,
23
24
}
24
25
self .input_data = {
25
- "images" : ops .ones ((2 , 64 , 64 , 3 )),
26
+ "images" : ops .ones ((2 , 70 , 70 , 3 )),
26
27
}
27
28
28
29
def test_backbone_basics (self ):
29
30
patch_size = self .init_kwargs ["patch_size" ]
30
31
image_size = self .init_kwargs ["image_shape" ][0 ]
31
32
hidden_dim = self .init_kwargs ["hidden_dim" ]
32
33
sequence_length = (image_size // patch_size ) ** 2 + 1
33
- self .run_backbone_test (
34
+ self .run_vision_backbone_test (
34
35
cls = DINOV2Backbone ,
35
36
init_kwargs = self .init_kwargs ,
36
37
input_data = self .input_data ,
37
38
expected_output_shape = (2 , sequence_length , hidden_dim ),
39
+ expected_pyramid_output_keys = ["Stem" , "Stage1" , "Stage2" ],
40
+ expected_pyramid_image_sizes = [(sequence_length , hidden_dim )] * 3 ,
41
+ run_data_format_check = False ,
38
42
)
39
43
40
44
@pytest .mark .large
@@ -107,10 +111,11 @@ def setUp(self):
107
111
"layer_scale_init_value" : 1.0 ,
108
112
"num_register_tokens" : 4 ,
109
113
"use_swiglu_ffn" : True ,
110
- "image_shape" : (64 , 64 , 3 ),
114
+ "image_shape" : (70 , 70 , 3 ),
115
+ "name" : "dinov2_backbone" ,
111
116
}
112
117
self .input_data = {
113
- "images" : ops .ones ((2 , 64 , 64 , 3 )),
118
+ "images" : ops .ones ((2 , 70 , 70 , 3 )),
114
119
}
115
120
116
121
def test_backbone_basics (self ):
@@ -121,11 +126,14 @@ def test_backbone_basics(self):
121
126
sequence_length = (
122
127
(image_size // patch_size ) ** 2 + 1 + num_register_tokens
123
128
)
124
- self .run_backbone_test (
129
+ self .run_vision_backbone_test (
125
130
cls = DINOV2Backbone ,
126
131
init_kwargs = self .init_kwargs ,
127
132
input_data = self .input_data ,
128
133
expected_output_shape = (2 , sequence_length , hidden_dim ),
134
+ expected_pyramid_output_keys = ["Stem" , "Stage1" , "Stage2" ],
135
+ expected_pyramid_image_sizes = [(sequence_length , hidden_dim )] * 3 ,
136
+ run_data_format_check = False ,
129
137
)
130
138
131
139
@pytest .mark .large
0 commit comments