@@ -173,9 +173,9 @@ def __init__(self,
173173 # thus being consistent with the fine-tuning stage
174174 # Note that the ssv2 we use is decoded to frames at 12 fps;
175175 # if decoded at 24 fps, the sample interval should be 4.
176- self .ssv2_skip_length = self . new_length * 2
176+ self .orig_new_step = new_step
177177 self .orig_skip_length = self .skip_length
178-
178+
179179 self .video_loader = get_video_loader ()
180180 self .image_loader = get_image_loader ()
181181
@@ -191,7 +191,8 @@ def __getitem__(self, index):
191191 try :
192192 video_name , start_idx , total_frame = self .clips [index ]
193193 self .skip_length = self .orig_skip_length
194-
194+ self .new_step = self .orig_new_step
195+
195196 if total_frame < 0 :
196197 decord_vr = self .video_loader (video_name )
197198 duration = len (decord_vr )
@@ -210,7 +211,8 @@ def __getitem__(self, index):
210211 else :
211212 # ssv2 & ava & other rawframe dataset
212213 if 'SomethingV2' in video_name :
213- self .skip_length = self .ssv2_skip_length
214+ self .new_step = 2
215+ self .skip_length = self .new_length * self .new_step
214216 fname_tmpl = self .ssv2_fname_tmpl
215217 elif 'AVA2.2' in video_name :
216218 fname_tmpl = self .ava_fname_tmpl
0 commit comments