PyTorchVideo: galat "stack expects each tensor to be equal size, but got [89088] at entry 0 and [88064] at entry 1" (torch.stack mengharapkan setiap tensor berukuran sama, tetapi mendapat [89088] pada entri 0 dan [88064] pada entri 1)

# Fix: pass decode_audio=False when constructing val_dataset.
# NOTE(review): the mismatched 1-D sizes in the error ([89088] vs [88064])
# look like per-clip audio tracks of different lengths that cannot be stacked
# into a single batch -- confirm by inspecting the keys of one dataset sample.
# If that is the case, skipping audio decoding removes the unequal tensors.

# Before: decode_audio is not passed, so the Kinetics default is used
# (presumably True -- verify against the installed pytorchvideo version).
val_dataset = pytorchvideo.data.Kinetics(
  data_path=os.path.join(self._DATA_PATH, "val.csv"),
  clip_sampler=pytorchvideo.data.make_clip_sampler("uniform",
                                                   self._CLIP_DURATION),
  transform=val_transform
)

# After: identical call except for the explicit decode_audio=False.
val_dataset = pytorchvideo.data.Kinetics(
  data_path=os.path.join(self._DATA_PATH, "val.csv"),
  clip_sampler=pytorchvideo.data.make_clip_sampler("uniform", 
                                                   self._CLIP_DURATION),
  decode_audio=False,  # the only change relative to the "Before" call
  transform=val_transform
)
Jittery Jay