# Python package dependencies (pip requirements format).
# Entries without a version specifier accept any released version.
torch>=1.8.1
# torchvision 0.9.1 is the release paired with torch 1.8.1. The previous
# floor (0.8.9) was never published, so it effectively meant ">=0.9.0",
# and 0.9.0 itself requires torch 1.8.0, which the torch floor above excludes.
torchvision>=0.9.1
tqdm>=2
scikit-learn<2,>=1.0
open_clip_torch>=0.2.1
pycocoevalcap
webdataset>=0.2.31
transformers
