absl-py<3.0.0,>=2.0.0
comment_parser
cosmos-xenna==0.1.2
fsspec
jieba==0.42.1
loguru
mecab-python3
pandas>=2.1.0
pyarrow
ray[data,default]>=2.49
torch
transformers==4.55.2

[all]
nemo_curator[audio_cuda12]
nemo_curator[image_cuda12]
nemo_curator[text_cuda12]
nemo_curator[video_cuda12]

[audio_cpu]
nemo_toolkit[asr]==2.4.0

[audio_cuda12]
nemo_curator[audio_cpu]
nemo_curator[cuda12]

[cuda12]
gpustat
pynvml

[deduplication_cuda12]
cudf-cu12==25.6.*
cugraph-cu12==25.6.*
cuml-cu12==25.6.*
nx-cugraph-cu12==25.6.*
pylibraft-cu12==25.6.*
raft-dask-cu12==25.6.*
rapidsmpf-cu12==25.6.*

[image_cpu]
torchvision

[image_cuda12]
nemo_curator[image_cpu]
nemo_curator[cuda12]
nemo_curator[deduplication_cuda12]
nvidia-dali-cuda120

[text_cpu]
beautifulsoup4
justext
lxml
pycld2
resiliparse
s5cmd
trafilatura==2.0.0
warcio
fasttext==0.9.3
sentencepiece
mwparserfromhell==0.6.5
peft
ftfy==6.1.1

[text_cuda12]
nemo_curator[cuda12]
nemo_curator[deduplication_cuda12]
nemo_curator[text_cpu]

[video_cpu]
av==13.1.0
opencv-python
torchvision
einops
easydict

[video_cuda12]
nemo_curator[video_cpu]
nemo_curator[cuda12]
cvcuda_cu12
pycuda
torch<=2.8.0
torchaudio

[video_cuda12:platform_machine == "x86_64" and platform_system != "Darwin"]
flash-attn<=2.8.3
PyNvVideoCodec==2.0.2
vllm==0.10.2
