# Python package requirements in pip requirements-file format
# (one requirement specifier per line).
#
# Every entry except duckdb declares only a minimum version (">="), so a
# fresh install may resolve to any newer release of those packages.

# duckdb is the only exact pin ("==") in this file.
# NOTE(review): the reason for the exact pin is not recorded here — confirm
# before relaxing or bumping it.
duckdb==0.8.0
gensim>=4.1.2
numpy>=1.21.5
pandas>=1.4.4
polars>=0.19.8
pyarrow>=14.0.1
tokenizers>=0.13.3
transformers>=4.29.2
datasets>=2.12.0
