# Python dependencies in pip requirements-file format: one requirement per line.
# Install with: pip install -r <this file>

# Packages with a minimum-version constraint.
vllm >= 0.2.1
transformers >= 4.34.0
# `datasets` is declared exactly once; a second, unversioned entry would be
# redundant with this constraint and can be rejected by pip as a duplicate.
datasets >= 2.14.6
torch >= 2.0.1

# Packages with no version constraint.
nltk
tqdm
sentencepiece  # annotated "0.1.97" by the author; presumably the version tested against -- TODO confirm
wandb
scikit-learn