# Python dependencies in pip requirements format: one requirement per line.
# Each entry sets a minimum version only (`>=`); no upper bounds are pinned.

# NOTE(review): this first group had no heading in the original; it looks like
# the core model / training stack — confirm and rename if needed.
torch>=2.0.0
transformers>=4.40.0
peft>=0.10.0
accelerate>=0.27.0
datasets>=2.18.0
tokenizers>=0.15.0

# RL
gymnasium>=0.29.0
stable-baselines3>=2.2.0

# LLM API
openai>=1.20.0
anthropic>=0.25.0
dashscope>=1.18.0

# Experiment tracking
wandb>=0.16.0

# Data processing
pandas>=2.0.0
numpy>=1.24.0
scikit-learn>=1.3.0
tqdm>=4.66.0

# Evaluation
scipy>=1.11.0

# Config
pyyaml>=6.0
omegaconf>=2.3.0

# Utilities
jsonlines>=4.0.0
rich>=13.0.0