# pip requirements file: one requirement specifier per line.
# Lines starting with '#' are comments and are ignored by pip.

# Core deep learning framework
torch>=2.0.0
torchvision
xformers

# Transformers ecosystem
transformers>=4.35.0
accelerate>=0.24.0
tokenizers
huggingface_hub

# Data processing
datasets>=2.14.0
numpy>=1.24.0
sentence-transformers
faiss-cpu

# Model fine-tuning and RLHF
peft>=0.9.0
trl[peft]>=0.7.10
bitsandbytes>=0.41.0

# Image generation
diffusers
invisible_watermark

# Data annotation
label-studio

# API and network requests
flickrapi
requests

# Experiment tracking and visualization
wandb>=0.15.0
tensorboard>=2.13.0

# Evaluation metrics
evaluate
sacrebleu
rouge-score

# System tools and monitoring
scipy
protobuf
sentencepiece
alive_progress
psutil
gpustat

# Advanced optimizers (optional)
# Labelled optional, but installed unconditionally because it is listed here.
deepspeed>=0.10.0

# RLHF-specific tools
# NOTE(review): confirm the PyPI distribution name; the RewardBench project
# may be published as `rewardbench` rather than `reward-bench` - TODO verify.
reward-bench