From f1c2cc22d46a6976df3555391e667c7e61592fad Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Wed, 4 Feb 2026 18:59:35 -0600 Subject: Initial commit: RL floating-point noise project --- requirements.txt | 39 +++++++++++++++++++++++++++++++++++++++ 1 file changed, 39 insertions(+) create mode 100644 requirements.txt (limited to 'requirements.txt') diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..c108ec1 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,39 @@ +# RLVR Floating-Point Precision Experiment Dependencies +# Core ML frameworks +torch>=2.0.0 +transformers>=4.36.0 +accelerate>=0.25.0 + +# RL framework (VeRL) +# Install from source: pip install git+https://github.com/volcengine/verl.git +# verl + +# Inference +vllm>=0.2.0 + +# Numerical computation +numpy>=1.24.0 +scipy>=1.10.0 + +# Visualization +matplotlib>=3.7.0 + +# Progress tracking +tqdm>=4.65.0 + +# Data handling +datasets>=2.14.0 + +# Utilities +pyyaml>=6.0 +jsonlines>=3.1.0 + +# Distributed training (optional, usually comes with torch) +# torch-distributed + +# Flash attention (optional, for faster inference) +# flash-attn>=2.3.0 + +# Evaluation utilities +# eval-chemy # Math verifier (install from RLVR repo) + -- cgit v1.2.3