Update README.md
README.md CHANGED
@@ -1,13 +1,17 @@
 ---
 license: apache-2.0
 tags:
-
-
-
-
+- math
+- rl
+- qwen3
+- dapomath17k
 library_name: transformers
 pipeline_tag: text-generation
 language: en
+datasets:
+- BytedTsinghua-SIA/DAPO-Math-17k
+base_model:
+- Qwen/Qwen3-8B-Base
 ---
 # DAPO RL Checkpoint - Step 0
 
@@ -58,4 +62,4 @@ prompt = tokenizer.apply_chat_template(
 
 inputs = tokenizer(prompt, return_tensors="pt")
 outputs = model.generate(**inputs, max_new_tokens=256)
-print(tokenizer.decode(outputs[0], skip_special_tokens=True))
+print(tokenizer.decode(outputs[0], skip_special_tokens=True))
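The second hunk shows only the tail of the README's inference example (its header indicates the snippet begins with `tokenizer.apply_chat_template(`). Below is a minimal sketch of that flow for context; the repo id and the example message are placeholders, not taken from the diff.

```python
# Sketch of the inference snippet excerpted in the second hunk.
# The repo id below is a placeholder assumption; substitute the actual
# model repository this commit belongs to.
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "your-org/dapo-rl-checkpoint-step-0"  # placeholder, not from the diff

tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id)

# Build a chat-formatted prompt; the hunk header shows the README uses
# tokenizer.apply_chat_template(...) for this step. The message is illustrative.
messages = [{"role": "user", "content": "Solve: what is 17 * 24?"}]
prompt = tokenizer.apply_chat_template(
    messages, tokenize=False, add_generation_prompt=True
)

# The last three lines mirror the snippet visible in the diff.
inputs = tokenizer(prompt, return_tensors="pt")
outputs = model.generate(**inputs, max_new_tokens=256)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
```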