We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f40031c · commit fbf82b0 · Copy full SHA for fbf82b0
1 file changed
docs/source/trl_integration.md
@@ -7,8 +7,8 @@ from datasets import Dataset
7
from trl import SFTConfig, SFTTrainer
8
9
# Create a small fake dataset
10
-prompts = ["What is the capital of France?", "Who wrote Hamlet?"] * 12
11
-completions = ["Paris.", "Shakespeare."] * 12
+prompts = ["The capital of France is", "Hamlet was written by"] * 12
+completions = [" Paris.", " Shakespeare."] * 12
12
dataset = Dataset.from_dict({"prompt": prompts, "completion": completions})
13
14
# Train a model using the TRL SFTTrainer API
0 commit comments