📝 Mixed up quiz correct answers in Chapter12/2.mdx #817

Status: Open · wants to merge 1 commit into base: main
26 changes: 13 additions & 13 deletions chapters/en/chapter12/2.mdx
@@ -166,15 +166,15 @@ In the next module, we'll get our hands dirty and dive into the DeepSeek R1 paper
 
 <Question
   choices={[
+    {
+      text: "It makes models generate text faster",
+      explain: "RLHF isn't primarily about improving generation speed."
+    },
     {
       text: "It helps align models with human preferences and values",
       explain: "Correct! RLHF uses human feedback to guide models toward more helpful, harmless, and aligned behavior.",
       correct: true
     },
-    {
-      text: "It makes models generate text faster",
-      explain: "RLHF isn't primarily about improving generation speed."
-    },
     {
       text: "It reduces the model's memory usage",
       explain: "RLHF doesn't focus on model efficiency or memory optimization."
@@ -186,18 +186,18 @@ In the next module, we'll get our hands dirty and dive into the DeepSeek R1 paper
 
 <Question
   choices={[
     {
-      text: "Generating words or choosing responses in a conversation",
-      explain: "Correct! For LLMs, actions typically involve text generation decisions.",
-      correct: true
-    },
-    {
       text: "Updating model weights",
       explain: "This is part of the training process, not an action in the RL context."
     },
     {
       text: "Processing input tokens",
       explain: "This is part of the model's operation, not an action in the RL context."
+    },
+    {
+      text: "Generating words or choosing responses in a conversation",
+      explain: "Correct! For LLMs, actions typically involve text generation decisions.",
+      correct: true
     }
   ]}
 />
@@ -226,15 +226,15 @@ In the next module, we'll get our hands dirty and dive into the DeepSeek R1 paper
 
 <Question
   choices={[
+    {
+      text: "A function that generates responses",
+      explain: "Rewards are feedback on response quality, not the generation process itself."
+    },
     {
       text: "A numerical score that measures the quality of a response",
       explain: "Correct! Rewards provide feedback on response quality, guiding the model toward desired behavior.",
       correct: true
     },
-    {
-      text: "A function that generates responses",
-      explain: "Rewards are feedback on response quality, not the generation process itself."
-    },
     {
       text: "A model that evaluates the quality of responses",
       explain: "Rewards are feedback on response quality, not an evaluation model."
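The PR reorders each question's choices by hand in the `.mdx` source so the correct answer no longer sits in the same position in every quiz. As an illustration only — this helper is hypothetical and is not part of the PR or the course tooling — the same "mix up the positions" step could be sketched in Python, treating each choice as a dict with the same `text` / `explain` / `correct` fields used by the `<Question choices={[...]} />` component:

```python
import random

def shuffle_choices(choices, seed=None):
    """Return a shuffled copy of a question's choices.

    Each choice is a dict shaped like the objects passed to the
    course's <Question choices={[...]} /> component: a "text" field,
    an "explain" field, and optionally "correct": True.
    """
    rng = random.Random(seed)  # seedable for reproducible ordering
    shuffled = list(choices)   # copy so the original list is untouched
    rng.shuffle(shuffled)
    return shuffled

# Choices from the first quiz in this diff, as plain dicts.
choices = [
    {"text": "It helps align models with human preferences and values",
     "explain": "Correct! RLHF uses human feedback to guide models.",
     "correct": True},
    {"text": "It makes models generate text faster",
     "explain": "RLHF isn't primarily about improving generation speed."},
    {"text": "It reduces the model's memory usage",
     "explain": "RLHF doesn't focus on model efficiency or memory optimization."},
]

mixed = shuffle_choices(choices, seed=42)

# Whatever the new order, exactly one choice stays marked correct.
assert sum(c.get("correct", False) for c in mixed) == 1
```

Shuffling a copy rather than editing in place mirrors what the diff preserves: the set of choices and the single `correct: true` flag are unchanged; only their order differs.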