Spaces:

mcamargo00
/

math-solution-classifier

Paused

App Files Files Community

mcamargo00 committed on Aug 12

Commit

e725555

verified ·

1 Parent(s): f9ebb4d

Upload app.py

Browse files

Files changed (1) hide show

app.py +32 -31

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# app.py - Gradio version (much simpler for HF Spaces)
 import unsloth
 from unsloth import FastModel
@@ -55,7 +55,7 @@ class GPTSequenceClassifier(nn.Module):
 # ===================================================================
-# 3. HELPERS
 # ===================================================================
 # --- Helper Functions ---
@@ -109,7 +109,7 @@ def evaluate_equations(eq_dict: dict, sol_dict: dict):
                 correct_rhs_val = round(lhs_val, 4)
                 correct_rhs_str = f"{correct_rhs_val:.4f}".rstrip('0').rstrip('.')
-                # Return a more detailed dictionary for better explanations
                 return {
                     "error": True,
                     "line_key": key,
@@ -235,7 +235,7 @@ logger.info("load_model(): %s", msg)
 # ===================================================================
-# 4. PIPELINE COMPONENTS
 # ===================================================================
 def run_conceptual_check(question: str, solution: str, model, tokenizer) -> dict:
@@ -255,7 +255,7 @@ def run_conceptual_check(question: str, solution: str, model, tokenizer) -> dict
     with torch.inference_mode():
         outputs = model(**inputs, use_cache=False)
-        # Explicitly cast logits to float32 for stable downstream processing
         logits = outputs["logits"].to(torch.float32)
         probs = torch.softmax(logits, dim=-1).squeeze().tolist()
@@ -327,11 +327,11 @@ def analyze_solution(question: str, solution: str):
     """
     Main orchestrator that runs the full pipeline and generates the final explanation.
     """
-    # STAGE 1: Conceptual Check (Fast)
     conceptual_result = run_conceptual_check(question, solution, classifier_model, classifier_tokenizer)
     confidence = conceptual_result['probabilities'][conceptual_result['prediction']]
-    # STAGE 2: Computational Check (Slower, Batched)
     computational_result = run_computational_check(solution, gemma_model, gemma_tokenizer)
     # FINAL VERDICT LOGIC
@@ -372,13 +372,13 @@ def classify_solution_stream(question: str, solution: str):
     log = []
-    # basic input check
     if not question.strip() or not solution.strip():
         log.append("⚠️ Provide a question and a solution.")
         yield "Please fill in both fields", "", render(log)
         return
-    # lazy-load if needed
     if not models_ready():
         log.append("⏳ Loading models…")
         yield "⏳ Working…", "", render(log)
@@ -444,7 +444,7 @@ def classify_solution_stream(question: str, solution: str):
         yield "Runtime error", f"{type(e).__name__}: {e}", render(log)
-        # ---------------- UI: streaming, no progress bars ----------------
 with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🧮 Math Solution Classifier")
     gr.Markdown(
@@ -665,7 +665,7 @@ class ExampleSelector:
         else:
             self.balance["wrong"] += 1
-# ===== CSV hookup (place near other imports / globals) =====
 from pathlib import Path
 import time
@@ -673,10 +673,10 @@ CSV_PATH = Path(__file__).resolve().parent / "final-test-with-wrong-answers.csv"
 POOL = load_examples_csv(str(CSV_PATH))
 def new_selector(seed: int | None = None):
-    # per-session selector; seed for reproducibility if you want
     return ExampleSelector(POOL, seed=seed or int(time.time()) & 0xFFFF)
-# small helpers for UI
 def _truncate(s: str, n: int = 100) -> str:
     s = s or ""
     return s if len(s) <= n else s[: n - 1] + "…"
@@ -694,7 +694,6 @@ def _rows_to_table(rows: list[dict]) -> list[list[str]]:
     return table
-# ===== Gradio callbacks for examples =====
 def ui_surprise(selector, filter_label="any"):
     """Pick one example and push it straight to inputs; persist selector state."""
     if selector is None or not POOL:
@@ -704,9 +703,13 @@ def ui_surprise(selector, filter_label="any"):
         return selector, gr.update(), gr.update()
     return selector, r["question"], r["solution"]
-# ---------------- UI: add CSV-driven examples ----------------
 with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🧮 Math Solution Classifier")
     gr.Markdown(
@@ -715,7 +718,7 @@ with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
         " \n Press 'Surprise me' to randomly select a sample question/answer pair from our dataset."
     )
-    # Per-session state
     selector_state = gr.State(new_selector())
     with gr.Row():
@@ -723,12 +726,12 @@ with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
         with gr.Column(scale=1):
             question_input = gr.Textbox(
                 label="Math Question",
-                placeholder="e.g., Solve for x: 2x + 5 = 13",
                 lines=3,
             )
             solution_input = gr.Textbox(
                 label="Proposed Solution",
-                placeholder="e.g., 2x + 5 = 13\n2x = 13 - 5\n2x = 8\nx = 4",
                 lines=8,
             )
             expected_label_example = gr.Textbox(
@@ -738,7 +741,7 @@ with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
             with gr.Row():
                 classify_btn = gr.Button("Classify Solution", variant="primary")
                 surprise_btn = gr.Button("Surprise me")   # <- new
-                clear_btn    = gr.Button("Clear")
         # -------- Right: outputs --------
         with gr.Column(scale=1):
@@ -746,7 +749,7 @@ with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
             explanation_output   = gr.Textbox(label="Explanation",   interactive=False, lines=6)
             status_output        = gr.Markdown(value="*(idle)*")  # live stage updates
-    # -------- Curated starter examples (static) --------
     gr.Examples(
         examples=[
                 ["John has three apples and Mary has seven, how many apples do they have together?",
@@ -755,18 +758,18 @@ with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
         ["A rectangle's length is twice its width. If the width is 7 cm, what is the perimeter of the rectangle?",
         "The length of the rectangle is 2 * 7 = 14 cm.\n The perimeter is 14 + 7 = 21 cm.\n Final answer: 21",
         "Conceptually flawed"],
-        ["A tank holds 60 liters of fuel. A generator uses fuel at a rate of 5 liters per hour. After running for 9 hours, how many liters are still in the tank?",
-"The generator uses 5 L/h × 9 h = 45 L of fuel in 9 hours.\n Then, there remain 60 L + 45 L = 105 L in the tank.\n Final answer: 105 L",
-"Conceptually flawed"],
             ["What is 15% of 200?",
              "15% = 15/100 = 0.15\n0.15 × 200 = 30\n Final answer: 30",
              "Correct"],
              ["A circle has a radius of 5 cm. Using the approximation pi = 3.14, what is the circumference of the circle?",
              "The circumference of the circle is 3.14 * 5 = 15.7 cm.\n Final answer: 15.7",
              "Conceptually flawed"],
-             ["Emily is saving for a bicycle that costs $250. She saves $15 each week from her allowance. She also received $40 for her birthday to put towards the bike. How many weeks will it take her to save enough money?",
-             "The amount Emily still needs to save is $250 - $40 = $210.\n The number of weeks it will take her to save is 210 / 15 = 12.\n Final answer: 12",
-             "Computationally flawed"],
              ["A 24-meter rope is cut into 6 equal pieces. A climber uses 2 of those pieces. How many meters of rope are still unused?",
              "The length of each piece is 24 / 6 = 4 m.\n The climber uses 2 × 4 m = 8 m of rope.\n There are 24 m − 8 m = 16 m of rope still unused.\n Final answer: 16",
              "Correct"]
@@ -776,7 +779,7 @@ with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
     # ---------- Wiring ----------
-    # Main classify (streaming)
     classify_btn.click(
         fn=classify_solution_stream,
         inputs=[question_input, solution_input],
@@ -785,16 +788,14 @@ with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
         concurrency_limit=1,
     )
-    # ---- and replace the Surprise button wiring with this ----
     surprise_btn.click(
         fn=ui_surprise,
-        inputs=[selector_state],                              # no filter_dd anymore
-        outputs=[selector_state, question_input, solution_input],  # persist selector state
         queue=True,
     )
-# Enable queue for streaming
 app.queue()
 if __name__ == "__main__":

+# app.py
 import unsloth
 from unsloth import FastModel
 # ===================================================================
+# HELPERS
 # ===================================================================
 # --- Helper Functions ---
                 correct_rhs_val = round(lhs_val, 4)
                 correct_rhs_str = f"{correct_rhs_val:.4f}".rstrip('0').rstrip('.')
                 return {
                     "error": True,
                     "line_key": key,
 # ===================================================================
+# PIPELINE COMPONENTS
 # ===================================================================
 def run_conceptual_check(question: str, solution: str, model, tokenizer) -> dict:
     with torch.inference_mode():
         outputs = model(**inputs, use_cache=False)
         logits = outputs["logits"].to(torch.float32)
         probs = torch.softmax(logits, dim=-1).squeeze().tolist()
     """
     Main orchestrator that runs the full pipeline and generates the final explanation.
     """
+    # STAGE 1: Conceptual Check
     conceptual_result = run_conceptual_check(question, solution, classifier_model, classifier_tokenizer)
     confidence = conceptual_result['probabilities'][conceptual_result['prediction']]
+    # STAGE 2: Computational Check
     computational_result = run_computational_check(solution, gemma_model, gemma_tokenizer)
     # FINAL VERDICT LOGIC
     log = []
     if not question.strip() or not solution.strip():
         log.append("⚠️ Provide a question and a solution.")
         yield "Please fill in both fields", "", render(log)
         return
     if not models_ready():
         log.append("⏳ Loading models…")
         yield "⏳ Working…", "", render(log)
         yield "Runtime error", f"{type(e).__name__}: {e}", render(log)
+        # ---------------- UI: streaming ----------------
 with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🧮 Math Solution Classifier")
     gr.Markdown(
         else:
             self.balance["wrong"] += 1
+# ===== CSV hookup =====
 from pathlib import Path
 import time
 POOL = load_examples_csv(str(CSV_PATH))
 def new_selector(seed: int | None = None):
     """Create an ExampleSelector over the module-level POOL.

     Args:
         seed: Seed forwarded to ExampleSelector. When None, a seed is
             derived from the current wall-clock time, keeping only the
             low 16 bits.

     Returns:
         A new ExampleSelector built from POOL with the chosen seed.
     """
     # Compare against None explicitly: `seed or ...` would treat a
     # caller-supplied seed of 0 as "no seed" and silently replace it with a
     # time-based value, which defeats reproducibility for that seed.
     if seed is None:
         seed = int(time.time()) & 0xFFFF
     return ExampleSelector(POOL, seed=seed)
 def _truncate(s: str, n: int = 100) -> str:
     s = s or ""
     return s if len(s) <= n else s[: n - 1] + "…"
     return table
 def ui_surprise(selector, filter_label="any"):
     """Pick one example and push it straight to inputs; persist selector state."""
     if selector is None or not POOL:
         return selector, gr.update(), gr.update()
     return selector, r["question"], r["solution"]
+components_to_clear = [
+    question_input,
+    solution_input,
+    expected_label_example,
+]
 with gr.Blocks(title="Math Solution Classifier", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🧮 Math Solution Classifier")
     gr.Markdown(
         " \n Press 'Surprise me' to randomly select a sample question/answer pair from our dataset."
     )
     selector_state = gr.State(new_selector())
     with gr.Row():
         with gr.Column(scale=1):
             question_input = gr.Textbox(
                 label="Math Question",
+                placeholder="e.g., What is 14 divided by 2?",
                 lines=3,
             )
             solution_input = gr.Textbox(
                 label="Proposed Solution",
+                placeholder="e.g., 14/2 = 9",
                 lines=8,
             )
             expected_label_example = gr.Textbox(
             with gr.Row():
                 classify_btn = gr.Button("Classify Solution", variant="primary")
                 surprise_btn = gr.Button("Surprise me")   # <- new
+                clear_btn    = clear_btn = gr.ClearButton(components=components_to_clear, value="Clear")
         # -------- Right: outputs --------
         with gr.Column(scale=1):
             explanation_output   = gr.Textbox(label="Explanation",   interactive=False, lines=6)
             status_output        = gr.Markdown(value="*(idle)*")  # live stage updates
+    # -------- Curated starter examples --------
     gr.Examples(
         examples=[
                 ["John has three apples and Mary has seven, how many apples do they have together?",
         ["A rectangle's length is twice its width. If the width is 7 cm, what is the perimeter of the rectangle?",
         "The length of the rectangle is 2 * 7 = 14 cm.\n The perimeter is 14 + 7 = 21 cm.\n Final answer: 21",
         "Conceptually flawed"],
+        ["",
+"The lateral area of the bottom layer is 2 * 3.14 * 20 * 8 = 1004.8.\n The lateral area of the middle layer is 2 * 3.14 * 15 * 8 = 753.6.\n The lateral area of the top layer is 2 * 3.14 * 10 * 8 = 502.4.\n The exposed top surface is the area of the smallest circle: 3.14 * (10*10) = 314.\n The total frosted area is 1004.8 + 753.6 + 502.4 + 314 = 2888.8 sq cm.\n FINAL ANSWER: 2888.8",
+"Computationally flawed"],
             ["What is 15% of 200?",
              "15% = 15/100 = 0.15\n0.15 × 200 = 30\n Final answer: 30",
              "Correct"],
              ["A circle has a radius of 5 cm. Using the approximation pi = 3.14, what is the circumference of the circle?",
              "The circumference of the circle is 3.14 * 5 = 15.7 cm.\n Final answer: 15.7",
              "Conceptually flawed"],
+             ["A library is building new shelves. Each shelf is 1.2 meters long. A standard book is 3 cm thick, and a large book is 5 cm thick. A shelf must hold 20 standard books and 10 large books. After filling a shelf with these books, how much space, in centimeters, is left on the shelf?",
+             "The shelf length in centimeters is 1.2 * 100 = 120 cm.\n The space taken by standard books is 20 * 3 = 60 cm.\n The space taken by large books is 10 * 5 = 50 cm.\n The total space taken is 60 + 50 = 110 cm.\n The remaining space is 120 + 110 = 230 cm.\n FINAL ANSWER: 230",
+             "Conceptually flawed"],
              ["A 24-meter rope is cut into 6 equal pieces. A climber uses 2 of those pieces. How many meters of rope are still unused?",
              "The length of each piece is 24 / 6 = 4 m.\n The climber uses 2 × 4 m = 8 m of rope.\n There are 24 m − 8 m = 16 m of rope still unused.\n Final answer: 16",
              "Correct"]
     # ---------- Wiring ----------
+    # Main classify
     classify_btn.click(
         fn=classify_solution_stream,
         inputs=[question_input, solution_input],
         concurrency_limit=1,
     )
     surprise_btn.click(
         fn=ui_surprise,
+        inputs=[selector_state],
+        outputs=[selector_state, question_input, solution_input],
         queue=True,
     )
 app.queue()
 if __name__ == "__main__":