Update app.py
app.py CHANGED
@@ -3,9 +3,11 @@ from transformers import AutoTokenizer, AutoModelForCausalLM, TextIteratorStreamer
 import threading
 import torch
 
-# Load model directly
-model = AutoModelForCausalLM.from_pretrained("
-
+# Load base model directly and then add the adapter
+model = AutoModelForCausalLM.from_pretrained("unsloth/gemma-3-1b-it")
+# Apply adapter from the fine-tuned version
+model.load_adapter("Oysiyl/gemma-3-1B-GRPO")
+tokenizer = AutoTokenizer.from_pretrained("unsloth/gemma-3-1b-it")
 
 
 def process_history(history):
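The new loading path pulls the base Gemma checkpoint and then attaches the GRPO fine-tuned LoRA adapter on top of it; `load_adapter` needs the `peft` package installed in the Space. For reference, a minimal sketch of an equivalent way to combine the same two repos with `peft.PeftModel` (variable names here are illustrative, not taken from app.py):

from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

# Sketch: load the base instruct checkpoint, then wrap it with the fine-tuned adapter weights.
base = AutoModelForCausalLM.from_pretrained("unsloth/gemma-3-1b-it")
model = PeftModel.from_pretrained(base, "Oysiyl/gemma-3-1B-GRPO")
tokenizer = AutoTokenizer.from_pretrained("unsloth/gemma-3-1b-it")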
@@ -74,9 +76,8 @@ def respond(
     output = "Thinking: \n"
     for token in streamer:
         output += token
-        # Check
+        # Check if "<SOLUTION>" token is in the output and format everything after it as bold
         if "<SOLUTION>" in output:
-            # Original solution pattern
             solution_start = output.find("<SOLUTION>") + len("<SOLUTION>")
             solution_end = output.find("</SOLUTION>")
             if solution_end > solution_start:
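The `streamer` consumed in this loop follows the standard `TextIteratorStreamer` pattern that the file's `threading` and `TextIteratorStreamer` imports point to: `model.generate` runs in a background thread while `respond` yields partial text. A rough sketch of that setup, with illustrative names rather than the Space's exact code (`messages` is a placeholder chat history):

import threading
from transformers import TextIteratorStreamer

# Sketch only: stream decoded text chunks while generation runs in a worker thread.
streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
input_ids = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_tensors="pt")
thread = threading.Thread(
    target=model.generate,
    kwargs={"input_ids": input_ids, "streamer": streamer, "max_new_tokens": 1024},
)
thread.start()

output = "Thinking: \n"
for token in streamer:
    output += token  # each chunk of decoded text is appended to the running output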
@@ -87,42 +88,6 @@ def respond(
                 )
                 yield formatted_output
             else:
-                # Handle case where closing tag is missing
-                formatted_output = (
-                    output[:solution_start] +
-                    "Final answer: **" + output[solution_start:] + "**"
-                )
-                yield formatted_output
-        # Check if end_working_out tag is present
-        elif "</end_working_out>" in output:
-            solution_start = output.find("</end_working_out>") + len("</end_working_out>")
-            formatted_output = (
-                output[:solution_start] +
-                "\nFinal answer: **" + output[solution_start:] + "**"
-            )
-            yield formatted_output
-        # Check if start_working_out is present but end_working_out is missing
-        elif "<start_working_out>" in output:
-            # Check if there's a SOLUTION tag after start_working_out
-            working_start = output.find("<start_working_out>")
-            if "<SOLUTION>" in output[working_start:]:
-                solution_start = output.find("<SOLUTION>", working_start) + len("<SOLUTION>")
-                solution_end = output.find("</SOLUTION>", solution_start)
-                if solution_end > solution_start:
-                    formatted_output = (
-                        output[:solution_start] +
-                        "Final answer: **" + output[solution_start:solution_end] + "**" +
-                        output[solution_end:]
-                    )
-                    yield formatted_output
-                else:
-                    formatted_output = (
-                        output[:solution_start] +
-                        "Final answer: **" + output[solution_start:] + "**"
-                    )
-                    yield formatted_output
-            else:
-                # No clear solution identified
                 yield output
         else:
             yield output
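The net effect of this hunk is that only a complete <SOLUTION>...</SOLUTION> pair gets the bold "Final answer" treatment; the fallback branches for `</end_working_out>` and `<start_working_out>` are removed, and anything else is yielded unchanged. A small standalone illustration of the surviving rule (a hypothetical helper, not code from app.py; the `formatted_output = (...)` body between the two hunks is not shown in the diff, so the exact bolding expression below is assumed from the removed branches):

def format_solution(output: str) -> str:
    # Hypothetical helper mirroring the simplified formatting rule kept by this commit.
    if "<SOLUTION>" in output:
        solution_start = output.find("<SOLUTION>") + len("<SOLUTION>")
        solution_end = output.find("</SOLUTION>")
        if solution_end > solution_start:
            # Bold only the text between the tags; leave the rest of the stream untouched.
            return (
                output[:solution_start]
                + "Final answer: **" + output[solution_start:solution_end] + "**"
                + output[solution_end:]
            )
    # Missing or incomplete tags: show the raw streamed text.
    return output

print(format_solution("Thinking: step 1 ... <SOLUTION>42</SOLUTION>"))
# Thinking: step 1 ... <SOLUTION>Final answer: **42**</SOLUTION>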