app.py (CHANGED)

@@ -21,6 +21,15 @@ tokenizer = AutoTokenizer.from_pretrained("./fine-tuned-model")
 tokenizer.pad_token = tokenizer.eos_token
 tokenizer.padding_side = 'left'
 
+# Load base model for before/after comparison
+console.print("[bold green]Loading base model for comparison...[/bold green]")
+base_model = AutoModelForCausalLM.from_pretrained(
+    "microsoft/phi-2",
+    device_map="auto",
+    trust_remote_code=True,
+    torch_dtype=torch.float16,
+)
+
 def generate_response(
     prompt,
     max_length=128,  # Match training max_length
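The hunk above keeps a second full copy of phi-2 in memory next to the fine-tuned model, which roughly doubles GPU usage at startup (phi-2 has about 2.7B parameters, so around 5 GB extra in float16). A minimal sketch of one way to soften that, deferring the base-model load until the first comparison request; the cache variable and helper name are hypothetical, not part of the diff:

```python
import torch
from transformers import AutoModelForCausalLM

_base_model = None  # hypothetical module-level cache, not in the diff

def get_base_model():
    """Load microsoft/phi-2 on first use and reuse it afterwards."""
    global _base_model
    if _base_model is None:
        _base_model = AutoModelForCausalLM.from_pretrained(
            "microsoft/phi-2",
            device_map="auto",
            trust_remote_code=True,
            torch_dtype=torch.float16,
        )
        _base_model.eval()  # inference only; no training here
    return _base_model
```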
@@ -29,6 +38,7 @@ def generate_response(
     num_generations=2,  # Match training num_generations
     repetition_penalty=1.1,
     do_sample=True,
+    show_comparison=True,  # New parameter for comparison toggle
 ):
     try:
         # Get the device of the model
@@ -40,7 +50,7 @@ def generate_response(
         # Move inputs to the same device as the model
         inputs = {k: v.to(device) for k, v in inputs.items()}
 
-        # Generate response
+        # Generate response from fine-tuned model
         with torch.no_grad():  # Disable gradient computation
             outputs = model.generate(
                 **inputs,
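The `tokenizer.padding_side = 'left'` set near the top of the file is what makes this generation step work on padded batches: a decoder-only model continues from the last position, so padding has to sit before the prompt rather than after it. A self-contained illustration, using the public phi-2 tokenizer since the fine-tuned one is local to the Space:

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("microsoft/phi-2", trust_remote_code=True)
tok.pad_token = tok.eos_token
tok.padding_side = "left"

batch = tok(
    ["short prompt", "a somewhat longer prompt"],
    return_tensors="pt",
    padding=True,
)
# Pad tokens (id == eos) now precede the shorter prompt, and attention_mask
# is 0 on those positions, so generate() starts from real text in every row.
print(batch["input_ids"][0])
print(batch["attention_mask"][0])
```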
@@ -60,7 +70,35 @@ def generate_response(
             response = tokenizer.decode(output, skip_special_tokens=True)
             responses.append(response)
 
-        return "\n\n---\n\n".join(responses)
+        fine_tuned_response = "\n\n---\n\n".join(responses)
+
+        if show_comparison:
+            # Generate response from base model
+            with torch.no_grad():
+                base_outputs = base_model.generate(
+                    **inputs,
+                    max_new_tokens=max_length,
+                    do_sample=do_sample,
+                    temperature=temperature,
+                    top_p=top_p,
+                    num_return_sequences=1,  # Only one for comparison
+                    repetition_penalty=repetition_penalty,
+                    pad_token_id=tokenizer.eos_token_id,
+                    eos_token_id=tokenizer.eos_token_id,
+                )
+
+            base_response = tokenizer.decode(base_outputs[0], skip_special_tokens=True)
+
+            return f"""
+### Before Fine-tuning (Base Model)
+{base_response}
+
+### After Fine-tuning
+{fine_tuned_response}
+"""
+        else:
+            return fine_tuned_response
+
     except Exception as e:
         console.print(f"[bold red]Error during generation: {str(e)}[/bold red]")
         return f"Error: {str(e)}"
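With this change, `generate_response` returns one Markdown string: base-model output under one heading, fine-tuned output under another, falling back to the joined responses when the toggle is off. A quick smoke test, assuming app.py's globals (model, base_model, tokenizer) are loaded; only parameters confirmed by the diff are passed:

```python
result = generate_response(
    "What is machine learning?",
    max_length=64,
    num_generations=1,
    show_comparison=True,
)
print(result)
# Expected shape:
# ### Before Fine-tuning (Base Model)
# ...
# ### After Fine-tuning
# ...
```

One caveat that predates this diff: when the sampling toggle is off (`do_sample=False`), recent transformers releases warn that `temperature` and `top_p` are then unused by `generate()`.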
@@ -85,6 +123,12 @@ custom_css = """
     line-height: 1.6;
     margin-bottom: 20px;
 }
+.comparison {
+    background-color: #f8f9fa;
+    padding: 15px;
+    border-radius: 8px;
+    margin: 10px 0;
+}
 """
 
 # Create the Gradio interface with enhanced UI
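The new `.comparison` rule only takes effect if some component carries that class, and no `elem_classes="comparison"` appears in the visible hunks. A sketch of the likely intent, attaching the class to the output component; treat the placement as an assumption:

```python
import gradio as gr

output = gr.Markdown(
    label="Generated Response(s)",
    show_label=True,
    elem_classes="comparison",  # assumption: opts this component into the new CSS rule
)
```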
@@ -160,12 +204,17 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Soft()) as demo:
                 info="Enable/disable sampling for deterministic output"
             )
 
+            show_comparison = gr.Checkbox(
+                value=True,
+                label="Show Before/After Comparison",
+                info="Toggle to show responses from both base and fine-tuned models"
+            )
+
             generate_btn = gr.Button("Generate", variant="primary")
 
         with gr.Column(scale=3):
-            output = gr.Textbox(
+            output = gr.Markdown(
                 label="Generated Response(s)",
-                lines=10,
                 show_label=True,
             )
 
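Two details in this hunk follow from the new return value: `gr.Textbox` would display the `###` headings as literal text, while `gr.Markdown` renders them, and `lines=10` had to go because it is a Textbox-specific argument. A self-contained side-by-side check:

```python
import gradio as gr

sample = (
    "### Before Fine-tuning (Base Model)\n(base output)\n\n"
    "### After Fine-tuning\n(fine-tuned output)"
)

with gr.Blocks() as check:
    gr.Markdown(sample)                  # renders the headings
    gr.Textbox(value=sample, lines=6)    # shows the raw "###" markup

# check.launch()  # uncomment to compare the two visually
```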
@@ -177,22 +226,23 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Soft()) as demo:
     1. **Technical Questions**:
        - "What is machine learning?"
        - "What is deep learning?"
-       - "…
+       - "What is the difference between supervised and unsupervised learning?"
 
     2. **Creative Writing**:
        - "Write a short story about a robot learning to paint."
        - "Write a story about a time-traveling smartphone."
-       - "Write a …
+       - "Write a fairy tale about a computer learning to dream."
+       - "Create a story about an AI becoming an artist."
 
     3. **Technical Explanations**:
        - "How does neural network training work?"
-       - "…
-       - "…
+       - "Explain quantum computing in simple terms."
+       - "What is transfer learning?"
 
     4. **Creative Tasks**:
-       - "Write a …
-       - "Create a story about an AI becoming an artist."
+       - "Write a poem about artificial intelligence."
        - "Write a poem about the future of technology."
+       - "Create a story about a robot learning to dream."
     """,
     elem_classes="description"
 )
@@ -207,7 +257,9 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Soft()) as demo:
             ["What is deep learning?"],
             ["Write a story about a time-traveling smartphone."],
             ["How does neural network training work?"],
-            ["Write a fairy tale about a computer learning to dream."]
+            ["Write a fairy tale about a computer learning to dream."],
+            ["What is the difference between supervised and unsupervised learning?"],
+            ["Create a story about an AI becoming an artist."]
         ],
         inputs=prompt
     )
@@ -222,7 +274,8 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Soft()) as demo:
             top_p,
             num_generations,
             repetition_penalty,
-            do_sample
+            do_sample,
+            show_comparison
         ],
         outputs=output
     )
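The inputs list must line up positionally with `generate_response`'s parameters, with the new checkbox last so its boolean feeds `show_comparison`. Reconstructed wiring for reference; the entries before `top_p` fall outside the hunk, so those names are assumptions based on the function signature:

```python
generate_btn.click(
    fn=generate_response,
    inputs=[
        prompt,               # assumed: defined earlier in app.py
        max_length,           # assumed
        temperature,          # assumed
        top_p,
        num_generations,
        repetition_penalty,
        do_sample,
        show_comparison,      # new: maps the checkbox onto the new parameter
    ],
    outputs=output,
)
```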