mistral-7b-v0.3-chat

Sleeping

App Files Community

rohitmenonhart committed on Oct 27, 2024

Commit

76860a8

verified ·

1 Parent(s): ae73e63

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -16

app.py CHANGED Viewed

@@ -3,17 +3,18 @@ import gradio as gr
 client = InferenceClient("mistralai/Mistral-7B-Instruct-v0.3")
-def format_prompt(message, history, persona=None):
-    prompt = "<s>"
-    if persona:
-        prompt += f"[ROLE: {persona}] "
     for user_prompt, bot_response in history:
         prompt += f"[INST] {user_prompt} [/INST] {bot_response}</s> "
     prompt += f"[INST] {message} [/INST]"
     return prompt
 def generate(
-    prompt, history, temperature=0.9, max_new_tokens=256, top_p=0.95, repetition_penalty=1.0, persona=None
 ):
     temperature = float(temperature)
     if temperature < 1e-2:
@@ -29,7 +30,7 @@ def generate(
         seed=42,
     )
-    formatted_prompt = format_prompt(prompt, history, persona)
     stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
@@ -76,19 +77,11 @@ additional_inputs = [
         step=0.05,
         interactive=True,
         info="Penalize repeated tokens",
-    ),
-    gr.Textbox(
-        label="Persona",
-        placeholder="Describe the role (e.g., 'wise mentor', 'friendly assistant')",
-        info="Define a persona for the model to roleplay.",
-    ),
 ]
 gr.ChatInterface(
-    fn=lambda prompt, history, temperature, max_new_tokens, top_p, repetition_penalty, persona: generate(
-        prompt, history, temperature, max_new_tokens, top_p, repetition_penalty, persona
-    ),
     chatbot=gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True, likeable=True, layout="panel"),
     additional_inputs=additional_inputs,
     title="Mistral 7B v0.3"

 client = InferenceClient("mistralai/Mistral-7B-Instruct-v0.3")
+# Define a fixed role
+DEFAULT_PERSONA = "strict teacher"
+def format_prompt(message, history):
+    prompt = f"<s>[ROLE: {DEFAULT_PERSONA}] "
     for user_prompt, bot_response in history:
         prompt += f"[INST] {user_prompt} [/INST] {bot_response}</s> "
     prompt += f"[INST] {message} [/INST]"
     return prompt
 def generate(
+    prompt, history, temperature=0.9, max_new_tokens=256, top_p=0.95, repetition_penalty=1.0
 ):
     temperature = float(temperature)
     if temperature < 1e-2:
         seed=42,
     )
+    formatted_prompt = format_prompt(prompt, history)
     stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
         step=0.05,
         interactive=True,
         info="Penalize repeated tokens",
+    )
 ]
 gr.ChatInterface(
+    fn=generate,
     chatbot=gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True, likeable=True, layout="panel"),
     additional_inputs=additional_inputs,
     title="Mistral 7B v0.3"