Spaces: Runtime error
update app.py
This setup can be extremely powerful and potentially dangerous depending on its use. With high flexibility in text generation and minimal constraints, it can produce misleading, inappropriate, or harmful content if not used responsibly. Its capacity for highly varied and convincing outputs means that misuse could spread misinformation, generate offensive material, or enable other unethical uses. Always exercise caution and ethical consideration when deploying such powerful tools. 🚨
app.py
CHANGED
@@ -1,22 +1,17 @@
 from huggingface_hub import InferenceClient
 import gradio as gr
 
-client = InferenceClient(
-    "mistralai/Mistral-7B-Instruct-v0.3"
-)
-
+client = InferenceClient("mistralai/Mistral-7B-Instruct-v0.3")
 
 def format_prompt(message, history):
-
-
-
-
-
-
+    prompt = "<s>"
+    for user_prompt, bot_response in history:
+        prompt += f"[INST] {user_prompt} [/INST]"
+        prompt += f" {bot_response}</s> "
+    prompt += f"[INST] {message} [/INST]"
+    return prompt
 
-def generate(
-    prompt, history, temperature=0.9, max_new_tokens=256, top_p=0.95, repetition_penalty=1.0,
-):
+def generate(prompt, history, temperature=1.0, max_new_tokens=1048, top_p=1.0, repetition_penalty=1.0):
     temperature = float(temperature)
     if temperature < 1e-2:
         temperature = 1e-2
@@ -41,55 +36,51 @@ def generate(
     yield output
     return output
 
-
 additional_inputs=[
     gr.Slider(
         label="Temperature",
-        value=0
+        value=1.0,
         minimum=0.0,
         maximum=1.0,
-        step=0.
+        step=0.01,
         interactive=True,
         info="Higher values produce more diverse outputs",
     ),
     gr.Slider(
         label="Max new tokens",
-        value=
+        value=1048,
         minimum=0,
-        maximum=
-        step=
+        maximum=2048,
+        step=128,
         interactive=True,
         info="The maximum numbers of new tokens",
     ),
     gr.Slider(
         label="Top-p (nucleus sampling)",
-        value=0
+        value=1.0,
         minimum=0.0,
-        maximum=1,
-        step=0.
+        maximum=1.0,
+        step=0.01,
         interactive=True,
         info="Higher values sample more low-probability tokens",
     ),
     gr.Slider(
         label="Repetition penalty",
-        value=1.
+        value=1.0,
         minimum=1.0,
         maximum=2.0,
-        step=0.
+        step=0.01,
         interactive=True,
         info="Penalize repeated tokens",
     )
 ]
 
-
 gr.ChatInterface(
     fn=generate,
     chatbot=gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True, likeable=True, layout="panel"),
     additional_inputs=additional_inputs,
-    title="
+    title="Mistral 7B v0.3"
 ).launch(show_api=False)
 
-
 gr.load("models/ehristoforu/dalle-3-xl-v2").launch()
-
-gr.load("models/microsoft/Phi-3-mini-4k-instruct").launch()
+gr.load("models/microsoft/Phi-3-mini-4k-instruct").launch()
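The hunk headers skip the middle of generate, and several removed lines are blank or cut off in the diff view, so neither the old body nor all of the old defaults are fully visible above. As a reference only, a typical streaming implementation against huggingface_hub's InferenceClient looks roughly like the sketch below; this is an assumption about the elided code, not the commit's actual body:

from huggingface_hub import InferenceClient

client = InferenceClient("mistralai/Mistral-7B-Instruct-v0.3")

def generate(prompt, history, temperature=1.0, max_new_tokens=1048, top_p=1.0, repetition_penalty=1.0):
    # Clamp temperature: the text-generation endpoint rejects a value of exactly 0.
    temperature = float(temperature)
    if temperature < 1e-2:
        temperature = 1e-2

    # Stream tokens from the hosted model, yielding the partial reply so
    # gr.ChatInterface can render it incrementally (format_prompt as above).
    stream = client.text_generation(
        format_prompt(prompt, history),
        temperature=temperature,
        max_new_tokens=max_new_tokens,
        top_p=top_p,
        repetition_penalty=repetition_penalty,
        do_sample=True,
        stream=True,
        details=True,
    )
    output = ""
    for response in stream:
        output += response.token.text
        yield output
    return output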
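One caveat about the tail of the file: in a plain script, launch() blocks until the server shuts down, so the two gr.load(...).launch() calls after gr.ChatInterface(...).launch(show_api=False) are never reached. If the intent is to serve all three models from one Space, a single launch over a tabbed layout is one possible restructuring; the sketch below reuses generate and additional_inputs from the file, and the tab names are invented:

import gradio as gr

chat = gr.ChatInterface(
    fn=generate,
    chatbot=gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True, likeable=True, layout="panel"),
    additional_inputs=additional_inputs,
    title="Mistral 7B v0.3",
)
dalle = gr.load("models/ehristoforu/dalle-3-xl-v2")       # hosted text-to-image demo
phi = gr.load("models/microsoft/Phi-3-mini-4k-instruct")  # hosted instruct demo

# One server, three tabs, launched exactly once.
gr.TabbedInterface([chat, dalle, phi], ["Mistral 7B", "DALL-E 3 XL", "Phi-3 Mini"]).launch(show_api=False)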