Spaces:

SkyNetWalker
/

HF-LLMs

Running

App Files Files Community

SkyNetWalker committed 2 days ago

Commit

4ca2388

verified ·

1 Parent(s): 19bd564

Update app.py

Browse files

Files changed (1) hide show

app.py +65 -25

app.py CHANGED Viewed

@@ -16,17 +16,29 @@ client = OpenAI(
 print("Client initialized.")
 def respond(
     message,
     history: list[tuple[str, str]],
-    system_message,
     max_tokens,
     temperature,
     top_p,
-    model_name,  # New parameter for model selection
 ):
     print(f"Received message: {message}")
     print(f"History: {history}")
     print(f"System message: {system_message}")
     print(f"Max tokens: {max_tokens}, Temperature: {temperature}, Top-P: {top_p}")
     print(f"Selected model: {model_name}")
@@ -47,7 +59,7 @@ def respond(
     print("Sending request to OpenAI API.")
     for message in client.chat.completions.create(
-        model=model_name,  # Use the selected model
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,
@@ -60,40 +72,68 @@ def respond(
         yield response
     print("Completed response generation.")
 chatbot = gr.Chatbot(height=400)
 print("Chatbot interface created.")
-# Define the list of models
 models = [
-    "PowerInfer/SmallThinker-3B-Preview", #OK
-    "Qwen/QwQ-32B-Preview", #OK
-    "Qwen/Qwen2.5-Coder-32B-Instruct", #OK
-    "meta-llama/Llama-3.2-3B-Instruct", #OK
-    #"Qwen/Qwen2.5-32B-Instruct", #fail, too large
-    "microsoft/Phi-3-mini-128k-instruct", #fail
-    #"microsoft/Phi-3-medium-128k-instruct", #fail
-    #"microsoft/phi-4", #fail, too large to be loaded automatically (29GB > 10GB)
-    #"meta-llama/Llama-3.3-70B-Instruct", #fail, need HF Pro subscription
 ]
-# Add a title and move the model dropdown to the top
 with gr.Blocks() as demo:
-    gr.Markdown("# LLM Test")  # Add a title to the top of the UI
-    # Add the model dropdown above the chatbot
-    model_dropdown = gr.Dropdown(choices=models, value=models[0], label="Select Model:")
-    # Use the existing ChatInterface
-    gr.ChatInterface(
         respond,
         additional_inputs=[
-            gr.Textbox(value="", label="Additional System Prompt:"),
-            gr.Slider(minimum=1, maximum=4096, value=1024, step=1, label="Max new tokens:"),
-            gr.Slider(minimum=0.1, maximum=1.0, value=0.3, step=0.1, label="Temperature:"),
-            gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-P:"),
-            model_dropdown,  # Pass the dropdown as an additional input
         ],
         fill_height=True,
         chatbot=chatbot,

 print("Client initialized.")
+# Pre-set system prompts
+SYSTEM_PROMPTS = {
+    "General Assistant": "You are a helpful, respectful and honest assistant. Always provide accurate information and admit when you're not sure about something.",
+    "Code Helper": "You are a programming assistant. Help users with coding questions, debugging, and best practices. Provide clear explanations and code examples when appropriate.",
+    "Creative Writer": "You are a creative writing assistant. Help users with storytelling, character development, and creative writing techniques. Be imaginative and encouraging."
+}
 def respond(
     message,
     history: list[tuple[str, str]],
+    preset_prompt,
+    custom_prompt,
     max_tokens,
     temperature,
     top_p,
+    model_name,
 ):
     print(f"Received message: {message}")
     print(f"History: {history}")
+    # Use custom prompt if provided, otherwise use selected preset
+    system_message = custom_prompt if custom_prompt.strip() else SYSTEM_PROMPTS[preset_prompt]
     print(f"System message: {system_message}")
     print(f"Max tokens: {max_tokens}, Temperature: {temperature}, Top-P: {top_p}")
     print(f"Selected model: {model_name}")
     print("Sending request to OpenAI API.")
     for message in client.chat.completions.create(
+        model=model_name,
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,
         yield response
     print("Completed response generation.")
 chatbot = gr.Chatbot(height=400)
 print("Chatbot interface created.")
 models = [
+    "PowerInfer/SmallThinker-3B-Preview",
+    "Qwen/QwQ-32B-Preview",
+    "Qwen/Qwen2.5-Coder-32B-Instruct",
+    "meta-llama/Llama-3.2-3B-Instruct",
+    "microsoft/Phi-3-mini-128k-instruct",
 ]
 with gr.Blocks() as demo:
+    gr.Markdown("# LLM Test")
+    with gr.Row():
+        # Model selection at the top
+        model_dropdown = gr.Dropdown(
+            choices=models,
+            value=models[0],
+            label="Select Model:"
+        )
+    # Chatbot interface
+    chat_interface = gr.ChatInterface(
         respond,
         additional_inputs=[
+            # Prompt selections
+            gr.Dropdown(
+                choices=list(SYSTEM_PROMPTS.keys()),
+                value=list(SYSTEM_PROMPTS.keys())[0],
+                label="Select System Prompt:"
+            ),
+            gr.Textbox(
+                value="",
+                label="Custom System Prompt (leaves blank to use preset):",
+                lines=2
+            ),
+            # Other parameters
+            gr.Slider(
+                minimum=1,
+                maximum=4096,
+                value=1024,
+                step=1,
+                label="Max new tokens:"
+            ),
+            gr.Slider(
+                minimum=0.1,
+                maximum=1.0,
+                value=0.3,
+                step=0.1,
+                label="Temperature:"
+            ),
+            gr.Slider(
+                minimum=0.1,
+                maximum=1.0,
+                value=0.95,
+                step=0.05,
+                label="Top-P:"
+            ),
+            model_dropdown,
         ],
         fill_height=True,
         chatbot=chatbot,