Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -33,8 +33,8 @@ def load_model():
|
|
33 |
|
34 |
pipe = load_model()
|
35 |
|
36 |
-
@spaces.GPU(duration=
|
37 |
-
def generate_response(prompt, max_length=1024):
|
38 |
# Create messages with system prompt
|
39 |
messages = [
|
40 |
{"role": "system", "content": "You are a helpful AI assistant. You always think step by step."},
|
@@ -42,7 +42,8 @@ def generate_response(prompt, max_length=1024):
|
|
42 |
]
|
43 |
|
44 |
outputs = pipe(messages, max_new_tokens=max_length)
|
45 |
-
|
|
|
46 |
# Extract just the assistant's response
|
47 |
try:
|
48 |
# Get the message list from the output
|
|
|
33 |
|
34 |
pipe = load_model()
|
35 |
|
36 |
+
@spaces.GPU(duration=20)
|
37 |
+
def generate_response(prompt, max_length=124):
|
38 |
# Create messages with system prompt
|
39 |
messages = [
|
40 |
{"role": "system", "content": "You are a helpful AI assistant. You always think step by step."},
|
|
|
42 |
]
|
43 |
|
44 |
outputs = pipe(messages, max_new_tokens=max_length)
|
45 |
+
|
46 |
+
print("Raw output:", outputs)
|
47 |
# Extract just the assistant's response
|
48 |
try:
|
49 |
# Get the message list from the output
|