zR committed on
Commit
5f7b72c
1 Parent(s): 83a2412

add suggested_hardware

Browse files
Files changed (2) hide show
  1. README.md +1 -0
  2. app.py +3 -3
README.md CHANGED
@@ -5,6 +5,7 @@ colorFrom: yellow
5
  colorTo: purple
6
  sdk: gradio
7
  sdk_version: 4.41.0
 
8
  app_port: 7860
9
  app_file: app.py
10
  models:
 
5
  colorTo: purple
6
  sdk: gradio
7
  sdk_version: 4.41.0
8
+ suggested_hardware: a100-large
9
  app_port: 7860
10
  app_file: app.py
11
  models:
app.py CHANGED
@@ -29,7 +29,7 @@ class StopOnTokens(StoppingCriteria):
29
  return False
30
 
31
 
32
- @spaces.GPU(duration=300)
33
  def predict(history, prompt, max_length, top_p, temperature):
34
  stop = StopOnTokens()
35
  messages = []
@@ -83,9 +83,9 @@ with gr.Blocks() as demo:
83
  </div>
84
  <div style="text-align: center; font-size: 15px; font-weight: bold; color: red; margin-bottom: 20px;">
85
  ⚠️ Due to the limitations of Huggingface ZERO GPUs, in order to output 10K characters in one go,
86
- we need to request a 5-minute quota each time.
87
  This will result in you only being able to use it once every 4 hours.
88
- If you plan to use it long-term, please consider deploying the model yourself.
89
  </div>
90
  """
91
  )
 
29
  return False
30
 
31
 
32
+ @spaces.GPU(duration=280)
33
  def predict(history, prompt, max_length, top_p, temperature):
34
  stop = StopOnTokens()
35
  messages = []
 
83
  </div>
84
  <div style="text-align: center; font-size: 15px; font-weight: bold; color: red; margin-bottom: 20px;">
85
  ⚠️ Due to the limitations of Huggingface ZERO GPUs, in order to output 10K characters in one go,
86
+ we need to request a 4-5 minute quota each time.
87
  This will result in you only being able to use it once every 4 hours.
88
+ If you plan to use it long-term, please consider deploying the model or fork this space yourself.
89
  </div>
90
  """
91
  )