johnbridges committed on
Commit
f453fc2
·
1 Parent(s): c1ed10f
Files changed (2) hide show
  1. requirements.txt +1 -0
  2. transformers_backend.py +1 -1
requirements.txt CHANGED
@@ -8,6 +8,7 @@ pydantic-settings>=2.10.1
8
 
9
  spaces
10
  accelerate
 
11
 
12
  vllm>=0.10.0
13
  torch>=2.7.1
 
8
 
9
  spaces
10
  accelerate
11
+ autoawq
12
 
13
  vllm>=0.10.0
14
  torch>=2.7.1
transformers_backend.py CHANGED
@@ -34,7 +34,7 @@ class TransformersChatBackend(ChatBackend):
34
 
35
  # Run inside ZeroGPU lease
36
  if spaces:
37
- @spaces.GPU(duration=60)
38
  def run_once(prompt: str) -> str:
39
  tokenizer = AutoTokenizer.from_pretrained(model_id)
40
  model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")
 
34
 
35
  # Run inside ZeroGPU lease
36
  if spaces:
37
+ @spaces.GPU(duration=300)
38
  def run_once(prompt: str) -> str:
39
  tokenizer = AutoTokenizer.from_pretrained(model_id)
40
  model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")