Commit
·
f453fc2
1
Parent(s):
c1ed10f
- requirements.txt +1 -0
- transformers_backend.py +1 -1
requirements.txt
CHANGED
|
@@ -8,6 +8,7 @@ pydantic-settings>=2.10.1
|
|
| 8 |
|
| 9 |
spaces
|
| 10 |
accelerate
|
|
|
|
| 11 |
|
| 12 |
vllm>=0.10.0
|
| 13 |
torch>=2.7.1
|
|
|
|
| 8 |
|
| 9 |
spaces
|
| 10 |
accelerate
|
| 11 |
+
autoawq
|
| 12 |
|
| 13 |
vllm>=0.10.0
|
| 14 |
torch>=2.7.1
|
transformers_backend.py
CHANGED
|
@@ -34,7 +34,7 @@ class TransformersChatBackend(ChatBackend):
|
|
| 34 |
|
| 35 |
# Run inside ZeroGPU lease
|
| 36 |
if spaces:
|
| 37 |
-
@spaces.GPU(duration=
|
| 38 |
def run_once(prompt: str) -> str:
|
| 39 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
| 40 |
model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")
|
|
|
|
| 34 |
|
| 35 |
# Run inside ZeroGPU lease
|
| 36 |
if spaces:
|
| 37 |
+
@spaces.GPU(duration=300)
|
| 38 |
def run_once(prompt: str) -> str:
|
| 39 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
| 40 |
model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")
|