Spaces:
Sleeping
Sleeping
File size: 772 Bytes
a2bd186 543454f 5f122aa |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 |
# DGX Spark Environment Configuration
# Copy this file to .env.spark and fill in the values.
#
# NOTE: Keep comments on their own lines. Some env-file loaders (for example
# `docker run --env-file`) treat a '#' that appears after the value as part of
# the value itself, so "KEY=value # note" would not yield "value".

# Service Configuration
PORT=8000

# Model Configuration (Phase 1: CodeGen, Phase 3: Devstral)
DEFAULT_MODEL=codegen-350m
# Uncomment for Phase 3:
# DEFAULT_MODEL=devstral-small

# API Security
API_KEY=<your-api-key>

# HuggingFace (required for gated models like Devstral)
HF_TOKEN=<your-hf-token>

# Model Settings
MAX_CONTEXT=8192
BATCH_SIZE=1
# TORCH_DTYPE is auto-detected from model config (codegen→fp16, devstral→bf16)
# Uncomment one of the following to override:
# TORCH_DTYPE=fp16
# TORCH_DTYPE=bf16

# Device Override (set to 'cpu' if GPU not supported yet)
# Default: auto-detect. Uncomment to select CUDA explicitly:
# DEVICE=cuda
# Force CPU until GB10 GPU support is available:
DEVICE=cpu
|