File size: 772 Bytes
a2bd186
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
543454f
 
 
 
5f122aa
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# DGX Spark Environment Configuration
# Copy this file to .env.spark and fill in the placeholder values.
# NOTE: comments are kept on their own lines. Some env-file loaders treat
# everything after '=' (including a trailing '# ...') as part of the value.

# Service Configuration
PORT=8000

# Model Configuration (Phase 1: CodeGen, Phase 3: Devstral)
DEFAULT_MODEL=codegen-350m
# For Phase 3, comment out the line above and uncomment this one:
# DEFAULT_MODEL=devstral-small

# API Security
# Replace the placeholder (including the angle brackets) with the real key.
API_KEY=<your-api-key>

# HuggingFace (required for gated models like Devstral)
# Replace the placeholder (including the angle brackets) with the real token.
HF_TOKEN=<your-hf-token>

# Model Settings
MAX_CONTEXT=8192
BATCH_SIZE=1
# TORCH_DTYPE is auto-detected from model config (codegen→fp16, devstral→bf16)
# Uncomment one of the following to override:
# TORCH_DTYPE=fp16
# TORCH_DTYPE=bf16

# Device Override (set to 'cpu' if GPU not supported yet)
# Default when unset: auto-detect. To select the GPU explicitly, uncomment:
# DEVICE=cuda
# Force CPU until GB10 GPU support is available.
DEVICE=cpu