# DGX Spark Environment Configuration
# Copy this to .env.spark and fill in values.
#
# NOTE: Comments are kept on their own lines on purpose. Some env-file
# loaders do not support trailing comments and would treat "# ..." text
# after a value as part of the value.

# Service Configuration
PORT=8000

# Model Configuration (Phase 1: CodeGen, Phase 3: Devstral)
DEFAULT_MODEL=codegen-350m
# Uncomment for Phase 3 (in place of the DEFAULT_MODEL line above):
# DEFAULT_MODEL=devstral-small

# API Security
API_KEY=

# HuggingFace (required for gated models like Devstral)
HF_TOKEN=

# Model Settings
MAX_CONTEXT=8192
BATCH_SIZE=1

# TORCH_DTYPE is auto-detected from model config (codegen→fp16, devstral→bf16).
# Uncomment one of the following to override:
# TORCH_DTYPE=fp16
# TORCH_DTYPE=bf16

# Device Override (set to 'cpu' if GPU not supported yet)
# Default when DEVICE is unset: auto-detect.
# DEVICE=cuda
# Force CPU until GB10 GPU support is available.
DEVICE=cpu