Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
| # DGX Spark Environment Configuration | |
| # Copy this to .env.spark and fill in values | |
| # Service Configuration | |
| PORT=8000 | |
| # Model Configuration (Phase 1: CodeGen, Phase 3: Devstral) | |
| DEFAULT_MODEL=codegen-350m | |
| # Phase 3: uncomment the next line to switch to Devstral | |
| # DEFAULT_MODEL=devstral-small | |
| # API Security | |
| API_KEY=<your-api-key> | |
| # HuggingFace (required for gated models like Devstral) | |
| HF_TOKEN=<your-hf-token> | |
| # Model Settings | |
| MAX_CONTEXT=8192 | |
| BATCH_SIZE=1 | |
| # TORCH_DTYPE is auto-detected from model config (codegen→fp16, devstral→bf16) | |
| # Uncomment to override: | |
| # TORCH_DTYPE=fp16 | |
| # TORCH_DTYPE=bf16 | |
| # Device Override (set to 'cpu' if the GPU is not supported yet) | |
| # When DEVICE is unset, the device is auto-detected. | |
| # DEVICE=cuda | |
| # Force CPU until GB10 GPU support is available: | |
| DEVICE=cpu | |