api / .env.spark.example
gary-boon
Update .env.spark.example: TORCH_DTYPE now auto-detected
543454f
raw
history blame
772 Bytes
# DGX Spark Environment Configuration
# Copy this to .env.spark and fill in values
# Service Configuration
# NOTE(review): presumably the port the API service listens on — confirm against the server startup code.
PORT=8000
# Model Configuration (Phase 1: CodeGen, Phase 3: Devstral)
DEFAULT_MODEL=codegen-350m
# Phase 3 alternative — uncomment the line below to use Devstral instead:
# DEFAULT_MODEL=devstral-small
# API Security
# Replace the whole <...> placeholder (angle brackets included) with the real key.
API_KEY=<your-api-key>
# HuggingFace (required for gated models like Devstral)
# Replace the whole <...> placeholder (angle brackets included) with your access token.
HF_TOKEN=<your-hf-token>
# Model Settings
# NOTE(review): presumably the maximum context length in tokens — confirm against the model loader.
MAX_CONTEXT=8192
# NOTE(review): presumably the inference batch size — confirm against the model loader.
BATCH_SIZE=1
# TORCH_DTYPE is auto-detected from model config (codegen→fp16, devstral→bf16)
# Uncomment one of the lines below to override the auto-detected value:
# TORCH_DTYPE=fp16
# TORCH_DTYPE=bf16
# Device Override (set to 'cpu' if GPU not supported yet)
# Comments are kept on their own lines: some env-file loaders (e.g. `docker run --env-file`)
# only recognise whole-line comments and would read a trailing "# ..." as part of the value.
# Default when DEVICE is unset: auto-detect. To select the GPU explicitly, uncomment:
# DEVICE=cuda
# Force CPU until GB10 GPU support is available:
DEVICE=cpu