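# RWKV-LatestSpace / config.production-modelscope.yaml
# Repository-viewer header captured together with this file (not configuration):
#   user: sparkleman
#   last commit: "UPDATE: G1a for modelscope" (f3d9166)
#   viewer links: raw, history blame
#   size: 1.84 kB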
# Top-level server/runtime settings.
# NOTE(review): the meanings below are inferred from the key names only;
# confirm against the code that loads this file.

# Presumably the bind address and port of the HTTP service.
HOST: "0.0.0.0"
PORT: 7860

# Presumably the inference strategy string (device + precision).
STRATEGY: "cuda fp16"
# Canonical lowercase boolean; parses to the same value as `True`.
RWKV_CUDA_ON: true
# Presumably the chunk size used when processing input -- TODO confirm unit.
CHUNK_LEN: 256
# Model catalogue: one list entry per model.
# NOTE(review): the nesting below was reconstructed from key order because the
# original indentation was lost. It assumes every key up to the next
# SERVICE_NAME belongs to the same entry, and that stop / stop_tokens live
# inside DEFAULT_SAMPLER -- confirm against the loader's schema.
# All four entries carry identical DEFAULT_SAMPLER values and the same
# DOWNLOAD_MODEL_REPO_ID; they differ in service name and checkpoint file,
# and only the last entry sets DEFAULT_CHAT / DEFAULT_REASONING.
MODELS:
  - SERVICE_NAME: "rwkv7-g1a-2.9b-20250924-ctx4096"
    DOWNLOAD_MODEL_FILE_NAME: "rwkv7-g1a-2.9b-20250924-ctx4096.pth"
    DOWNLOAD_MODEL_REPO_ID: "RWKV/rwkv7-g1"
    REASONING: true
    DEFAULT_SAMPLER:
      max_tokens: 4096
      temperature: 1.0
      top_p: 0.3
      presence_penalty: 0.5
      count_penalty: 0.5
      penalty_decay: 0.996
      # Double quotes are required so that "\n\n" is two newline characters.
      stop:
        - "\n\n"
      stop_tokens:
        - 0

  - SERVICE_NAME: "rwkv7-g1a-1.5b-20250922-ctx4096"
    DOWNLOAD_MODEL_FILE_NAME: "rwkv7-g1a-1.5b-20250922-ctx4096.pth"
    DOWNLOAD_MODEL_REPO_ID: "RWKV/rwkv7-g1"
    REASONING: true
    DEFAULT_SAMPLER:
      max_tokens: 4096
      temperature: 1.0
      top_p: 0.3
      presence_penalty: 0.5
      count_penalty: 0.5
      penalty_decay: 0.996
      stop:
        - "\n\n"
      stop_tokens:
        - 0

  - SERVICE_NAME: "rwkv7-g1a-0.4b-20250905-ctx4096"
    DOWNLOAD_MODEL_FILE_NAME: "rwkv7-g1a-0.4b-20250905-ctx4096.pth"
    DOWNLOAD_MODEL_REPO_ID: "RWKV/rwkv7-g1"
    REASONING: true
    DEFAULT_SAMPLER:
      max_tokens: 4096
      temperature: 1.0
      top_p: 0.3
      presence_penalty: 0.5
      count_penalty: 0.5
      penalty_decay: 0.996
      stop:
        - "\n\n"
      stop_tokens:
        - 0

  # The only entry with DEFAULT_CHAT / DEFAULT_REASONING set; presumably
  # this marks it as the default model -- verify against the consumer.
  - SERVICE_NAME: "rwkv7-g1a-0.1b-20250728-ctx4096"
    DOWNLOAD_MODEL_FILE_NAME: "rwkv7-g1a-0.1b-20250728-ctx4096.pth"
    DOWNLOAD_MODEL_REPO_ID: "RWKV/rwkv7-g1"
    REASONING: true
    DEFAULT_CHAT: true
    DEFAULT_REASONING: true
    DEFAULT_SAMPLER:
      max_tokens: 4096
      temperature: 1.0
      top_p: 0.3
      presence_penalty: 0.5
      count_penalty: 0.5
      penalty_decay: 0.996
      stop:
        - "\n\n"
      stop_tokens:
        - 0