sparkleman committed on
Commit
944cd13
·
1 Parent(s): 51ee4dc

UPDATE: G1 1.5B 62% & G1 2.9B 41%

Browse files
config.production-modelscope.yaml CHANGED
@@ -4,8 +4,8 @@ STRATEGY: "cuda fp16"
4
  RWKV_CUDA_ON: True
5
  CHUNK_LEN: 256
6
  MODELS:
7
- - SERVICE_NAME: "RWKV7-G1-2.9B-32%trained-20250327-ctx4k"
8
- DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-2.9B-32%trained-20250327-ctx4k.pth"
9
  DOWNLOAD_MODEL_REPO_ID: "RWKV/temp-latest-training-models"
10
  REASONING: True
11
  DEFAULT_SAMPLER:
@@ -19,8 +19,8 @@ MODELS:
19
  - "\n\n"
20
  stop_tokens:
21
  - 0
22
- - SERVICE_NAME: "RWKV7-G1-1.5B-50%trained-20250330-ctx4k"
23
- DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-1.5B-50%trained-20250330-ctx4k.pth"
24
  DOWNLOAD_MODEL_REPO_ID: "RWKV/temp-latest-training-models"
25
  REASONING: True
26
  DEFAULT_SAMPLER:
 
4
  RWKV_CUDA_ON: True
5
  CHUNK_LEN: 256
6
  MODELS:
7
+ - SERVICE_NAME: "RWKV7-G1-2.9B-41%trained-20250410-ctx4k"
8
+ DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-2.9B-41%trained-20250410-ctx4k.pth"
9
  DOWNLOAD_MODEL_REPO_ID: "RWKV/temp-latest-training-models"
10
  REASONING: True
11
  DEFAULT_SAMPLER:
 
19
  - "\n\n"
20
  stop_tokens:
21
  - 0
22
+ - SERVICE_NAME: "RWKV7-G1-1.5B-62%trained-20250410-ctx4k"
23
+ DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-1.5B-62%trained-20250410-ctx4k.pth"
24
  DOWNLOAD_MODEL_REPO_ID: "RWKV/temp-latest-training-models"
25
  REASONING: True
26
  DEFAULT_SAMPLER:
config.production.yaml CHANGED
@@ -4,8 +4,8 @@ STRATEGY: "cuda fp16"
4
  RWKV_CUDA_ON: True
5
  CHUNK_LEN: 256
6
  MODELS:
7
- - SERVICE_NAME: "RWKV7-G1-2.9B-32%trained-20250327-ctx4k"
8
- DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-2.9B-32%trained-20250327-ctx4k.pth"
9
  DOWNLOAD_MODEL_REPO_ID: "BlinkDL/temp-latest-training-models"
10
  REASONING: True
11
  DEFAULT_SAMPLER:
@@ -19,8 +19,8 @@ MODELS:
19
  - "\n\n"
20
  stop_tokens:
21
  - 0
22
- - SERVICE_NAME: "RWKV7-G1-1.5B-50%trained-20250330-ctx4k"
23
- DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-1.5B-50%trained-20250330-ctx4k.pth"
24
  DOWNLOAD_MODEL_REPO_ID: "BlinkDL/temp-latest-training-models"
25
  REASONING: True
26
  DEFAULT_SAMPLER:
 
4
  RWKV_CUDA_ON: True
5
  CHUNK_LEN: 256
6
  MODELS:
7
+ - SERVICE_NAME: "RWKV7-G1-2.9B-41%trained-20250410-ctx4k"
8
+ DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-2.9B-41%trained-20250410-ctx4k.pth"
9
  DOWNLOAD_MODEL_REPO_ID: "BlinkDL/temp-latest-training-models"
10
  REASONING: True
11
  DEFAULT_SAMPLER:
 
19
  - "\n\n"
20
  stop_tokens:
21
  - 0
22
+ - SERVICE_NAME: "RWKV7-G1-1.5B-62%trained-20250410-ctx4k"
23
+ DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-1.5B-62%trained-20250410-ctx4k.pth"
24
  DOWNLOAD_MODEL_REPO_ID: "BlinkDL/temp-latest-training-models"
25
  REASONING: True
26
  DEFAULT_SAMPLER: