sukaka committed on
Commit
c0bf0a9
1 Parent(s): bf45687

Upload config (1).json

Browse files
Files changed (1) hide show
  1. config (1).json +948 -0
config (1).json ADDED
@@ -0,0 +1,948 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "currentModelConfigIndex": 28,
3
+ "dataProcessParams": {
4
+ "dataPath": "finetune/data/sample.jsonl",
5
+ "vocabPath": "backend-python/rwkv_pip/rwkv_vocab_v20230424.txt"
6
+ },
7
+ "loraFinetuneParams": {
8
+ "accumGradBatches": 8,
9
+ "adamEps": "1e-8",
10
+ "baseModel": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth",
11
+ "beta1": 0.9,
12
+ "beta2": 0.999,
13
+ "ctxLen": 1024,
14
+ "devices": 1,
15
+ "epochBegin": 0,
16
+ "epochCount": 20,
17
+ "epochSave": 2,
18
+ "epochSteps": 200,
19
+ "gradCp": false,
20
+ "headQk": false,
21
+ "loraAlpha": 32,
22
+ "loraDropout": 0.01,
23
+ "loraLoad": "",
24
+ "loraR": 8,
25
+ "lrFinal": "5e-5",
26
+ "lrInit": "5e-5",
27
+ "microBsz": 1,
28
+ "preFfn": false,
29
+ "precision": "bf16",
30
+ "warmupSteps": 0
31
+ },
32
+ "modelConfigs": [
33
+ {
34
+ "apiParameters": {
35
+ "apiPort": 8000,
36
+ "frequencyPenalty": 1,
37
+ "maxResponseToken": 4100,
38
+ "presencePenalty": 0,
39
+ "temperature": 1,
40
+ "topP": 0.3
41
+ },
42
+ "modelParameters": {
43
+ "device": "CUDA",
44
+ "maxStoredLayers": 41,
45
+ "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth",
46
+ "precision": "int8",
47
+ "storedLayers": 6,
48
+ "useCustomCuda": true
49
+ },
50
+ "name": "GPU-2G-3B-World"
51
+ },
52
+ {
53
+ "apiParameters": {
54
+ "apiPort": 8000,
55
+ "frequencyPenalty": 1,
56
+ "maxResponseToken": 4100,
57
+ "presencePenalty": 0,
58
+ "temperature": 1,
59
+ "topP": 0.3
60
+ },
61
+ "modelParameters": {
62
+ "device": "CUDA",
63
+ "maxStoredLayers": 41,
64
+ "modelName": "RWKV-4-World-0.1B-v1-20230520-ctx4096.pth",
65
+ "precision": "fp32",
66
+ "storedLayers": 41
67
+ },
68
+ "name": "GPU-2G-0.1B-World"
69
+ },
70
+ {
71
+ "apiParameters": {
72
+ "apiPort": 8000,
73
+ "frequencyPenalty": 1,
74
+ "maxResponseToken": 4100,
75
+ "presencePenalty": 0,
76
+ "temperature": 1,
77
+ "topP": 0.3
78
+ },
79
+ "modelParameters": {
80
+ "device": "CUDA",
81
+ "maxStoredLayers": 41,
82
+ "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth",
83
+ "precision": "int8",
84
+ "storedLayers": 4,
85
+ "useCustomCuda": true
86
+ },
87
+ "name": "GPU-2G-1B5-EN"
88
+ },
89
+ {
90
+ "apiParameters": {
91
+ "apiPort": 8000,
92
+ "frequencyPenalty": 1,
93
+ "maxResponseToken": 4100,
94
+ "presencePenalty": 0,
95
+ "temperature": 1,
96
+ "topP": 0.3
97
+ },
98
+ "modelParameters": {
99
+ "device": "CUDA",
100
+ "maxStoredLayers": 41,
101
+ "modelName": "RWKV-4-World-0.4B-v1-20230529-ctx4096.pth",
102
+ "precision": "fp32",
103
+ "storedLayers": 41
104
+ },
105
+ "name": "GPU-4G-0.4B-World"
106
+ },
107
+ {
108
+ "apiParameters": {
109
+ "apiPort": 8000,
110
+ "frequencyPenalty": 1,
111
+ "maxResponseToken": 4100,
112
+ "presencePenalty": 0,
113
+ "temperature": 1,
114
+ "topP": 0.3
115
+ },
116
+ "modelParameters": {
117
+ "device": "CUDA",
118
+ "maxStoredLayers": 41,
119
+ "modelName": "RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth",
120
+ "precision": "fp32",
121
+ "storedLayers": 8
122
+ },
123
+ "name": "GPU-4G-1B5-World"
124
+ },
125
+ {
126
+ "apiParameters": {
127
+ "apiPort": 8000,
128
+ "frequencyPenalty": 1,
129
+ "maxResponseToken": 4100,
130
+ "presencePenalty": 0,
131
+ "temperature": 1,
132
+ "topP": 0.3
133
+ },
134
+ "modelParameters": {
135
+ "device": "CUDA",
136
+ "maxStoredLayers": 41,
137
+ "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth",
138
+ "precision": "int8",
139
+ "storedLayers": 41,
140
+ "useCustomCuda": true
141
+ },
142
+ "name": "GPU-4G-1B5-EN"
143
+ },
144
+ {
145
+ "apiParameters": {
146
+ "apiPort": 8000,
147
+ "frequencyPenalty": 1,
148
+ "maxResponseToken": 4100,
149
+ "presencePenalty": 0,
150
+ "temperature": 1,
151
+ "topP": 0.3
152
+ },
153
+ "modelParameters": {
154
+ "device": "CUDA",
155
+ "maxStoredLayers": 41,
156
+ "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth",
157
+ "precision": "int8",
158
+ "storedLayers": 24,
159
+ "useCustomCuda": true
160
+ },
161
+ "name": "GPU-4G-3B-World"
162
+ },
163
+ {
164
+ "apiParameters": {
165
+ "apiPort": 8000,
166
+ "frequencyPenalty": 1,
167
+ "maxResponseToken": 4100,
168
+ "presencePenalty": 0,
169
+ "temperature": 1,
170
+ "topP": 0.3
171
+ },
172
+ "modelParameters": {
173
+ "device": "CUDA",
174
+ "maxStoredLayers": 41,
175
+ "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth",
176
+ "precision": "int8",
177
+ "storedLayers": 24,
178
+ "useCustomCuda": true
179
+ },
180
+ "name": "GPU-4G-3B-EN"
181
+ },
182
+ {
183
+ "apiParameters": {
184
+ "apiPort": 8000,
185
+ "frequencyPenalty": 1,
186
+ "maxResponseToken": 4100,
187
+ "presencePenalty": 0,
188
+ "temperature": 1,
189
+ "topP": 0.3
190
+ },
191
+ "modelParameters": {
192
+ "device": "CUDA",
193
+ "maxStoredLayers": 41,
194
+ "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth",
195
+ "precision": "int8",
196
+ "storedLayers": 24,
197
+ "useCustomCuda": true
198
+ },
199
+ "name": "GPU-4G-3B-CN"
200
+ },
201
+ {
202
+ "apiParameters": {
203
+ "apiPort": 8000,
204
+ "frequencyPenalty": 1,
205
+ "maxResponseToken": 4100,
206
+ "presencePenalty": 0,
207
+ "temperature": 1,
208
+ "topP": 0.3
209
+ },
210
+ "modelParameters": {
211
+ "device": "CUDA",
212
+ "maxStoredLayers": 41,
213
+ "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth",
214
+ "precision": "int8",
215
+ "storedLayers": 8,
216
+ "useCustomCuda": true
217
+ },
218
+ "name": "GPU-4G-7B-World"
219
+ },
220
+ {
221
+ "apiParameters": {
222
+ "apiPort": 8000,
223
+ "frequencyPenalty": 1,
224
+ "maxResponseToken": 4100,
225
+ "presencePenalty": 0,
226
+ "temperature": 1,
227
+ "topP": 0.3
228
+ },
229
+ "modelParameters": {
230
+ "device": "CUDA",
231
+ "maxStoredLayers": 41,
232
+ "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth",
233
+ "precision": "int8",
234
+ "storedLayers": 8,
235
+ "useCustomCuda": true
236
+ },
237
+ "name": "GPU-4G-7B-EN"
238
+ },
239
+ {
240
+ "apiParameters": {
241
+ "apiPort": 8000,
242
+ "frequencyPenalty": 1,
243
+ "maxResponseToken": 4100,
244
+ "presencePenalty": 0,
245
+ "temperature": 1,
246
+ "topP": 0.3
247
+ },
248
+ "modelParameters": {
249
+ "device": "CUDA",
250
+ "maxStoredLayers": 41,
251
+ "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth",
252
+ "precision": "int8",
253
+ "storedLayers": 8,
254
+ "useCustomCuda": true
255
+ },
256
+ "name": "GPU-4G-7B-CN"
257
+ },
258
+ {
259
+ "apiParameters": {
260
+ "apiPort": 8000,
261
+ "frequencyPenalty": 1,
262
+ "maxResponseToken": 4100,
263
+ "presencePenalty": 0,
264
+ "temperature": 1,
265
+ "topP": 0.3
266
+ },
267
+ "modelParameters": {
268
+ "device": "CUDA",
269
+ "maxStoredLayers": 41,
270
+ "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth",
271
+ "precision": "fp16",
272
+ "storedLayers": 41,
273
+ "useCustomCuda": true
274
+ },
275
+ "name": "GPU-6G-1B5-EN"
276
+ },
277
+ {
278
+ "apiParameters": {
279
+ "apiPort": 8000,
280
+ "frequencyPenalty": 1,
281
+ "maxResponseToken": 4100,
282
+ "presencePenalty": 0,
283
+ "temperature": 1,
284
+ "topP": 0.3
285
+ },
286
+ "modelParameters": {
287
+ "device": "CUDA",
288
+ "maxStoredLayers": 41,
289
+ "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth",
290
+ "precision": "int8",
291
+ "storedLayers": 41,
292
+ "useCustomCuda": true
293
+ },
294
+ "name": "GPU-6G-3B-World"
295
+ },
296
+ {
297
+ "apiParameters": {
298
+ "apiPort": 8000,
299
+ "frequencyPenalty": 1,
300
+ "maxResponseToken": 4100,
301
+ "presencePenalty": 0,
302
+ "temperature": 1,
303
+ "topP": 0.3
304
+ },
305
+ "modelParameters": {
306
+ "device": "CUDA",
307
+ "maxStoredLayers": 41,
308
+ "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth",
309
+ "precision": "int8",
310
+ "storedLayers": 41,
311
+ "useCustomCuda": true
312
+ },
313
+ "name": "GPU-6G-3B-EN"
314
+ },
315
+ {
316
+ "apiParameters": {
317
+ "apiPort": 8000,
318
+ "frequencyPenalty": 1,
319
+ "maxResponseToken": 4100,
320
+ "presencePenalty": 0,
321
+ "temperature": 1,
322
+ "topP": 0.3
323
+ },
324
+ "modelParameters": {
325
+ "device": "CUDA",
326
+ "maxStoredLayers": 41,
327
+ "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth",
328
+ "precision": "int8",
329
+ "storedLayers": 41,
330
+ "useCustomCuda": true
331
+ },
332
+ "name": "GPU-6G-3B-CN"
333
+ },
334
+ {
335
+ "apiParameters": {
336
+ "apiPort": 8000,
337
+ "frequencyPenalty": 1,
338
+ "maxResponseToken": 4100,
339
+ "presencePenalty": 0,
340
+ "temperature": 1,
341
+ "topP": 0.3
342
+ },
343
+ "modelParameters": {
344
+ "device": "CUDA",
345
+ "maxStoredLayers": 41,
346
+ "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth",
347
+ "precision": "int8",
348
+ "storedLayers": 18,
349
+ "useCustomCuda": true
350
+ },
351
+ "name": "GPU-6G-7B-World"
352
+ },
353
+ {
354
+ "apiParameters": {
355
+ "apiPort": 8000,
356
+ "frequencyPenalty": 1,
357
+ "maxResponseToken": 4100,
358
+ "presencePenalty": 0,
359
+ "temperature": 1,
360
+ "topP": 0.3
361
+ },
362
+ "modelParameters": {
363
+ "device": "CUDA",
364
+ "maxStoredLayers": 41,
365
+ "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth",
366
+ "precision": "int8",
367
+ "storedLayers": 18,
368
+ "useCustomCuda": true
369
+ },
370
+ "name": "GPU-6G-7B-EN"
371
+ },
372
+ {
373
+ "apiParameters": {
374
+ "apiPort": 8000,
375
+ "frequencyPenalty": 1,
376
+ "maxResponseToken": 4100,
377
+ "presencePenalty": 0,
378
+ "temperature": 1,
379
+ "topP": 0.3
380
+ },
381
+ "modelParameters": {
382
+ "device": "CUDA",
383
+ "maxStoredLayers": 41,
384
+ "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth",
385
+ "precision": "int8",
386
+ "storedLayers": 18,
387
+ "useCustomCuda": true
388
+ },
389
+ "name": "GPU-6G-7B-CN"
390
+ },
391
+ {
392
+ "apiParameters": {
393
+ "apiPort": 8000,
394
+ "frequencyPenalty": 1,
395
+ "maxResponseToken": 4100,
396
+ "presencePenalty": 0,
397
+ "temperature": 1,
398
+ "topP": 0.3
399
+ },
400
+ "modelParameters": {
401
+ "device": "CUDA",
402
+ "maxStoredLayers": 41,
403
+ "modelName": "RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth",
404
+ "precision": "fp32",
405
+ "storedLayers": 41
406
+ },
407
+ "name": "GPU-8G-1B5-World"
408
+ },
409
+ {
410
+ "apiParameters": {
411
+ "apiPort": 8000,
412
+ "frequencyPenalty": 1,
413
+ "maxResponseToken": 4100,
414
+ "presencePenalty": 0,
415
+ "temperature": 1,
416
+ "topP": 0.3
417
+ },
418
+ "modelParameters": {
419
+ "device": "CUDA",
420
+ "maxStoredLayers": 41,
421
+ "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth",
422
+ "precision": "fp16",
423
+ "storedLayers": 41,
424
+ "useCustomCuda": true
425
+ },
426
+ "name": "GPU-8G-3B-World"
427
+ },
428
+ {
429
+ "apiParameters": {
430
+ "apiPort": 8000,
431
+ "frequencyPenalty": 1,
432
+ "maxResponseToken": 4100,
433
+ "presencePenalty": 0,
434
+ "temperature": 1,
435
+ "topP": 0.3
436
+ },
437
+ "modelParameters": {
438
+ "device": "CUDA",
439
+ "maxStoredLayers": 41,
440
+ "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth",
441
+ "precision": "fp16",
442
+ "storedLayers": 41,
443
+ "useCustomCuda": true
444
+ },
445
+ "name": "GPU-8G-3B-EN"
446
+ },
447
+ {
448
+ "apiParameters": {
449
+ "apiPort": 8000,
450
+ "frequencyPenalty": 1,
451
+ "maxResponseToken": 4100,
452
+ "presencePenalty": 0,
453
+ "temperature": 1,
454
+ "topP": 0.3
455
+ },
456
+ "modelParameters": {
457
+ "device": "CUDA",
458
+ "maxStoredLayers": 41,
459
+ "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth",
460
+ "precision": "fp16",
461
+ "storedLayers": 41,
462
+ "useCustomCuda": true
463
+ },
464
+ "name": "GPU-8G-3B-CN"
465
+ },
466
+ {
467
+ "apiParameters": {
468
+ "apiPort": 8000,
469
+ "frequencyPenalty": 1,
470
+ "maxResponseToken": 4100,
471
+ "presencePenalty": 0,
472
+ "temperature": 1,
473
+ "topP": 0.3
474
+ },
475
+ "modelParameters": {
476
+ "device": "CUDA",
477
+ "maxStoredLayers": 41,
478
+ "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth",
479
+ "precision": "int8",
480
+ "storedLayers": 27,
481
+ "useCustomCuda": true
482
+ },
483
+ "name": "GPU-8G-7B-World"
484
+ },
485
+ {
486
+ "apiParameters": {
487
+ "apiPort": 8000,
488
+ "frequencyPenalty": 1,
489
+ "maxResponseToken": 4100,
490
+ "presencePenalty": 0,
491
+ "temperature": 1,
492
+ "topP": 0.3
493
+ },
494
+ "modelParameters": {
495
+ "device": "CUDA",
496
+ "maxStoredLayers": 41,
497
+ "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth",
498
+ "precision": "int8",
499
+ "storedLayers": 27,
500
+ "useCustomCuda": true
501
+ },
502
+ "name": "GPU-8G-7B-EN"
503
+ },
504
+ {
505
+ "apiParameters": {
506
+ "apiPort": 8000,
507
+ "frequencyPenalty": 1,
508
+ "maxResponseToken": 4100,
509
+ "presencePenalty": 0,
510
+ "temperature": 1,
511
+ "topP": 0.3
512
+ },
513
+ "modelParameters": {
514
+ "device": "CUDA",
515
+ "maxStoredLayers": 41,
516
+ "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth",
517
+ "precision": "int8",
518
+ "storedLayers": 27,
519
+ "useCustomCuda": true
520
+ },
521
+ "name": "GPU-8G-7B-CN"
522
+ },
523
+ {
524
+ "apiParameters": {
525
+ "apiPort": 8000,
526
+ "frequencyPenalty": 1,
527
+ "maxResponseToken": 4100,
528
+ "presencePenalty": 0,
529
+ "temperature": 1,
530
+ "topP": 0.3
531
+ },
532
+ "modelParameters": {
533
+ "device": "CUDA",
534
+ "maxStoredLayers": 41,
535
+ "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth",
536
+ "precision": "int8",
537
+ "storedLayers": 41,
538
+ "useCustomCuda": true
539
+ },
540
+ "name": "GPU-10G-7B-World"
541
+ },
542
+ {
543
+ "apiParameters": {
544
+ "apiPort": 8000,
545
+ "frequencyPenalty": 1,
546
+ "maxResponseToken": 4100,
547
+ "presencePenalty": 0,
548
+ "temperature": 1,
549
+ "topP": 0.3
550
+ },
551
+ "modelParameters": {
552
+ "device": "CUDA",
553
+ "maxStoredLayers": 41,
554
+ "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth",
555
+ "precision": "int8",
556
+ "storedLayers": 41,
557
+ "useCustomCuda": true
558
+ },
559
+ "name": "GPU-10G-7B-EN"
560
+ },
561
+ {
562
+ "apiParameters": {
563
+ "apiPort": 8000,
564
+ "frequencyPenalty": 1,
565
+ "maxResponseToken": 6100,
566
+ "presencePenalty": 0,
567
+ "temperature": 1,
568
+ "topP": 0.3
569
+ },
570
+ "modelParameters": {
571
+ "device": "CUDA",
572
+ "maxStoredLayers": 41,
573
+ "modelName": "RWKV-claude-4-World-7B-20230805-ctx65k.pth",
574
+ "precision": "int8",
575
+ "storedLayers": 31,
576
+ "useCustomCuda": true
577
+ },
578
+ "name": "GPU-10G-7B-CN"
579
+ },
580
+ {
581
+ "apiParameters": {
582
+ "apiPort": 8000,
583
+ "frequencyPenalty": 1,
584
+ "maxResponseToken": 4100,
585
+ "presencePenalty": 0,
586
+ "temperature": 1,
587
+ "topP": 0.3
588
+ },
589
+ "modelParameters": {
590
+ "device": "CUDA",
591
+ "maxStoredLayers": 41,
592
+ "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth",
593
+ "precision": "int8",
594
+ "storedLayers": 24,
595
+ "useCustomCuda": true
596
+ },
597
+ "name": "GPU-12G-14B-EN"
598
+ },
599
+ {
600
+ "apiParameters": {
601
+ "apiPort": 8000,
602
+ "frequencyPenalty": 1,
603
+ "maxResponseToken": 4100,
604
+ "presencePenalty": 0,
605
+ "temperature": 1,
606
+ "topP": 0.3
607
+ },
608
+ "modelParameters": {
609
+ "device": "CUDA",
610
+ "maxStoredLayers": 41,
611
+ "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth",
612
+ "precision": "fp16",
613
+ "storedLayers": 41,
614
+ "useCustomCuda": true
615
+ },
616
+ "name": "GPU-16G-7B-World"
617
+ },
618
+ {
619
+ "apiParameters": {
620
+ "apiPort": 8000,
621
+ "frequencyPenalty": 1,
622
+ "maxResponseToken": 4100,
623
+ "presencePenalty": 0,
624
+ "temperature": 1,
625
+ "topP": 0.3
626
+ },
627
+ "modelParameters": {
628
+ "device": "CUDA",
629
+ "maxStoredLayers": 41,
630
+ "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth",
631
+ "precision": "fp16",
632
+ "storedLayers": 41,
633
+ "useCustomCuda": true
634
+ },
635
+ "name": "GPU-16G-7B-EN"
636
+ },
637
+ {
638
+ "apiParameters": {
639
+ "apiPort": 8000,
640
+ "frequencyPenalty": 1,
641
+ "maxResponseToken": 4100,
642
+ "presencePenalty": 0,
643
+ "temperature": 1,
644
+ "topP": 0.3
645
+ },
646
+ "modelParameters": {
647
+ "device": "CUDA",
648
+ "maxStoredLayers": 41,
649
+ "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth",
650
+ "precision": "fp16",
651
+ "storedLayers": 32,
652
+ "useCustomCuda": true
653
+ },
654
+ "name": "GPU-16G-7B-CN"
655
+ },
656
+ {
657
+ "apiParameters": {
658
+ "apiPort": 8000,
659
+ "frequencyPenalty": 1,
660
+ "maxResponseToken": 4100,
661
+ "presencePenalty": 0,
662
+ "temperature": 1,
663
+ "topP": 0.3
664
+ },
665
+ "modelParameters": {
666
+ "device": "CUDA",
667
+ "maxStoredLayers": 41,
668
+ "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth",
669
+ "precision": "int8",
670
+ "storedLayers": 37,
671
+ "useCustomCuda": true
672
+ },
673
+ "name": "GPU-16G-14B-EN"
674
+ },
675
+ {
676
+ "apiParameters": {
677
+ "apiPort": 8000,
678
+ "frequencyPenalty": 1,
679
+ "maxResponseToken": 4100,
680
+ "presencePenalty": 0,
681
+ "temperature": 1,
682
+ "topP": 0.3
683
+ },
684
+ "modelParameters": {
685
+ "device": "CUDA",
686
+ "maxStoredLayers": 41,
687
+ "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth",
688
+ "precision": "int8",
689
+ "storedLayers": 41,
690
+ "useCustomCuda": true
691
+ },
692
+ "name": "GPU-18G-14B-EN"
693
+ },
694
+ {
695
+ "apiParameters": {
696
+ "apiPort": 8000,
697
+ "frequencyPenalty": 1,
698
+ "maxResponseToken": 4100,
699
+ "presencePenalty": 0,
700
+ "temperature": 1,
701
+ "topP": 0.3
702
+ },
703
+ "modelParameters": {
704
+ "device": "CUDA",
705
+ "maxStoredLayers": 41,
706
+ "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth",
707
+ "precision": "fp16",
708
+ "storedLayers": 41,
709
+ "useCustomCuda": true
710
+ },
711
+ "name": "GPU-32G-14B-EN"
712
+ },
713
+ {
714
+ "apiParameters": {
715
+ "apiPort": 8000,
716
+ "frequencyPenalty": 1,
717
+ "maxResponseToken": 4100,
718
+ "presencePenalty": 0,
719
+ "temperature": 1,
720
+ "topP": 0.8
721
+ },
722
+ "modelParameters": {
723
+ "device": "CPU",
724
+ "maxStoredLayers": 41,
725
+ "modelName": "RWKV-4-MIDI-120M-v1-20230714-ctx4096.pth",
726
+ "precision": "fp32",
727
+ "storedLayers": 41
728
+ },
729
+ "name": "CPU-120M-Music"
730
+ },
731
+ {
732
+ "apiParameters": {
733
+ "apiPort": 8000,
734
+ "frequencyPenalty": 1,
735
+ "maxResponseToken": 4100,
736
+ "presencePenalty": 0,
737
+ "temperature": 1,
738
+ "topP": 0.8
739
+ },
740
+ "modelParameters": {
741
+ "device": "CPU",
742
+ "maxStoredLayers": 41,
743
+ "modelName": "RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth",
744
+ "precision": "fp32",
745
+ "storedLayers": 41
746
+ },
747
+ "name": "CPU-560M-Music"
748
+ },
749
+ {
750
+ "apiParameters": {
751
+ "apiPort": 8000,
752
+ "frequencyPenalty": 1,
753
+ "maxResponseToken": 4100,
754
+ "presencePenalty": 0,
755
+ "temperature": 1,
756
+ "topP": 0.3
757
+ },
758
+ "modelParameters": {
759
+ "device": "CPU",
760
+ "maxStoredLayers": 41,
761
+ "modelName": "RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth",
762
+ "precision": "fp32",
763
+ "storedLayers": 41
764
+ },
765
+ "name": "CPU-6G-1B5-World"
766
+ },
767
+ {
768
+ "apiParameters": {
769
+ "apiPort": 8000,
770
+ "frequencyPenalty": 1,
771
+ "maxResponseToken": 4100,
772
+ "presencePenalty": 0,
773
+ "temperature": 1,
774
+ "topP": 0.3
775
+ },
776
+ "modelParameters": {
777
+ "device": "CPU",
778
+ "maxStoredLayers": 41,
779
+ "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth",
780
+ "precision": "fp32",
781
+ "storedLayers": 41
782
+ },
783
+ "name": "CPU-6G-1B5-EN"
784
+ },
785
+ {
786
+ "apiParameters": {
787
+ "apiPort": 8000,
788
+ "frequencyPenalty": 1,
789
+ "maxResponseToken": 4100,
790
+ "presencePenalty": 0,
791
+ "temperature": 1,
792
+ "topP": 0.3
793
+ },
794
+ "modelParameters": {
795
+ "device": "CPU",
796
+ "maxStoredLayers": 41,
797
+ "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth",
798
+ "precision": "fp32",
799
+ "storedLayers": 41
800
+ },
801
+ "name": "CPU-12G-3B-World"
802
+ },
803
+ {
804
+ "apiParameters": {
805
+ "apiPort": 8000,
806
+ "frequencyPenalty": 1,
807
+ "maxResponseToken": 4100,
808
+ "presencePenalty": 0,
809
+ "temperature": 1,
810
+ "topP": 0.3
811
+ },
812
+ "modelParameters": {
813
+ "device": "CPU",
814
+ "maxStoredLayers": 41,
815
+ "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth",
816
+ "precision": "fp32",
817
+ "storedLayers": 41
818
+ },
819
+ "name": "CPU-12G-3B-EN"
820
+ },
821
+ {
822
+ "apiParameters": {
823
+ "apiPort": 8000,
824
+ "frequencyPenalty": 1,
825
+ "maxResponseToken": 4100,
826
+ "presencePenalty": 0,
827
+ "temperature": 1,
828
+ "topP": 0.3
829
+ },
830
+ "modelParameters": {
831
+ "device": "CPU",
832
+ "maxStoredLayers": 41,
833
+ "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth",
834
+ "precision": "fp32",
835
+ "storedLayers": 41
836
+ },
837
+ "name": "CPU-12G-3B-CN"
838
+ },
839
+ {
840
+ "apiParameters": {
841
+ "apiPort": 8000,
842
+ "frequencyPenalty": 1,
843
+ "maxResponseToken": 4100,
844
+ "presencePenalty": 0,
845
+ "temperature": 1,
846
+ "topP": 0.3
847
+ },
848
+ "modelParameters": {
849
+ "device": "CPU",
850
+ "maxStoredLayers": 41,
851
+ "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth",
852
+ "precision": "fp32",
853
+ "storedLayers": 41
854
+ },
855
+ "name": "CPU-28G-7B-World"
856
+ },
857
+ {
858
+ "apiParameters": {
859
+ "apiPort": 8000,
860
+ "frequencyPenalty": 1,
861
+ "maxResponseToken": 4100,
862
+ "presencePenalty": 0,
863
+ "temperature": 1,
864
+ "topP": 0.3
865
+ },
866
+ "modelParameters": {
867
+ "device": "CPU",
868
+ "maxStoredLayers": 41,
869
+ "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth",
870
+ "precision": "fp32",
871
+ "storedLayers": 41
872
+ },
873
+ "name": "CPU-28G-7B-EN"
874
+ },
875
+ {
876
+ "apiParameters": {
877
+ "apiPort": 8000,
878
+ "frequencyPenalty": 1,
879
+ "maxResponseToken": 4100,
880
+ "presencePenalty": 0,
881
+ "temperature": 1,
882
+ "topP": 0.3
883
+ },
884
+ "modelParameters": {
885
+ "device": "CPU",
886
+ "maxStoredLayers": 41,
887
+ "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth",
888
+ "precision": "fp32",
889
+ "storedLayers": 41
890
+ },
891
+ "name": "CPU-28G-7B-CN"
892
+ },
893
+ {
894
+ "apiParameters": {
895
+ "apiPort": 8000,
896
+ "frequencyPenalty": 1,
897
+ "maxResponseToken": 4100,
898
+ "presencePenalty": 0,
899
+ "temperature": 1,
900
+ "topP": 0.3
901
+ },
902
+ "modelParameters": {
903
+ "device": "CUDA",
904
+ "maxStoredLayers": 41,
905
+ "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth",
906
+ "precision": "int8",
907
+ "storedLayers": 6,
908
+ "useCustomCuda": true
909
+ },
910
+ "name": "2023/9/2 09:30:41"
911
+ },
912
+ {
913
+ "apiParameters": {
914
+ "apiPort": 8000,
915
+ "frequencyPenalty": 1,
916
+ "maxResponseToken": 4100,
917
+ "presencePenalty": 0,
918
+ "temperature": 1,
919
+ "topP": 0.3
920
+ },
921
+ "modelParameters": {
922
+ "device": "CUDA",
923
+ "maxStoredLayers": 41,
924
+ "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth",
925
+ "precision": "int8",
926
+ "storedLayers": 6,
927
+ "useCustomCuda": true
928
+ },
929
+ "name": "2023/9/2 11:47:17"
930
+ }
931
+ ],
932
+ "modelSourceManifestList": "https://cdn.jsdelivr.net/gh/josstorer/RWKV-Runner@master/manifest.json;https://cdn.jsdelivr.net/gh/josstorer/TheBloke@master/manifest.json;",
933
+ "settings": {
934
+ "apiChatModelName": "rwkv",
935
+ "apiCompletionModelName": "rwkv",
936
+ "apiKey": "sk-",
937
+ "apiUrl": "",
938
+ "autoUpdatesCheck": true,
939
+ "cnMirror": true,
940
+ "customModelsPath": "./models",
941
+ "customPythonPath": "",
942
+ "darkMode": true,
943
+ "dpiScaling": 100,
944
+ "giteeUpdatesSource": true,
945
+ "host": "0.0.0.0",
946
+ "language": "zh"
947
+ }
948
+ }