{ "currentModelConfigIndex": 28, "dataProcessParams": { "dataPath": "finetune/data/sample.jsonl", "vocabPath": "backend-python/rwkv_pip/rwkv_vocab_v20230424.txt" }, "loraFinetuneParams": { "accumGradBatches": 8, "adamEps": "1e-8", "baseModel": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth", "beta1": 0.9, "beta2": 0.999, "ctxLen": 1024, "devices": 1, "epochBegin": 0, "epochCount": 20, "epochSave": 2, "epochSteps": 200, "gradCp": false, "headQk": false, "loraAlpha": 32, "loraDropout": 0.01, "loraLoad": "", "loraR": 8, "lrFinal": "5e-5", "lrInit": "5e-5", "microBsz": 1, "preFfn": false, "precision": "bf16", "warmupSteps": 0 }, "modelConfigs": [ { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth", "precision": "int8", "storedLayers": 6, "useCustomCuda": true }, "name": "GPU-2G-3B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-0.1B-v1-20230520-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "GPU-2G-0.1B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "int8", "storedLayers": 4, "useCustomCuda": true }, "name": "GPU-2G-1B5-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-0.4B-v1-20230529-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "GPU-4G-0.4B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth", "precision": "fp32", "storedLayers": 8 }, "name": "GPU-4G-1B5-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "int8", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-4G-1B5-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth", "precision": "int8", "storedLayers": 24, "useCustomCuda": true }, "name": "GPU-4G-3B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "int8", "storedLayers": 24, "useCustomCuda": true }, "name": "GPU-4G-3B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth", "precision": "int8", "storedLayers": 24, "useCustomCuda": true }, "name": "GPU-4G-3B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth", "precision": "int8", "storedLayers": 8, "useCustomCuda": true }, "name": "GPU-4G-7B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth", "precision": "int8", "storedLayers": 8, "useCustomCuda": true }, "name": "GPU-4G-7B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth", "precision": "int8", "storedLayers": 8, "useCustomCuda": true }, "name": "GPU-4G-7B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "fp16", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-6G-1B5-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth", "precision": "int8", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-6G-3B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "int8", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-6G-3B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth", "precision": "int8", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-6G-3B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth", "precision": "int8", "storedLayers": 18, "useCustomCuda": true }, "name": "GPU-6G-7B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth", "precision": "int8", "storedLayers": 18, "useCustomCuda": true }, "name": "GPU-6G-7B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth", "precision": "int8", "storedLayers": 18, "useCustomCuda": true }, "name": "GPU-6G-7B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "GPU-8G-1B5-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth", "precision": "fp16", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-8G-3B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "fp16", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-8G-3B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth", "precision": "fp16", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-8G-3B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth", "precision": "int8", "storedLayers": 27, "useCustomCuda": true }, "name": "GPU-8G-7B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth", "precision": "int8", "storedLayers": 27, "useCustomCuda": true }, "name": "GPU-8G-7B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth", "precision": "int8", "storedLayers": 27, "useCustomCuda": true }, "name": "GPU-8G-7B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth", "precision": "int8", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-10G-7B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth", "precision": "int8", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-10G-7B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 6100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-claude-4-World-7B-20230805-ctx65k.pth", "precision": "int8", "storedLayers": 31, "useCustomCuda": true }, "name": "GPU-10G-7B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth", "precision": "int8", "storedLayers": 24, "useCustomCuda": true }, "name": "GPU-12G-14B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth", "precision": "fp16", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-16G-7B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth", "precision": "fp16", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-16G-7B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth", "precision": "fp16", "storedLayers": 32, "useCustomCuda": true }, "name": "GPU-16G-7B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth", "precision": "int8", "storedLayers": 37, "useCustomCuda": true }, "name": "GPU-16G-14B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth", "precision": "int8", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-18G-14B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth", "precision": "fp16", "storedLayers": 41, "useCustomCuda": true }, "name": "GPU-32G-14B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.8 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-MIDI-120M-v1-20230714-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-120M-Music" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.8 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-560M-Music" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-6G-1B5-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-6G-1B5-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-12G-3B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-12G-3B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-12G-3B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-World-7B-v1-20230626-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-28G-7B-World" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-28G-7B-EN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CPU", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth", "precision": "fp32", "storedLayers": 41 }, "name": "CPU-28G-7B-CN" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth", "precision": "int8", "storedLayers": 6, "useCustomCuda": true }, "name": "2023/9/2 09:30:41" }, { "apiParameters": { "apiPort": 8000, "frequencyPenalty": 1, "maxResponseToken": 4100, "presencePenalty": 0, "temperature": 1, "topP": 0.3 }, "modelParameters": { "device": "CUDA", "maxStoredLayers": 41, "modelName": "RWKV-4-World-3B-v1-20230619-ctx4096.pth", "precision": "int8", "storedLayers": 6, "useCustomCuda": true }, "name": "2023/9/2 11:47:17" } ], "modelSourceManifestList": "https://cdn.jsdelivr.net/gh/josstorer/RWKV-Runner@master/manifest.json;https://cdn.jsdelivr.net/gh/josstorer/TheBloke@master/manifest.json;", "settings": { "apiChatModelName": "rwkv", "apiCompletionModelName": "rwkv", "apiKey": "sk-", "apiUrl": "", "autoUpdatesCheck": true, "cnMirror": true, "customModelsPath": "./models", "customPythonPath": "", "darkMode": true, "dpiScaling": 100, "giteeUpdatesSource": true, "host": "0.0.0.0", "language": "zh" } }