diff --git a/frontend/src/pages/defaultModelConfigs.ts b/frontend/src/pages/defaultModelConfigs.ts index 9e30b11..0186130 100644 --- a/frontend/src/pages/defaultModelConfigs.ts +++ b/frontend/src/pages/defaultModelConfigs.ts @@ -1,6 +1,63 @@ import { ModelConfig } from './Configs'; export const defaultModelConfigsMac: ModelConfig[] = [ + { + name: 'MAC-0.1B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth', + device: 'MPS', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41, + customStrategy: 'mps fp32' + } + }, + { + name: 'MAC-0.4B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth', + device: 'MPS', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41, + customStrategy: 'mps fp32' + } + }, + { + name: 'MAC-1B5-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', + device: 'MPS', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41, + customStrategy: 'mps fp32' + } + }, { name: 'MAC-1B5-EN', apiParameters: { @@ -17,7 +74,25 @@ export const defaultModelConfigsMac: ModelConfig[] = [ precision: 'fp32', storedLayers: 41, maxStoredLayers: 41, - useCustomCuda: false, + customStrategy: 'mps fp32' + } + }, + { + name: 'MAC-3B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth', + device: 'MPS', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41, customStrategy: 'mps fp32' } }, @@ -37,7 +112,6 @@ export const defaultModelConfigsMac: ModelConfig[] = [ precision: 'fp32', storedLayers: 41, maxStoredLayers: 41, - useCustomCuda: false, customStrategy: 'mps fp32' } }, @@ -57,10 +131,46 @@ export const defaultModelConfigsMac: ModelConfig[] = [ precision: 'fp32', storedLayers: 41, maxStoredLayers: 41, - useCustomCuda: false, customStrategy: 'mps fp32' } }, + { + name: 'MAC-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'MPS', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41, + customStrategy: 'mps fp32' + } + }, + { + name: 'CPU-6G-1B5-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', + device: 'CPU', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, { name: 'CPU-6G-1B5-EN', apiParameters: { @@ -79,6 +189,24 @@ export const defaultModelConfigsMac: ModelConfig[] = [ maxStoredLayers: 41 } }, + { + name: 'CPU-12G-3B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth', + device: 'CPU', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, { name: 'CPU-12G-3B-EN', apiParameters: { @@ -115,6 +243,24 @@ export const defaultModelConfigsMac: ModelConfig[] = [ maxStoredLayers: 41 } }, + { + name: 'CPU-28G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'CPU', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, { name: 'CPU-28G-7B-EN', apiParameters: { @@ -154,6 +300,24 @@ export const defaultModelConfigsMac: ModelConfig[] = [ ]; export const defaultModelConfigs: ModelConfig[] = [ + { + name: 'GPU-2G-0.1B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth', + device: 'CUDA', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, { name: 'GPU-2G-1B5-EN', apiParameters: { @@ -173,6 +337,42 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-4G-0.4B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth', + device: 'CUDA', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, + { + name: 'GPU-4G-1B5-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', + device: 'CUDA', + precision: 'fp32', + storedLayers: 8, + maxStoredLayers: 41 + } + }, { name: 'GPU-4G-1B5-EN', apiParameters: { @@ -192,6 +392,25 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-4G-3B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth', + device: 'CUDA', + precision: 'int8', + storedLayers: 24, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-4G-3B-EN', apiParameters: { @@ -230,6 +449,25 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-4G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'CUDA', + precision: 'int8', + storedLayers: 8, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-4G-7B-EN', apiParameters: { @@ -287,6 +525,25 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-6G-3B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth', + device: 'CUDA', + precision: 'int8', + storedLayers: 41, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-6G-3B-EN', apiParameters: { @@ -325,6 +582,25 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-6G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'CUDA', + precision: 'int8', + storedLayers: 18, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-6G-7B-EN', apiParameters: { @@ -363,6 +639,43 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-8G-1B5-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', + device: 'CUDA', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, + { + name: 'GPU-8G-3B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth', + device: 'CUDA', + precision: 'fp16', + storedLayers: 41, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-8G-3B-EN', apiParameters: { @@ -401,6 +714,25 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-8G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'CUDA', + precision: 'int8', + storedLayers: 27, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-8G-7B-EN', apiParameters: { @@ -439,6 +771,25 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-10G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'CUDA', + precision: 'int8', + storedLayers: 41, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-10G-7B-EN', apiParameters: { @@ -496,6 +847,25 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'GPU-16G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'CUDA', + precision: 'fp16', + storedLayers: 41, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-16G-7B-EN', apiParameters: { @@ -591,6 +961,24 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, + { + name: 'CPU-6G-1B5-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', + device: 'CPU', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, { name: 'CPU-6G-1B5-EN', apiParameters: { @@ -609,6 +997,24 @@ export const defaultModelConfigs: ModelConfig[] = [ maxStoredLayers: 41 } }, + { + name: 'CPU-12G-3B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth', + device: 'CPU', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, { name: 'CPU-12G-3B-EN', apiParameters: { @@ -645,6 +1051,24 @@ export const defaultModelConfigs: ModelConfig[] = [ maxStoredLayers: 41 } }, + { + name: 'CPU-28G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.2, + topP: 0.5, + presencePenalty: 0.4, + frequencyPenalty: 0.4 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth', + device: 'CPU', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 + } + }, { name: 'CPU-28G-7B-EN', apiParameters: { diff --git a/manifest.json b/manifest.json index 915733b..352aae8 100644 --- a/manifest.json +++ b/manifest.json @@ -75,7 +75,20 @@ "SHA256": "05bad4ab0ce41250064153d5352587b83215a82eb50134489675129bd4ad1087", "lastUpdated": "2023-06-07T09:33:32", "url": "https://huggingface.co/BlinkDL/rwkv-4-world/blob/main/RWKV-4-World-1.5B-v1-20230607-ctx4096.pth", - "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-1.5B-v1-20230607-ctx4096.pth" + "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-1.5B-v1-20230607-ctx4096.pth", + "hide": true + }, + { + "name": "RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth", + "desc": { + "en": "100+ Languages 1.5B v1 fixed", + "zh": "100+ 语言 1.5B v1 修复" + }, + "size": 3155281586, + "SHA256": "71f0c3229f9227cbcb8ae5fee6461197129a57e26366c4d23a49058417b046c9", + "lastUpdated": "2023-06-12T06:31:32", + "url": "https://huggingface.co/BlinkDL/rwkv-4-world/blob/main/RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth", + "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth" }, { "name": "RWKV-4-World-3B-v1-OnlyForTest_35%_trained-20230529-ctx4096.pth", @@ -113,7 +126,20 @@ "SHA256": "49e8675e09e0786ca12a554442c37b9e809ed93e9211af937cd149968a6b81e9", "lastUpdated": "2023-06-07T09:33:32", "url": "https://huggingface.co/BlinkDL/rwkv-4-world/blob/main/RWKV-4-World-3B-v1-OnlyForTest_64%25_trained-20230607-ctx4096.pth", - "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-3B-v1-OnlyForTest_64%25_trained-20230607-ctx4096.pth" + "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-3B-v1-OnlyForTest_64%25_trained-20230607-ctx4096.pth", + "hide": true + }, + { + "name": "RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth", + "desc": { + "en": "100+ Languages 3B v1 Test", + "zh": "100+ 语言 3B v1 测试" + }, + "size": 6125597613, + "SHA256": "3bb10caf3017871435d83f39facc8a729fd774020390153470f004eb3ef645bd", + "lastUpdated": "2023-06-12T06:31:32", + "url": "https://huggingface.co/BlinkDL/rwkv-4-world/blob/main/RWKV-4-World-3B-v1-OnlyForTest_80%25_trained-20230612-ctx4096.pth", + "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-3B-v1-OnlyForTest_80%25_trained-20230612-ctx4096.pth" }, { "name": "RWKV-4-World-7B-v1-OnlyForTest_30%_trained-20230529-ctx4096.pth", @@ -151,7 +177,20 @@ "SHA256": "636405626eadbab230e1a7dc2855bb6244e09b5850547dda7103f650b4849de7", "lastUpdated": "2023-06-06T14:21:31", "url": "https://huggingface.co/BlinkDL/rwkv-4-world/blob/main/RWKV-4-World-7B-v1-OnlyForTest_52%25_trained-20230606-ctx4096.pth", - "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-7B-v1-OnlyForTest_52%25_trained-20230606-ctx4096.pth" + "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-7B-v1-OnlyForTest_52%25_trained-20230606-ctx4096.pth", + "hide": true + }, + { + "name": "RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth", + "desc": { + "en": "100+ Languages 7B v1 Test", + "zh": "100+ 语言 7B v1 测试" + }, + "size": 15035393581, + "SHA256": "8039be276f555318a5b2e9ad82b9d70001c12bd2e3e668048615fc7b09d5d9a4", + "lastUpdated": "2023-06-11T01:58:29", + "url": "https://huggingface.co/BlinkDL/rwkv-4-world/blob/main/RWKV-4-World-7B-v1-OnlyForTest_64%25_trained-20230610-ctx4096.pth", + "downloadUrl": "https://huggingface.co/BlinkDL/rwkv-4-world/resolve/main/RWKV-4-World-7B-v1-OnlyForTest_64%25_trained-20230610-ctx4096.pth" }, { "name": "RWKV-4-Novel-7B-v1-ChnEng-ChnPro-20230410-ctx4096.pth",