diff --git a/frontend/src/pages/defaultConfigs.ts b/frontend/src/pages/defaultConfigs.ts index 6bd0dca..a4b7aed 100644 --- a/frontend/src/pages/defaultConfigs.ts +++ b/frontend/src/pages/defaultConfigs.ts @@ -111,7 +111,7 @@ export const defaultPresets: CompletionPreset[] = [{ export const defaultModelConfigsMac: ModelConfig[] = [ { - name: 'MAC-0.1B-World', + name: 'GPU-2G-1B5-World', apiParameters: { apiPort: 8000, maxResponseToken: 4100, @@ -121,16 +121,15 @@ export const defaultModelConfigsMac: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth', - device: 'MPS', - precision: 'fp32', + modelName: 'RWKV-5-World-1B5-v2-20231025-ctx4096.pth', + device: 'WebGPU', + precision: 'nf4', storedLayers: 41, - maxStoredLayers: 41, - customStrategy: 'mps fp32' + maxStoredLayers: 41 } }, { - name: 'MAC-0.4B-World', + name: 'GPU-4G-3B-World', apiParameters: { apiPort: 8000, maxResponseToken: 4100, @@ -140,12 +139,101 @@ export const defaultModelConfigsMac: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth', - device: 'MPS', + modelName: 'RWKV-5-World-3B-v2-20231118-ctx16k.pth', + device: 'WebGPU', + precision: 'nf4', + storedLayers: 41, + maxStoredLayers: 41 + } + }, + { + name: 'GPU-4G-3B-CN', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.0, + topP: 0.3, + presencePenalty: 0, + frequencyPenalty: 1 + }, + modelParameters: { + modelName: 'RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth', + device: 'WebGPU', + precision: 'nf4', + storedLayers: 41, + maxStoredLayers: 41 + } + }, + { + name: 'GPU-7G-7B-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.0, + topP: 0.3, + presencePenalty: 0, + frequencyPenalty: 1 + }, + modelParameters: { + modelName: 'RWKV-4-World-7B-v1-20230626-ctx4096.pth', + device: 'WebGPU', + precision: 'nf4', + storedLayers: 41, + maxStoredLayers: 41 + } + }, + { + name: 'GPU-7G-7B-CN', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.0, + topP: 0.3, + presencePenalty: 0, + frequencyPenalty: 1 + }, + modelParameters: { + modelName: 'RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth', + device: 'WebGPU', + precision: 'nf4', + storedLayers: 41, + maxStoredLayers: 41 + } + }, + { + name: 'CPU-120M-Music', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.0, + topP: 0.8, + presencePenalty: 0, + frequencyPenalty: 1 + }, + modelParameters: { + modelName: 'RWKV-4-MIDI-120M-v1-20230714-ctx4096.pth', + device: 'CPU', precision: 'fp32', storedLayers: 41, - maxStoredLayers: 41, - customStrategy: 'mps fp32' + maxStoredLayers: 41 + } + }, + { + name: 'CPU-560M-Music', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.0, + topP: 0.8, + presencePenalty: 0, + frequencyPenalty: 1 + }, + modelParameters: { + modelName: 'RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth', + device: 'CPU', + precision: 'fp32', + storedLayers: 41, + maxStoredLayers: 41 } }, { @@ -159,26 +247,7 @@ export const defaultModelConfigsMac: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', - device: 'MPS', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41, - customStrategy: 'mps fp32' - } - }, - { - name: 'MAC-1B5-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth', + modelName: 'RWKV-5-World-1B5-v2-20231025-ctx4096.pth', device: 'MPS', precision: 'fp32', storedLayers: 41, @@ -197,26 +266,7 @@ export const defaultModelConfigsMac: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth', - device: 'MPS', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41, - customStrategy: 'mps fp32' - } - }, - { - name: 'MAC-3B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth', + modelName: 'RWKV-5-World-3B-v2-20231118-ctx16k.pth', device: 'MPS', precision: 'fp32', storedLayers: 41, @@ -261,190 +311,29 @@ export const defaultModelConfigsMac: ModelConfig[] = [ maxStoredLayers: 41, customStrategy: 'mps fp32' } - }, - { - name: 'CPU-120M-Music', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.8, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-MIDI-120M-v1-20230714-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-560M-Music', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.8, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-6G-1B5-World', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-6G-1B5-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-12G-3B-World', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-12G-3B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-12G-3B-CN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-28G-7B-World', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-7B-v1-20230626-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-28G-7B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-28G-7B-CN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } } ]; export const defaultModelConfigs: ModelConfig[] = [ + { + name: 'GPU-2G-1B5-World', + apiParameters: { + apiPort: 8000, + maxResponseToken: 4100, + temperature: 1.0, + topP: 0.3, + presencePenalty: 0, + frequencyPenalty: 1 + }, + modelParameters: { + modelName: 'RWKV-5-World-1B5-v2-20231025-ctx4096.pth', + device: 'CUDA', + precision: 'int8', + storedLayers: 41, + maxStoredLayers: 41, + useCustomCuda: true + } + }, { name: 'GPU-2G-3B-World', apiParameters: { @@ -456,7 +345,7 @@ export const defaultModelConfigs: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth', + modelName: 'RWKV-5-World-3B-v2-20231118-ctx16k.pth', device: 'CUDA', precision: 'int8', storedLayers: 6, @@ -464,61 +353,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-2G-0.1B-World', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth', - device: 'CUDA', - precision: 'fp32', // using fp16 will disable state cache (->) - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'GPU-2G-1B5-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 4, - maxStoredLayers: 41, - useCustomCuda: true - } - }, - { - name: 'GPU-4G-0.4B-World', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth', - device: 'CUDA', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, { name: 'GPU-4G-1B5-World', apiParameters: { @@ -530,27 +364,9 @@ export const defaultModelConfigs: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', + modelName: 'RWKV-5-World-1B5-v2-20231025-ctx4096.pth', device: 'CUDA', - precision: 'fp32', - storedLayers: 8, - maxStoredLayers: 41 - } - }, - { - name: 'GPU-4G-1B5-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth', - device: 'CUDA', - precision: 'int8', + precision: 'fp16', storedLayers: 41, maxStoredLayers: 41, useCustomCuda: true @@ -567,26 +383,7 @@ export const defaultModelConfigs: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 24, - maxStoredLayers: 41, - useCustomCuda: true - } - }, - { - name: 'GPU-4G-3B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth', + modelName: 'RWKV-5-World-3B-v2-20231118-ctx16k.pth', device: 'CUDA', precision: 'int8', storedLayers: 24, @@ -632,25 +429,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-4G-7B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 8, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'GPU-4G-7B-CN', apiParameters: { @@ -670,25 +448,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-6G-1B5-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth', - device: 'CUDA', - precision: 'fp16', - storedLayers: 41, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'GPU-6G-3B-World', apiParameters: { @@ -700,26 +459,7 @@ export const defaultModelConfigs: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 41, - maxStoredLayers: 41, - useCustomCuda: true - } - }, - { - name: 'GPU-6G-3B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth', + modelName: 'RWKV-5-World-3B-v2-20231118-ctx16k.pth', device: 'CUDA', precision: 'int8', storedLayers: 41, @@ -765,25 +505,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-6G-7B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 18, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'GPU-6G-7B-CN', apiParameters: { @@ -803,24 +524,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-8G-1B5-World', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', - device: 'CUDA', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, { name: 'GPU-8G-3B-World', apiParameters: { @@ -832,26 +535,7 @@ export const defaultModelConfigs: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth', - device: 'CUDA', - precision: 'fp16', - storedLayers: 41, - maxStoredLayers: 41, - useCustomCuda: true - } - }, - { - name: 'GPU-8G-3B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth', + modelName: 'RWKV-5-World-3B-v2-20231118-ctx16k.pth', device: 'CUDA', precision: 'fp16', storedLayers: 41, @@ -897,25 +581,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-8G-7B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 27, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'GPU-8G-7B-CN', apiParameters: { @@ -954,25 +619,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-10G-7B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 41, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'GPU-10G-7B-CN', apiParameters: { @@ -992,25 +638,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-12G-14B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 24, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'GPU-16G-7B-World', apiParameters: { @@ -1030,25 +657,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-16G-7B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth', - device: 'CUDA', - precision: 'fp16', - storedLayers: 41, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'GPU-16G-7B-CN', apiParameters: { @@ -1068,63 +676,6 @@ export const defaultModelConfigs: ModelConfig[] = [ useCustomCuda: true } }, - { - name: 'GPU-16G-14B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 37, - maxStoredLayers: 41, - useCustomCuda: true - } - }, - { - name: 'GPU-18G-14B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth', - device: 'CUDA', - precision: 'int8', - storedLayers: 41, - maxStoredLayers: 41, - useCustomCuda: true - } - }, - { - name: 'GPU-32G-14B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth', - device: 'CUDA', - precision: 'fp16', - storedLayers: 41, - maxStoredLayers: 41, - useCustomCuda: true - } - }, { name: 'CPU-120M-Music', apiParameters: { @@ -1162,7 +713,7 @@ export const defaultModelConfigs: ModelConfig[] = [ } }, { - name: 'CPU-6G-1B5-World', + name: 'AnyGPU-2G-1B5-World', apiParameters: { apiPort: 8000, maxResponseToken: 4100, @@ -1172,15 +723,15 @@ export const defaultModelConfigs: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth', - device: 'CPU', - precision: 'fp32', + modelName: 'RWKV-5-World-1B5-v2-20231025-ctx4096.pth', + device: 'WebGPU', + precision: 'nf4', storedLayers: 41, maxStoredLayers: 41 } }, { - name: 'CPU-6G-1B5-EN', + name: 'AnyGPU-4G-3B-World', apiParameters: { apiPort: 8000, maxResponseToken: 4100, @@ -1190,51 +741,15 @@ export const defaultModelConfigs: ModelConfig[] = [ frequencyPenalty: 1 }, modelParameters: { - modelName: 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth', - device: 'CPU', - precision: 'fp32', + modelName: 'RWKV-5-World-3B-v2-20231118-ctx16k.pth', + device: 'WebGPU', + precision: 'nf4', storedLayers: 41, maxStoredLayers: 41 } }, { - name: 'CPU-12G-3B-World', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-12G-3B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-12G-3B-CN', + name: 'AnyGPU-4G-3B-CN', apiParameters: { apiPort: 8000, maxResponseToken: 4100, @@ -1245,14 +760,14 @@ export const defaultModelConfigs: ModelConfig[] = [ }, modelParameters: { modelName: 'RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth', - device: 'CPU', - precision: 'fp32', + device: 'WebGPU', + precision: 'nf4', storedLayers: 41, maxStoredLayers: 41 } }, { - name: 'CPU-28G-7B-World', + name: 'AnyGPU-7G-7B-World', apiParameters: { apiPort: 8000, maxResponseToken: 4100, @@ -1263,32 +778,14 @@ export const defaultModelConfigs: ModelConfig[] = [ }, modelParameters: { modelName: 'RWKV-4-World-7B-v1-20230626-ctx4096.pth', - device: 'CPU', - precision: 'fp32', + device: 'WebGPU', + precision: 'nf4', storedLayers: 41, maxStoredLayers: 41 } }, { - name: 'CPU-28G-7B-EN', - apiParameters: { - apiPort: 8000, - maxResponseToken: 4100, - temperature: 1.0, - topP: 0.3, - presencePenalty: 0, - frequencyPenalty: 1 - }, - modelParameters: { - modelName: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth', - device: 'CPU', - precision: 'fp32', - storedLayers: 41, - maxStoredLayers: 41 - } - }, - { - name: 'CPU-28G-7B-CN', + name: 'AnyGPU-7G-7B-CN', apiParameters: { apiPort: 8000, maxResponseToken: 4100, @@ -1299,8 +796,8 @@ export const defaultModelConfigs: ModelConfig[] = [ }, modelParameters: { modelName: 'RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth', - device: 'CPU', - precision: 'fp32', + device: 'WebGPU', + precision: 'nf4', storedLayers: 41, maxStoredLayers: 41 }