RWKV-Runner/frontend/src/pages/defaultConfigs.ts
2023-11-07 19:27:21 +08:00

1308 lines
31 KiB
TypeScript

import { CompletionPreset } from '../types/completion';
import { ModelConfig } from '../types/configs';
/**
 * Default prompt text for composition.
 *
 * NOTE(review): the literal `<pad>` looks like a padding/placeholder token
 * expected by the composition model rather than human-readable text —
 * confirm against the consumer of this constant.
 */
export const defaultCompositionPrompt = '<pad>';
/**
 * Built-in completion presets, in display order: Writer, Translator, Catgirl,
 * Chinese Kongfu, Code Generation, Werewolf, Instruction, Blank.
 *
 * Every preset uses `maxResponseToken: 500`. The `stop`, `injectStart` and
 * `injectEnd` values hold a literal backslash followed by `n` (not a real
 * newline character); presumably the consumer unescapes them — confirm
 * against the code that reads these presets.
 */
export const defaultPresets: CompletionPreset[] = (() => {
  // Sampling profiles shared by several presets.
  const deterministic = { temperature: 1, topP: 0.3, presencePenalty: 0, frequencyPenalty: 1 };
  const storytelling = { temperature: 1.2, topP: 0.5, presencePenalty: 0.4, frequencyPenalty: 0.4 };

  // Stop / inject marker sets shared by several presets.
  const userAssistantTurns = { stop: '\\n\\nUser', injectStart: '\\n\\nAssistant: ', injectEnd: '\\n\\nUser: ' };
  const noMarkers = { stop: '', injectStart: '', injectEnd: '' };

  /** Assembles one preset; spreading gives each preset its own `params` object. */
  const makePreset = (
    name: string,
    prompt: string,
    sampling: { temperature: number; topP: number; presencePenalty: number; frequencyPenalty: number },
    markers: { stop: string; injectStart: string; injectEnd: string }
  ): CompletionPreset => ({
    name,
    prompt,
    params: { maxResponseToken: 500, ...sampling, ...markers }
  });

  return [
    makePreset(
      'Writer',
      'The following is an epic science fiction masterpiece that is immortalized, with delicate descriptions and grand depictions of interstellar civilization wars.\nChapter 1.\n',
      storytelling,
      { stop: '\\n\\nUser', injectStart: '', injectEnd: '' }
    ),
    makePreset(
      'Translator',
      'Translate this into Chinese.\n\nEnglish: What rooms do you have available?',
      deterministic,
      { stop: '\\n\\n', injectStart: '\\nChinese: ', injectEnd: '\\n\\nEnglish: ' }
    ),
    makePreset(
      'Catgirl',
      'The following is a conversation between a cat girl and her owner. The cat girl is a humanized creature that behaves like a cat but is humanoid. At the end of each sentence in the dialogue, she will add \"Meow~\". In the following content, User represents the owner and Assistant represents the cat girl.\n\nUser: Hello.\n\nAssistant: I\'m here, meow~.\n\nUser: Can you tell jokes?',
      storytelling,
      userAssistantTurns
    ),
    makePreset(
      'Chinese Kongfu',
      'User: 请你扮演一个文本冒险游戏,我是游戏主角。这是一个玄幻修真世界,有四大门派。我输入我的行动,请你显示行动结果,并具体描述环境。我的第一个行动是“醒来”,请开始故事。',
      { temperature: 1.1, topP: 0.7, presencePenalty: 0.3, frequencyPenalty: 0.3 },
      userAssistantTurns
    ),
    makePreset(
      'Code Generation',
      'def sum(',
      deterministic,
      { stop: '\\n\\n', injectStart: '', injectEnd: '' }
    ),
    makePreset(
      'Werewolf',
      'There is currently a game of Werewolf with six players, including a Seer (who can check identities at night), two Werewolves (who can choose someone to kill at night), a Bodyguard (who can choose someone to protect at night), two Villagers (with no special abilities), and a game host. User will play as Player 1, Assistant will play as Players 2-6 and the game host, and they will begin playing together. Every night, the host will ask User for his action and simulate the actions of the other players. During the day, the host will oversee the voting process and ask User for his vote. \n\nAssistant: Next, I will act as the game host and assign everyone their roles, including randomly assigning yours. Then, I will simulate the actions of Players 2-6 and let you know what happens each day. Based on your assigned role, you can tell me your actions and I will let you know the corresponding results each day.\n\nUser: Okay, I understand. Let\'s begin. Please assign me a role. Am I the Seer, Werewolf, Villager, or Bodyguard?\n\nAssistant: You are the Seer. Now that night has fallen, please choose a player to check his identity.\n\nUser: Tonight, I want to check Player 2 and find out his role.',
      { temperature: 1.2, topP: 0.4, presencePenalty: 0.5, frequencyPenalty: 0.5 },
      userAssistantTurns
    ),
    makePreset(
      'Instruction',
      'Instruction: Write a story using the following information\n\nInput: A man named Alex chops a tree down\n\nResponse:',
      deterministic,
      noMarkers
    ),
    makePreset('Blank', '', deterministic, noMarkers)
  ];
})();
/**
 * Model configuration presets of the Mac list: eight `MPS` entries (all
 * `fp32` with `customStrategy: 'mps fp32'`) followed by ten `CPU` entries.
 *
 * All entries share the same API parameters except `topP`, which is 0.8 for
 * the two MIDI ("Music") presets and 0.3 everywhere else. Each entry is built
 * with its own nested objects, so no two entries share the same object.
 */
export const defaultModelConfigsMac: ModelConfig[] = (() => {
  // Model weight file names referenced by the table below.
  const WORLD_0B1 = 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth';
  const WORLD_0B4 = 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth';
  const WORLD_1B5 = 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth';
  const WORLD_3B = 'RWKV-4-World-3B-v1-20230619-ctx4096.pth';
  const WORLD_7B = 'RWKV-4-World-7B-v1-20230626-ctx4096.pth';
  const WORLD_CN_3B = 'RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth';
  const WORLD_CN_7B = 'RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth';
  const RAVEN_1B5 = 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth';
  const RAVEN_3B = 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth';
  const RAVEN_7B = 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth';
  const MIDI_120M = 'RWKV-4-MIDI-120M-v1-20230714-ctx4096.pth';
  const MIDI_560M = 'RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth';

  /** Returns a new API parameter object; only `topP` varies between presets. */
  const apiParams = (topP: number) => ({
    apiPort: 8000,
    maxResponseToken: 4100,
    temperature: 1.0,
    topP,
    presencePenalty: 0,
    frequencyPenalty: 1
  });

  /** MPS preset: fp32, 41 of 41 stored layers, custom strategy 'mps fp32'. */
  const onMps = (name: string, modelName: string): ModelConfig => ({
    name,
    apiParameters: apiParams(0.3),
    modelParameters: {
      modelName,
      device: 'MPS',
      precision: 'fp32',
      storedLayers: 41,
      maxStoredLayers: 41,
      customStrategy: 'mps fp32'
    }
  });

  /** CPU preset: fp32, 41 of 41 stored layers, no custom strategy key. */
  const onCpu = (name: string, modelName: string, topP: number = 0.3): ModelConfig => ({
    name,
    apiParameters: apiParams(topP),
    modelParameters: {
      modelName,
      device: 'CPU',
      precision: 'fp32',
      storedLayers: 41,
      maxStoredLayers: 41
    }
  });

  return [
    onMps('MAC-0.1B-World', WORLD_0B1),
    onMps('MAC-0.4B-World', WORLD_0B4),
    onMps('MAC-1B5-World', WORLD_1B5),
    onMps('MAC-1B5-EN', RAVEN_1B5),
    onMps('MAC-3B-World', WORLD_3B),
    onMps('MAC-3B-EN', RAVEN_3B),
    onMps('MAC-3B-CN', WORLD_CN_3B),
    onMps('MAC-7B-World', WORLD_7B),
    onCpu('CPU-120M-Music', MIDI_120M, 0.8),
    onCpu('CPU-560M-Music', MIDI_560M, 0.8),
    onCpu('CPU-6G-1B5-World', WORLD_1B5),
    onCpu('CPU-6G-1B5-EN', RAVEN_1B5),
    onCpu('CPU-12G-3B-World', WORLD_3B),
    onCpu('CPU-12G-3B-EN', RAVEN_3B),
    onCpu('CPU-12G-3B-CN', WORLD_CN_3B),
    onCpu('CPU-28G-7B-World', WORLD_7B),
    onCpu('CPU-28G-7B-EN', RAVEN_7B),
    onCpu('CPU-28G-7B-CN', WORLD_CN_7B)
  ];
})();
/**
 * Default model configuration presets: 36 `CUDA` entries followed by ten
 * `CPU` entries. The first entry is `GPU-2G-3B-World`.
 *
 * All entries share the same API parameters except `topP`, which is 0.8 for
 * the two MIDI ("Music") presets and 0.3 everywhere else. CUDA presets using
 * `int8` or `fp16` carry `useCustomCuda: true`; the `fp32` CUDA presets and
 * all CPU presets do not have that key at all. Each entry is built with its
 * own nested objects, so no two entries share the same object.
 */
export const defaultModelConfigs: ModelConfig[] = (() => {
  // Model weight file names referenced by the table below.
  const WORLD_0B1 = 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth';
  const WORLD_0B4 = 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth';
  const WORLD_1B5 = 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth';
  const WORLD_3B = 'RWKV-4-World-3B-v1-20230619-ctx4096.pth';
  const WORLD_7B = 'RWKV-4-World-7B-v1-20230626-ctx4096.pth';
  const WORLD_CN_3B = 'RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth';
  const WORLD_CN_7B = 'RWKV-4-World-CHNtuned-7B-v1-20230709-ctx4096.pth';
  const RAVEN_1B5 = 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth';
  const RAVEN_3B = 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth';
  const RAVEN_7B = 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth';
  const RAVEN_14B = 'RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth';
  const MIDI_120M = 'RWKV-4-MIDI-120M-v1-20230714-ctx4096.pth';
  const MIDI_560M = 'RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth';

  /** Returns a new API parameter object; only `topP` varies between presets. */
  const apiParams = (topP: number) => ({
    apiPort: 8000,
    maxResponseToken: 4100,
    temperature: 1.0,
    topP,
    presencePenalty: 0,
    frequencyPenalty: 1
  });

  /** CUDA preset with `useCustomCuda: true` (used for int8 / fp16 entries). */
  const cudaKernel = (
    name: string,
    modelName: string,
    precision: 'int8' | 'fp16',
    storedLayers: number
  ): ModelConfig => ({
    name,
    apiParameters: apiParams(0.3),
    modelParameters: {
      modelName,
      device: 'CUDA',
      precision,
      storedLayers,
      maxStoredLayers: 41,
      useCustomCuda: true
    }
  });

  /** CUDA preset in fp32 without the `useCustomCuda` key. */
  const cudaFp32 = (name: string, modelName: string, storedLayers: number): ModelConfig => ({
    name,
    apiParameters: apiParams(0.3),
    modelParameters: {
      modelName,
      device: 'CUDA',
      precision: 'fp32',
      storedLayers,
      maxStoredLayers: 41
    }
  });

  /** CPU preset: fp32, 41 of 41 stored layers. */
  const onCpu = (name: string, modelName: string, topP: number = 0.3): ModelConfig => ({
    name,
    apiParameters: apiParams(topP),
    modelParameters: {
      modelName,
      device: 'CPU',
      precision: 'fp32',
      storedLayers: 41,
      maxStoredLayers: 41
    }
  });

  return [
    cudaKernel('GPU-2G-3B-World', WORLD_3B, 'int8', 6),
    // fp32 on purpose: per the original author's note, using fp16 will disable state cache.
    cudaFp32('GPU-2G-0.1B-World', WORLD_0B1, 41),
    cudaKernel('GPU-2G-1B5-EN', RAVEN_1B5, 'int8', 4),
    cudaFp32('GPU-4G-0.4B-World', WORLD_0B4, 41),
    cudaFp32('GPU-4G-1B5-World', WORLD_1B5, 8),
    cudaKernel('GPU-4G-1B5-EN', RAVEN_1B5, 'int8', 41),
    cudaKernel('GPU-4G-3B-World', WORLD_3B, 'int8', 24),
    cudaKernel('GPU-4G-3B-EN', RAVEN_3B, 'int8', 24),
    cudaKernel('GPU-4G-3B-CN', WORLD_CN_3B, 'int8', 24),
    cudaKernel('GPU-4G-7B-World', WORLD_7B, 'int8', 8),
    cudaKernel('GPU-4G-7B-EN', RAVEN_7B, 'int8', 8),
    cudaKernel('GPU-4G-7B-CN', WORLD_CN_7B, 'int8', 8),
    cudaKernel('GPU-6G-1B5-EN', RAVEN_1B5, 'fp16', 41),
    cudaKernel('GPU-6G-3B-World', WORLD_3B, 'int8', 41),
    cudaKernel('GPU-6G-3B-EN', RAVEN_3B, 'int8', 41),
    cudaKernel('GPU-6G-3B-CN', WORLD_CN_3B, 'int8', 41),
    cudaKernel('GPU-6G-7B-World', WORLD_7B, 'int8', 18),
    cudaKernel('GPU-6G-7B-EN', RAVEN_7B, 'int8', 18),
    cudaKernel('GPU-6G-7B-CN', WORLD_CN_7B, 'int8', 18),
    cudaFp32('GPU-8G-1B5-World', WORLD_1B5, 41),
    cudaKernel('GPU-8G-3B-World', WORLD_3B, 'fp16', 41),
    cudaKernel('GPU-8G-3B-EN', RAVEN_3B, 'fp16', 41),
    cudaKernel('GPU-8G-3B-CN', WORLD_CN_3B, 'fp16', 41),
    cudaKernel('GPU-8G-7B-World', WORLD_7B, 'int8', 27),
    cudaKernel('GPU-8G-7B-EN', RAVEN_7B, 'int8', 27),
    cudaKernel('GPU-8G-7B-CN', WORLD_CN_7B, 'int8', 27),
    cudaKernel('GPU-10G-7B-World', WORLD_7B, 'int8', 41),
    cudaKernel('GPU-10G-7B-EN', RAVEN_7B, 'int8', 41),
    cudaKernel('GPU-10G-7B-CN', WORLD_CN_7B, 'int8', 41),
    cudaKernel('GPU-12G-14B-EN', RAVEN_14B, 'int8', 24),
    cudaKernel('GPU-16G-7B-World', WORLD_7B, 'fp16', 41),
    cudaKernel('GPU-16G-7B-EN', RAVEN_7B, 'fp16', 41),
    cudaKernel('GPU-16G-7B-CN', WORLD_CN_7B, 'fp16', 41),
    cudaKernel('GPU-16G-14B-EN', RAVEN_14B, 'int8', 37),
    cudaKernel('GPU-18G-14B-EN', RAVEN_14B, 'int8', 41),
    cudaKernel('GPU-32G-14B-EN', RAVEN_14B, 'fp16', 41),
    onCpu('CPU-120M-Music', MIDI_120M, 0.8),
    onCpu('CPU-560M-Music', MIDI_560M, 0.8),
    onCpu('CPU-6G-1B5-World', WORLD_1B5),
    onCpu('CPU-6G-1B5-EN', RAVEN_1B5),
    onCpu('CPU-12G-3B-World', WORLD_3B),
    onCpu('CPU-12G-3B-EN', RAVEN_3B),
    onCpu('CPU-12G-3B-CN', WORLD_CN_3B),
    onCpu('CPU-28G-7B-World', WORLD_7B),
    onCpu('CPU-28G-7B-EN', RAVEN_7B),
    onCpu('CPU-28G-7B-CN', WORLD_CN_7B)
  ];
})();