// Default model configuration presets: a Mac list (MPS and CPU entries) and a general list (CUDA and CPU entries).
import { ModelConfig } from './Configs';
/** Shape of the `modelParameters` section of a {@link ModelConfig}. */
type PresetModelParameters = ModelConfig['modelParameters'];

/**
 * Model weight file names referenced by the presets below.
 *
 * Every file name is spelled out exactly once here so that all presets using
 * the same model stay in sync when a file name is updated.
 */
const MODEL_FILES = {
  world0B1: 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth',
  world0B4: 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth',
  world1B5: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth',
  world3B: 'RWKV-4-World-3B-v1-20230619-ctx4096.pth',
  world3BCn: 'RWKV-4-World-CHNtuned-3B-v1-20230625-ctx4096.pth',
  world7B: 'RWKV-4-World-7B-v1-20230626-ctx4096.pth',
  raven1B5En: 'RWKV-4-Raven-1B5-v12-Eng98%-Other2%-20230520-ctx4096.pth',
  raven3BEn: 'RWKV-4-Raven-3B-v12-Eng98%-Other2%-20230520-ctx4096.pth',
  raven7BEn: 'RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth',
  raven7BCn: 'RWKV-4-Raven-7B-v12-Eng49%-Chn49%-Jpn1%-Other1%-20230530-ctx8192.pth',
  raven14BEn: 'RWKV-4-Raven-14B-v12-Eng98%-Other2%-20230523-ctx8192.pth'
} as const;

/**
 * Builds one preset entry.
 *
 * All presets in this file use the same API parameter values, so they are
 * written once here. A fresh `apiParameters` object is created on every call,
 * which keeps the entries independent of each other if one is mutated later.
 *
 * @param name Preset name stored in the entry's `name` field.
 * @param modelParameters Model section of the entry, stored as given.
 * @returns A new preset entry.
 */
function createPreset(name: string, modelParameters: PresetModelParameters): ModelConfig {
  return {
    name,
    apiParameters: {
      apiPort: 8000,
      maxResponseToken: 4100,
      temperature: 1.2,
      topP: 0.5,
      presencePenalty: 0.4,
      frequencyPenalty: 0.4
    },
    modelParameters
  };
}

/**
 * Builds an MPS preset: fp32, 41 of 41 stored layers, and the custom strategy
 * string `'mps fp32'`.
 */
function macPreset(name: string, modelName: string): ModelConfig {
  return createPreset(name, {
    modelName,
    device: 'MPS',
    precision: 'fp32',
    storedLayers: 41,
    maxStoredLayers: 41,
    customStrategy: 'mps fp32'
  });
}

/**
 * Builds a CUDA preset with `useCustomCuda: true`.
 *
 * Used for every int8 and fp16 CUDA entry in this file; fp32 CUDA entries are
 * built with {@link cudaFp32Preset} instead because they carry no
 * `useCustomCuda` key.
 */
function cudaPreset(
  name: string,
  modelName: string,
  precision: PresetModelParameters['precision'],
  storedLayers: number
): ModelConfig {
  return createPreset(name, {
    modelName,
    device: 'CUDA',
    precision,
    storedLayers,
    maxStoredLayers: 41,
    useCustomCuda: true
  });
}

/** Builds an fp32 CUDA preset; these entries do not set `useCustomCuda`. */
function cudaFp32Preset(name: string, modelName: string, storedLayers: number): ModelConfig {
  return createPreset(name, {
    modelName,
    device: 'CUDA',
    precision: 'fp32',
    storedLayers,
    maxStoredLayers: 41
  });
}

/** Builds a CPU preset: fp32 with 41 of 41 stored layers. */
function cpuPreset(name: string, modelName: string): ModelConfig {
  return createPreset(name, {
    modelName,
    device: 'CPU',
    precision: 'fp32',
    storedLayers: 41,
    maxStoredLayers: 41
  });
}

/**
 * Returns the CPU presets that close both exported lists.
 *
 * A new array of new objects is produced on each call so the two exported
 * lists never share entry objects.
 */
function cpuPresets(): ModelConfig[] {
  return [
    cpuPreset('CPU-6G-1B5-World', MODEL_FILES.world1B5),
    cpuPreset('CPU-6G-1B5-EN', MODEL_FILES.raven1B5En),
    cpuPreset('CPU-12G-3B-World', MODEL_FILES.world3B),
    cpuPreset('CPU-12G-3B-EN', MODEL_FILES.raven3BEn),
    cpuPreset('CPU-12G-3B-CN', MODEL_FILES.world3BCn),
    cpuPreset('CPU-28G-7B-World', MODEL_FILES.world7B),
    cpuPreset('CPU-28G-7B-EN', MODEL_FILES.raven7BEn),
    cpuPreset('CPU-28G-7B-CN', MODEL_FILES.raven7BCn)
  ];
}

/** Default presets for Mac: the MPS entries followed by the CPU entries. */
export const defaultModelConfigsMac: ModelConfig[] = [
  macPreset('MAC-0.1B-World', MODEL_FILES.world0B1),
  macPreset('MAC-0.4B-World', MODEL_FILES.world0B4),
  macPreset('MAC-1B5-World', MODEL_FILES.world1B5),
  macPreset('MAC-1B5-EN', MODEL_FILES.raven1B5En),
  macPreset('MAC-3B-World', MODEL_FILES.world3B),
  macPreset('MAC-3B-EN', MODEL_FILES.raven3BEn),
  macPreset('MAC-3B-CN', MODEL_FILES.world3BCn),
  macPreset('MAC-7B-World', MODEL_FILES.world7B),
  ...cpuPresets()
];

/** Default presets: the CUDA entries followed by the CPU entries. */
export const defaultModelConfigs: ModelConfig[] = [
  cudaPreset('GPU-2G-3B-World', MODEL_FILES.world3B, 'int8', 6),
  cudaFp32Preset('GPU-2G-0.1B-World', MODEL_FILES.world0B1, 41),
  cudaPreset('GPU-2G-1B5-EN', MODEL_FILES.raven1B5En, 'int8', 4),
  cudaFp32Preset('GPU-4G-0.4B-World', MODEL_FILES.world0B4, 41),
  cudaFp32Preset('GPU-4G-1B5-World', MODEL_FILES.world1B5, 8),
  cudaPreset('GPU-4G-1B5-EN', MODEL_FILES.raven1B5En, 'int8', 41),
  cudaPreset('GPU-4G-3B-World', MODEL_FILES.world3B, 'int8', 24),
  cudaPreset('GPU-4G-3B-EN', MODEL_FILES.raven3BEn, 'int8', 24),
  cudaPreset('GPU-4G-3B-CN', MODEL_FILES.world3BCn, 'int8', 24),
  cudaPreset('GPU-4G-7B-World', MODEL_FILES.world7B, 'int8', 8),
  cudaPreset('GPU-4G-7B-EN', MODEL_FILES.raven7BEn, 'int8', 8),
  cudaPreset('GPU-4G-7B-CN', MODEL_FILES.raven7BCn, 'int8', 8),
  cudaPreset('GPU-6G-1B5-EN', MODEL_FILES.raven1B5En, 'fp16', 41),
  cudaPreset('GPU-6G-3B-World', MODEL_FILES.world3B, 'int8', 41),
  cudaPreset('GPU-6G-3B-EN', MODEL_FILES.raven3BEn, 'int8', 41),
  cudaPreset('GPU-6G-3B-CN', MODEL_FILES.world3BCn, 'int8', 41),
  cudaPreset('GPU-6G-7B-World', MODEL_FILES.world7B, 'int8', 18),
  cudaPreset('GPU-6G-7B-EN', MODEL_FILES.raven7BEn, 'int8', 18),
  cudaPreset('GPU-6G-7B-CN', MODEL_FILES.raven7BCn, 'int8', 18),
  cudaFp32Preset('GPU-8G-1B5-World', MODEL_FILES.world1B5, 41),
  cudaPreset('GPU-8G-3B-World', MODEL_FILES.world3B, 'fp16', 41),
  cudaPreset('GPU-8G-3B-EN', MODEL_FILES.raven3BEn, 'fp16', 41),
  cudaPreset('GPU-8G-3B-CN', MODEL_FILES.world3BCn, 'fp16', 41),
  cudaPreset('GPU-8G-7B-World', MODEL_FILES.world7B, 'int8', 27),
  cudaPreset('GPU-8G-7B-EN', MODEL_FILES.raven7BEn, 'int8', 27),
  cudaPreset('GPU-8G-7B-CN', MODEL_FILES.raven7BCn, 'int8', 27),
  cudaPreset('GPU-10G-7B-World', MODEL_FILES.world7B, 'int8', 41),
  cudaPreset('GPU-10G-7B-EN', MODEL_FILES.raven7BEn, 'int8', 41),
  cudaPreset('GPU-10G-7B-CN', MODEL_FILES.raven7BCn, 'int8', 41),
  cudaPreset('GPU-12G-14B-EN', MODEL_FILES.raven14BEn, 'int8', 24),
  cudaPreset('GPU-16G-7B-World', MODEL_FILES.world7B, 'fp16', 41),
  cudaPreset('GPU-16G-7B-EN', MODEL_FILES.raven7BEn, 'fp16', 41),
  cudaPreset('GPU-16G-7B-CN', MODEL_FILES.raven7BCn, 'fp16', 41),
  cudaPreset('GPU-16G-14B-EN', MODEL_FILES.raven14BEn, 'int8', 37),
  cudaPreset('GPU-18G-14B-EN', MODEL_FILES.raven14BEn, 'int8', 41),
  cudaPreset('GPU-32G-14B-EN', MODEL_FILES.raven14BEn, 'fp16', 41),
  ...cpuPresets()
];