update models and configs

This commit is contained in:
josc146
2023-06-13 22:46:41 +08:00
parent 5896593951
commit 631704d04d
2 changed files with 469 additions and 6 deletions

View File

@@ -1,6 +1,63 @@
import { ModelConfig } from './Configs';
export const defaultModelConfigsMac: ModelConfig[] = [
{
name: 'MAC-0.1B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth',
device: 'MPS',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
customStrategy: 'mps fp32'
}
},
{
name: 'MAC-0.4B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth',
device: 'MPS',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
customStrategy: 'mps fp32'
}
},
{
name: 'MAC-1B5-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth',
device: 'MPS',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
customStrategy: 'mps fp32'
}
},
{
name: 'MAC-1B5-EN',
apiParameters: {
@@ -17,7 +74,25 @@ export const defaultModelConfigsMac: ModelConfig[] = [
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
useCustomCuda: false,
customStrategy: 'mps fp32'
}
},
{
name: 'MAC-3B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth',
device: 'MPS',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
customStrategy: 'mps fp32'
}
},
@@ -37,7 +112,6 @@ export const defaultModelConfigsMac: ModelConfig[] = [
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
useCustomCuda: false,
customStrategy: 'mps fp32'
}
},
@@ -57,10 +131,46 @@ export const defaultModelConfigsMac: ModelConfig[] = [
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
useCustomCuda: false,
customStrategy: 'mps fp32'
}
},
{
name: 'MAC-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'MPS',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41,
customStrategy: 'mps fp32'
}
},
{
name: 'CPU-6G-1B5-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth',
device: 'CPU',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'CPU-6G-1B5-EN',
apiParameters: {
@@ -79,6 +189,24 @@ export const defaultModelConfigsMac: ModelConfig[] = [
maxStoredLayers: 41
}
},
{
name: 'CPU-12G-3B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth',
device: 'CPU',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'CPU-12G-3B-EN',
apiParameters: {
@@ -115,6 +243,24 @@ export const defaultModelConfigsMac: ModelConfig[] = [
maxStoredLayers: 41
}
},
{
name: 'CPU-28G-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'CPU',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'CPU-28G-7B-EN',
apiParameters: {
@@ -154,6 +300,24 @@ export const defaultModelConfigsMac: ModelConfig[] = [
];
export const defaultModelConfigs: ModelConfig[] = [
{
name: 'GPU-2G-0.1B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-0.1B-v1-20230520-ctx4096.pth',
device: 'CUDA',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'GPU-2G-1B5-EN',
apiParameters: {
@@ -173,6 +337,42 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-4G-0.4B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-0.4B-v1-20230529-ctx4096.pth',
device: 'CUDA',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'GPU-4G-1B5-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth',
device: 'CUDA',
precision: 'fp32',
storedLayers: 8,
maxStoredLayers: 41
}
},
{
name: 'GPU-4G-1B5-EN',
apiParameters: {
@@ -192,6 +392,25 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-4G-3B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth',
device: 'CUDA',
precision: 'int8',
storedLayers: 24,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-4G-3B-EN',
apiParameters: {
@@ -230,6 +449,25 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-4G-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'CUDA',
precision: 'int8',
storedLayers: 8,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-4G-7B-EN',
apiParameters: {
@@ -287,6 +525,25 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-6G-3B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth',
device: 'CUDA',
precision: 'int8',
storedLayers: 41,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-6G-3B-EN',
apiParameters: {
@@ -325,6 +582,25 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-6G-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'CUDA',
precision: 'int8',
storedLayers: 18,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-6G-7B-EN',
apiParameters: {
@@ -363,6 +639,43 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-8G-1B5-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth',
device: 'CUDA',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'GPU-8G-3B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth',
device: 'CUDA',
precision: 'fp16',
storedLayers: 41,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-8G-3B-EN',
apiParameters: {
@@ -401,6 +714,25 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-8G-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'CUDA',
precision: 'int8',
storedLayers: 27,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-8G-7B-EN',
apiParameters: {
@@ -439,6 +771,25 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-10G-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'CUDA',
precision: 'int8',
storedLayers: 41,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-10G-7B-EN',
apiParameters: {
@@ -496,6 +847,25 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'GPU-16G-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'CUDA',
precision: 'fp16',
storedLayers: 41,
maxStoredLayers: 41,
useCustomCuda: true
}
},
{
name: 'GPU-16G-7B-EN',
apiParameters: {
@@ -591,6 +961,24 @@ export const defaultModelConfigs: ModelConfig[] = [
useCustomCuda: true
}
},
{
name: 'CPU-6G-1B5-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-1.5B-v1-fixed-20230612-ctx4096.pth',
device: 'CPU',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'CPU-6G-1B5-EN',
apiParameters: {
@@ -609,6 +997,24 @@ export const defaultModelConfigs: ModelConfig[] = [
maxStoredLayers: 41
}
},
{
name: 'CPU-12G-3B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-3B-v1-OnlyForTest_80%_trained-20230612-ctx4096.pth',
device: 'CPU',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'CPU-12G-3B-EN',
apiParameters: {
@@ -645,6 +1051,24 @@ export const defaultModelConfigs: ModelConfig[] = [
maxStoredLayers: 41
}
},
{
name: 'CPU-28G-7B-World',
apiParameters: {
apiPort: 8000,
maxResponseToken: 4100,
temperature: 1.2,
topP: 0.5,
presencePenalty: 0.4,
frequencyPenalty: 0.4
},
modelParameters: {
modelName: 'RWKV-4-World-7B-v1-OnlyForTest_64%_trained-20230610-ctx4096.pth',
device: 'CPU',
precision: 'fp32',
storedLayers: 41,
maxStoredLayers: 41
}
},
{
name: 'CPU-28G-7B-EN',
apiParameters: {