RWKV-Runner/backend-python/main.py

69 lines
1.3 KiB
Python
Raw Normal View History

2023-05-06 12:17:39 +00:00
import os
2023-05-17 03:39:00 +00:00
import sys
2023-05-06 12:17:39 +00:00
2023-05-20 15:34:33 +00:00
sys.path.append(os.path.dirname(os.path.realpath(__file__)))
import psutil
2023-05-07 09:27:54 +00:00
from fastapi import FastAPI
2023-05-06 12:17:39 +00:00
from fastapi.middleware.cors import CORSMiddleware
import uvicorn
2023-05-07 09:27:54 +00:00
from utils.rwkv import *
from utils.torch import *
from utils.ngrok import *
from routes import completion, config
import global_var
2023-05-06 12:17:39 +00:00
# Application object; uvicorn loads it via the "main:app" import string.
app = FastAPI()

# CORS is configured fully open: every origin, method and header is
# accepted, and credentials are allowed.
_CORS_OPTIONS = {
    "allow_origins": ["*"],
    "allow_credentials": True,
    "allow_methods": ["*"],
    "allow_headers": ["*"],
}
app.add_middleware(CORSMiddleware, **_CORS_OPTIONS)

# Mount the route modules' routers, completion first, then config.
for _router in (completion.router, config.router):
    app.include_router(_router)
2023-05-06 12:17:39 +00:00
2023-05-17 03:39:00 +00:00
@app.on_event("startup")
def init():
    """Startup hook registered on ``app``.

    Calls ``global_var.init()`` and ``set_torch()``, then calls
    ``ngrok_connect()`` only when the ``ngrok_token`` environment variable
    is present.
    """
    global_var.init()
    set_torch()

    # Without a token in the environment there is nothing more to do.
    if "ngrok_token" not in os.environ:
        return
    ngrok_connect()
@app.get("/")
def read_root():
    """Handle ``GET /``: return a fixed greeting plus this process's PID."""
    payload = {"Hello": "World!"}
    payload["pid"] = os.getpid()
    return payload
2023-05-06 12:17:39 +00:00
2023-05-07 09:27:54 +00:00
@app.post("/exit")
def exit():
    """Handle ``POST /exit``: kill every descendant process, then this one.

    Descendants are enumerated recursively and killed first; the current
    process is killed last.

    NOTE: the function name shadows the built-in ``exit`` inside this
    module; it is kept so the handler's name stays unchanged.
    """
    current = psutil.Process(os.getpid())
    for child in current.children(recursive=True):
        try:
            child.kill()
        except psutil.NoSuchProcess:
            # The child already exited between enumeration and kill().
            # Skip it so the remaining children and this process are
            # still terminated instead of the request aborting here.
            continue
    current.kill()
2023-05-06 12:17:39 +00:00
2023-05-21 15:25:58 +00:00
def debug():
    """Manual check: build an RWKV model and print the decoding of an empty token list.

    The model path, strategy and tokenizer path are hard-coded.
    """
    model_path = "../models/RWKV-4-Raven-7B-v11-Eng49%-Chn49%-Jpn1%-Other1%-20230430-ctx8192.pth"
    rwkv = RWKV(
        model=model_path,
        strategy="cuda fp16",
        tokens_path="20B_tokenizer.json",
    )
    print(rwkv.tokenizer.decode([]))
2023-05-06 12:17:39 +00:00
if __name__ == "__main__":
    # With no command-line arguments the server listens on port 8000;
    # otherwise the first argument is parsed as the port number.
    if len(sys.argv) == 1:
        port = 8000
    else:
        port = int(sys.argv[1])
    uvicorn.run("main:app", port=port)
    # debug()