first commit
This commit is contained in:
2
chatgpt-web-backend/.gitignore
vendored
Normal file
2
chatgpt-web-backend/.gitignore
vendored
Normal file
@@ -0,0 +1,2 @@
|
||||
dist/
|
||||
__pycache__/
|
||||
11
chatgpt-web-backend/Dockerfile
Normal file
11
chatgpt-web-backend/Dockerfile
Normal file
@@ -0,0 +1,11 @@
|
||||
FROM chenzhaoyu94/chatgpt-web:v2.10.9 as frontend
|
||||
|
||||
FROM arvintian/chatgpt-web-base:v1
|
||||
|
||||
COPY --from=frontend /app/public /app/public
|
||||
|
||||
ADD dist/server /app/server
|
||||
|
||||
EXPOSE 7080
|
||||
|
||||
CMD ["/app/server"]
|
||||
8
chatgpt-web-backend/Dockerfile.base
Normal file
8
chatgpt-web-backend/Dockerfile.base
Normal file
@@ -0,0 +1,8 @@
|
||||
FROM python:3.10-alpine
|
||||
|
||||
WORKDIR app
|
||||
|
||||
ADD tokenizer.py /app/tokenizer.py
|
||||
ADD requirements.txt /app/requirements.txt
|
||||
RUN pip install -i https://mirrors.aliyun.com/pypi/simple --upgrade pip
|
||||
RUN pip install --root-user-action=ignore -i https://mirrors.aliyun.com/pypi/simple -r requirements.txt
|
||||
31
chatgpt-web-backend/Makefile
Normal file
31
chatgpt-web-backend/Makefile
Normal file
@@ -0,0 +1,31 @@
|
||||
REGISTRY = arvintian
|
||||
PROJECT = chatgpt-web
|
||||
BASE_VERSION = v1
|
||||
GIT_VERSION = $(shell git rev-parse --short HEAD)
|
||||
|
||||
.PHONY: build-local
|
||||
build-local:
|
||||
go build -v --ldflags="-w -X main.Version=$(GIT_VERSION)" -o dist/server cmd/*.go
|
||||
|
||||
.PHONY: build
|
||||
build:
|
||||
mkdir -p dist && docker run --rm -ti -e GOPROXY=https://goproxy.cn,direct -v $(GOPATH):/go -v `pwd`:/app -w /app golang:1.19-alpine \
|
||||
go build -v --ldflags="-w -X main.Version=$(GIT_VERSION)" -o dist/server cmd/*.go
|
||||
|
||||
package: build
|
||||
docker build -t $(REGISTRY)/$(PROJECT):$(GIT_VERSION) .
|
||||
|
||||
release: package
|
||||
docker tag $(REGISTRY)/$(PROJECT):$(GIT_VERSION) $(REGISTRY)/$(PROJECT):latest
|
||||
docker push $(REGISTRY)/$(PROJECT):$(GIT_VERSION)
|
||||
docker push $(REGISTRY)/$(PROJECT):latest
|
||||
|
||||
base:
|
||||
docker build -t $(REGISTRY)/$(PROJECT)-base:$(BASE_VERSION) -f Dockerfile.base .
|
||||
|
||||
release-base:
|
||||
docker push $(REGISTRY)/$(PROJECT)-base:$(BASE_VERSION)
|
||||
|
||||
clean:
|
||||
rm -rf dist
|
||||
docker images | grep -E "$(REGISTRY)/$(PROJECT)" | grep -v "base" | awk '{print $$3}' | uniq | xargs -I {} docker rmi --force {}
|
||||
38
chatgpt-web-backend/README.md
Normal file
38
chatgpt-web-backend/README.md
Normal file
@@ -0,0 +1,38 @@
|
||||
# ChatGPT-Web
|
||||
|
||||
[English](https://github.com/Arvintian/chatgpt-web/blob/main/README_en.md)
|
||||
|
||||
使用[Gin](https://github.com/gin-gonic/gin)搭建ChatGPT服务,使用[ChatGPT Web](https://github.com/Chanzhaoyu/chatgpt-web)作为前端
|
||||
|
||||
## Usage
|
||||
|
||||
[Docker Hub](https://hub.docker.com/repository/docker/arvintian/chatgpt-web/general)
|
||||
|
||||
```
|
||||
docker run --restart unless-stopped -d --log-opt max-size=50m -p 7080:7080 \
|
||||
-e OPENAI_KEY=openai-key \
|
||||
-e BASIC_AUTH_USER=user1,user2 \
|
||||
-e BASIC_AUTH_PASSWORD=passwd1,passwd2 \
|
||||
arvintian/chatgpt-web
|
||||
```
|
||||
|
||||
- SERVER_PORT 服务端口,默认7080
|
||||
- SERVER_HOST 服务监听地址,默认0.0.0.0
|
||||
- SOCKS_PROXY socks代理URL,例如socks5://user:password@127.0.0.1:1080
|
||||
- BASIC_AUTH_USER 认证用户,多用户英文逗号分隔
|
||||
- BASIC_AUTH_PASSWORD 认证用户密码,多用户英文逗号分隔
|
||||
- CHAT_SESSION_TTL 会话上下文保持时间,默认30分钟
|
||||
- CHAT_MIN_RESPONSE_TOKENS 预留给会话响应的token数,可能导致截断最久的上下文,默认600
|
||||
- OPENAI_KEY openai api key,参考OpenAI文档
|
||||
- OPENAI_BASE_URL openai api base url,默认https://api.openai.com/v1
|
||||
- OPENAI_MODEL 调用模型,默认gpt-3.5-turbo-0301
|
||||
- OPENAI_MAX_TOKENS 模型max_tokens参数,参考OpenAI文档
|
||||
- OPENAI_TEMPERATURE 模型temperature参数,参考OpenAI文档
|
||||
- OPENAI_PRESENCE_PENALTY 模型presence_penalty参数,参考OpenAI文档
|
||||
- OPENAI_FREQUENCY_PENALTY 模型frequency_penalty参数,参考OpenAI文档
|
||||
|
||||
更详细参数参考: [启动函数](https://github.com/Arvintian/chatgpt-web/blob/main/cmd/main.go#L21)
|
||||
|
||||
Tips:
|
||||
- 模型float32参数使用(整型/100)设置,例如: temperature设置0.8,需要设置为80
|
||||
- 内置支持了对OPENAI_BASE_URL的正向代理,可以作为OpenAI接口的代理服务器
|
||||
34
chatgpt-web-backend/README_en.md
Normal file
34
chatgpt-web-backend/README_en.md
Normal file
@@ -0,0 +1,34 @@
|
||||
Built ChatGPT service using [Gin](https://github.com/gin-gonic/gin) and [ChatGPT Web](https://github.com/Chanzhaoyu/chatgpt-web) as the front-end.
|
||||
|
||||
## Usage
|
||||
|
||||
[Docker Hub](https://hub.docker.com/repository/docker/arvintian/chatgpt-web/general)
|
||||
|
||||
```
|
||||
docker run --restart unless-stopped -d --log-opt max-size=50m -p 7080:7080 \
|
||||
-e OPENAI_KEY=openai-key \
|
||||
-e BASIC_AUTH_USER=user1,user2 \
|
||||
-e BASIC_AUTH_PASSWORD=passwd1,passwd2 \
|
||||
arvintian/chatgpt-web
|
||||
```
|
||||
|
||||
- SERVER_PORT: Server port, default 7080.
|
||||
- SERVER_HOST: Server listen address, default 0.0.0.0.
|
||||
- SOCKS_PROXY: Socks proxy URL, for example socks5://user:password@127.0.0.1:1080.
|
||||
- BASIC_AUTH_USER: Authentication user, multiple users separated by English commas.
|
||||
- BASIC_AUTH_PASSWORD: Authentication user passwords, multiple users separated by English commas.
|
||||
- CHAT_SESSION_TTL: Session context retention time, default 30 minutes.
|
||||
- CHAT_MIN_RESPONSE_TOKENS: Tokens reserved for session response, may lead to truncation of the longest context, default 600.
|
||||
- OPENAI_KEY: OpenAI API key, refer to OpenAI documentation.
|
||||
- OPENAI_BASE_URL: OpenAI API base URL, default https://api.openai.com/v1.
|
||||
- OPENAI_MODEL: Model called, default gpt-3.5-turbo-0301.
|
||||
- OPENAI_MAX_TOKENS: Model max_tokens parameter, refer to OpenAI documentation.
|
||||
- OPENAI_TEMPERATURE: Model temperature parameter, refer to OpenAI documentation.
|
||||
- OPENAI_PRESENCE_PENALTY: Model presence_penalty parameter, refer to OpenAI documentation.
|
||||
- OPENAI_FREQUENCY_PENALTY: Model frequency_penalty parameter, refer to OpenAI documentation.
|
||||
|
||||
For more detailed parameters, please refer to the [start function](https://github.com/Arvintian/chatgpt-web/blob/main/cmd/main.go#L21).
|
||||
|
||||
Tips:
|
||||
- Use (integer/100) to set the float32 model parameters. For example, if temperature is set to 0.8, it needs to be set to 80.
|
||||
- The built-in support for a forward proxy of OPENAI_BASE_URL enables it to function as a proxy server for the OpenAI API.
|
||||
196
chatgpt-web-backend/cmd/main.go
Normal file
196
chatgpt-web-backend/cmd/main.go
Normal file
@@ -0,0 +1,196 @@
|
||||
package main
|
||||
|
||||
import (
|
||||
"context"
|
||||
"fmt"
|
||||
"log"
|
||||
"net/http"
|
||||
"net/http/httputil"
|
||||
"net/url"
|
||||
"os"
|
||||
"os/exec"
|
||||
"strings"
|
||||
"time"
|
||||
|
||||
"github.com/Arvintian/chatgpt-web/pkg/controllers"
|
||||
"github.com/Arvintian/chatgpt-web/pkg/middlewares"
|
||||
"github.com/Arvintian/chatgpt-web/pkg/utils"
|
||||
"github.com/Arvintian/go-utils/cmdutil"
|
||||
"github.com/gin-gonic/gin"
|
||||
"github.com/spf13/cobra"
|
||||
"k8s.io/klog/v2"
|
||||
)
|
||||
|
||||
type ChatGPTWebServer struct {
|
||||
Host string `name:"host" env:"SERVER_HOST" usage:"http bind host" default:"0.0.0.0"`
|
||||
Port int `name:"port" env:"SERVER_PORT" usage:"http bind port" default:"7080"`
|
||||
BasicAuthUser string `name:"auth-user" env:"BASIC_AUTH_USER" usage:"http basic auth user"`
|
||||
BasicAuthPassword string `name:"auth-password" env:"BASIC_AUTH_PASSWORD" usage:"http basic auth password"`
|
||||
FrontendPath string `name:"frontend-path" env:"FRONTEND_PATH" default:"/app/public" usage:"frontend path"`
|
||||
SocksProxy string `name:"socks-proxy" env:"SOCKS_PROXY" usage:"socks proxy url"`
|
||||
ChatSessionTTL int `name:"chat-session-ttl" env:"CHAT_SESSION_TTL" default:"30" usage:"chat session ttl minute"`
|
||||
ChatMinResponseTokens int `name:"chat-min-response-tokens" env:"CHAT_MIN_RESPONSE_TOKENS" default:"600" usage:"chat min response tokens"`
|
||||
OpenAIKey string `name:"openapi-key" env:"OPENAI_KEY" usage:"openai key"`
|
||||
OpenAIBaseURL string `name:"openapi-base-url" env:"OPENAI_BASE_URL" default:"https://api.openai.com/v1" usage:"openai base url"`
|
||||
OpenAIModel string `name:"openai-model" env:"OPENAI_MODEL" default:"gpt-3.5-turbo-0301" usage:"openai params model"`
|
||||
OpenAIMaxTokens int `name:"openai-max-tokens" env:"OPENAI_MAX_TOKENS" default:"4096" usage:"openai params max-tokens"`
|
||||
OpenAITemperature int `name:"openai-temperature" env:"OPENAI_TEMPERATURE" default:"80" usage:"openai params temperature"`
|
||||
OpenAIPresencePenalty int `name:"openai-presence-penalty" env:"OPENAI_PRESENCE_PENALTY" default:"100" usage:"openai params presence-penalty"`
|
||||
OpenAIFrequencyPenalty int `name:"openai-frequency-penalty" env:"OPENAI_FREQUENCY_PENALTY" default:"0" usage:"openai params frequency-penalty"`
|
||||
Version bool `name:"version" usage:"show version"`
|
||||
}
|
||||
|
||||
var Version = "0.0.0-dev"
|
||||
|
||||
func (r *ChatGPTWebServer) Run(cmd *cobra.Command, args []string) error {
|
||||
if r.Version {
|
||||
return r.ShowVersion()
|
||||
}
|
||||
gin.SetMode(gin.ReleaseMode)
|
||||
if err := r.updateAssetsFiles(); err != nil {
|
||||
return err
|
||||
}
|
||||
go r.startTokenizer(cmd.Context())
|
||||
go r.httpServer(cmd.Context())
|
||||
|
||||
<-cmd.Context().Done()
|
||||
return nil
|
||||
}
|
||||
|
||||
func (r *ChatGPTWebServer) httpServer(ctx context.Context) {
|
||||
chatService, err := controllers.NewChatService(r.OpenAIKey, r.OpenAIBaseURL, r.SocksProxy, controllers.ChatCompletionParams{
|
||||
Model: r.OpenAIModel,
|
||||
MaxTokens: r.OpenAIMaxTokens,
|
||||
Temperature: float32(r.OpenAITemperature) / 100.0,
|
||||
PresencePenalty: float32(r.OpenAIPresencePenalty) / 100.0,
|
||||
FrequencyPenalty: float32(r.OpenAIFrequencyPenalty) / 100.0,
|
||||
ChatSessionTTL: time.Duration(r.ChatSessionTTL) * time.Minute,
|
||||
ChatMinResponseTokens: r.ChatMinResponseTokens,
|
||||
})
|
||||
if err != nil {
|
||||
klog.Fatal(err)
|
||||
}
|
||||
|
||||
addr := fmt.Sprintf("%s:%d", r.Host, r.Port)
|
||||
klog.Infof("ChatGPT Web Server on: %s", addr)
|
||||
server := &http.Server{
|
||||
Addr: addr,
|
||||
}
|
||||
entry, proxy := gin.New(), gin.New()
|
||||
entry.Use(gin.Logger())
|
||||
entry.Use(gin.Recovery())
|
||||
chat := entry.Group("/api")
|
||||
if len(r.BasicAuthUser) > 0 {
|
||||
accounts := gin.Accounts{}
|
||||
users := strings.Split(r.BasicAuthUser, ",")
|
||||
passwords := strings.Split(r.BasicAuthPassword, ",")
|
||||
if len(users) != len(passwords) {
|
||||
panic("basic auth setting error")
|
||||
}
|
||||
for i := 0; i < len(users); i++ {
|
||||
accounts[users[i]] = passwords[i]
|
||||
}
|
||||
chat.POST("/chat-process", gin.BasicAuth(accounts), middlewares.RateLimitMiddleware(1, 2), chatService.ChatProcess)
|
||||
} else {
|
||||
chat.POST("/chat-process", middlewares.RateLimitMiddleware(1, 2), chatService.ChatProcess)
|
||||
}
|
||||
chat.POST("/config", func(ctx *gin.Context) {
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Success",
|
||||
"data": map[string]string{
|
||||
"apiModel": "ChatGPTAPI",
|
||||
"socksProxy": r.SocksProxy,
|
||||
},
|
||||
})
|
||||
})
|
||||
chat.POST("/session", func(ctx *gin.Context) {
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Success",
|
||||
"message": "",
|
||||
"data": gin.H{
|
||||
"auth": false,
|
||||
},
|
||||
})
|
||||
})
|
||||
upstreamURL, err := url.Parse(strings.TrimSuffix(r.OpenAIBaseURL, "/v1"))
|
||||
if err != nil {
|
||||
klog.Fatal(err)
|
||||
}
|
||||
upstream := httputil.NewSingleHostReverseProxy(upstreamURL)
|
||||
if r.SocksProxy != "" {
|
||||
proxyUrl, err := url.Parse(r.SocksProxy)
|
||||
if err != nil {
|
||||
klog.Fatal(err)
|
||||
}
|
||||
upstream.Transport = &http.Transport{
|
||||
Proxy: http.ProxyURL(proxyUrl),
|
||||
}
|
||||
}
|
||||
apis := proxy.Group("/v1")
|
||||
apis.Any("/*relativePath", func(ctx *gin.Context) {
|
||||
ctx.Request.Host = upstreamURL.Host
|
||||
upstream.ServeHTTP(ctx.Writer, ctx.Request)
|
||||
})
|
||||
proxy.NoRoute(func(ctx *gin.Context) {
|
||||
http.FileServer(http.Dir(r.FrontendPath)).ServeHTTP(ctx.Writer, ctx.Request)
|
||||
})
|
||||
entry.NoRoute(func(ctx *gin.Context) {
|
||||
proxy.ServeHTTP(ctx.Writer, ctx.Request)
|
||||
})
|
||||
|
||||
server.Handler = entry
|
||||
go func(ctx context.Context) {
|
||||
<-ctx.Done()
|
||||
ctx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
|
||||
defer cancel()
|
||||
if err := server.Shutdown(ctx); err != nil {
|
||||
log.Printf("Server shutdown with error %v", err)
|
||||
}
|
||||
}(ctx)
|
||||
if err := server.ListenAndServe(); err != http.ErrServerClosed {
|
||||
log.Fatalf("Server listen and serve error %v", err)
|
||||
}
|
||||
}
|
||||
|
||||
func (r *ChatGPTWebServer) startTokenizer(ctx context.Context) {
|
||||
// devnull, err := os.OpenFile(os.DevNull, os.O_WRONLY, 0755)
|
||||
// if err != nil {
|
||||
// klog.Error(err)
|
||||
// os.Exit(1)
|
||||
// }
|
||||
args := strings.Split("nuxt --module tokenizer.py --workers 2", " ")
|
||||
klog.Infof("Start Tokenizer with %v", args)
|
||||
cmd := exec.CommandContext(ctx, args[0], args[1:]...)
|
||||
cmd.Stderr = os.Stderr
|
||||
cmd.Stdout = os.Stdout
|
||||
if err := cmd.Run(); err != nil {
|
||||
klog.Error(err)
|
||||
os.Exit(1)
|
||||
}
|
||||
}
|
||||
|
||||
func (r *ChatGPTWebServer) updateAssetsFiles() error {
|
||||
pairs := map[string]string{}
|
||||
old := `{avatar:"https://raw.githubusercontent.com/Chanzhaoyu/chatgpt-web/main/src/assets/avatar.jpg",name:"ChenZhaoYu",description:'Star on <a href="https://github.com/Chanzhaoyu/chatgpt-bot" class="text-blue-500" target="_blank" >Github</a>'}`
|
||||
new := `{avatar:"https://raw.githubusercontent.com/Chanzhaoyu/chatgpt-web/main/src/assets/avatar.jpg",name:"ChatGPT",description:'Star on <a href="https://github.com/Arvintian/chatgpt-web" class="text-blue-500" target="_blank" >Github</a>'}`
|
||||
pairs[old] = new
|
||||
old = `{}.VITE_GLOB_OPEN_LONG_REPLY`
|
||||
new = `{VITE_GLOB_OPEN_LONG_REPLY:"true"}.VITE_GLOB_OPEN_LONG_REPLY`
|
||||
pairs[old] = new
|
||||
old = `<link rel="manifest" href="/manifest.webmanifest"><script id="vite-plugin-pwa:register-sw" src="/registerSW.js"></script>`
|
||||
new = ``
|
||||
pairs[old] = new
|
||||
return utils.ReplaceFiles(r.FrontendPath, pairs)
|
||||
}
|
||||
|
||||
func (r *ChatGPTWebServer) ShowVersion() error {
|
||||
fmt.Println(Version)
|
||||
return nil
|
||||
}
|
||||
|
||||
func main() {
|
||||
root := cmdutil.Command(&ChatGPTWebServer{}, cobra.Command{
|
||||
Long: "ChatGPT Web Server",
|
||||
})
|
||||
cmdutil.Main(root)
|
||||
}
|
||||
43
chatgpt-web-backend/go.mod
Normal file
43
chatgpt-web-backend/go.mod
Normal file
@@ -0,0 +1,43 @@
|
||||
module github.com/Arvintian/chatgpt-web
|
||||
|
||||
go 1.19
|
||||
|
||||
require (
|
||||
github.com/Arvintian/go-utils v0.0.0-20221012040808-2e61c0c3eece
|
||||
github.com/gin-gonic/gin v1.9.0
|
||||
github.com/google/uuid v1.3.0
|
||||
github.com/karlseguin/ccache/v3 v3.0.3
|
||||
github.com/sashabaranov/go-openai v1.4.2
|
||||
github.com/spf13/cobra v1.6.0
|
||||
golang.org/x/time v0.3.0
|
||||
k8s.io/klog/v2 v2.60.1
|
||||
)
|
||||
|
||||
require (
|
||||
github.com/bytedance/sonic v1.8.0 // indirect
|
||||
github.com/chenzhuoyu/base64x v0.0.0-20221115062448-fe3a3abad311 // indirect
|
||||
github.com/gin-contrib/sse v0.1.0 // indirect
|
||||
github.com/go-logr/logr v1.2.3 // indirect
|
||||
github.com/go-playground/locales v0.14.1 // indirect
|
||||
github.com/go-playground/universal-translator v0.18.1 // indirect
|
||||
github.com/go-playground/validator/v10 v10.11.2 // indirect
|
||||
github.com/goccy/go-json v0.10.0 // indirect
|
||||
github.com/inconshreveable/mousetrap v1.0.1 // indirect
|
||||
github.com/json-iterator/go v1.1.12 // indirect
|
||||
github.com/klauspost/cpuid/v2 v2.0.9 // indirect
|
||||
github.com/leodido/go-urn v1.2.1 // indirect
|
||||
github.com/mattn/go-isatty v0.0.17 // indirect
|
||||
github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd // indirect
|
||||
github.com/modern-go/reflect2 v1.0.2 // indirect
|
||||
github.com/pelletier/go-toml/v2 v2.0.6 // indirect
|
||||
github.com/spf13/pflag v1.0.5 // indirect
|
||||
github.com/twitchyliquid64/golang-asm v0.15.1 // indirect
|
||||
github.com/ugorji/go/codec v1.2.9 // indirect
|
||||
golang.org/x/arch v0.0.0-20210923205945-b76863e36670 // indirect
|
||||
golang.org/x/crypto v0.5.0 // indirect
|
||||
golang.org/x/net v0.7.0 // indirect
|
||||
golang.org/x/sys v0.5.0 // indirect
|
||||
golang.org/x/text v0.7.0 // indirect
|
||||
google.golang.org/protobuf v1.28.1 // indirect
|
||||
gopkg.in/yaml.v3 v3.0.1 // indirect
|
||||
)
|
||||
105
chatgpt-web-backend/go.sum
Normal file
105
chatgpt-web-backend/go.sum
Normal file
@@ -0,0 +1,105 @@
|
||||
github.com/Arvintian/go-utils v0.0.0-20221012040808-2e61c0c3eece h1:2pV+ZmYaakmpP0DASolUiKVCykieF5AWzz2mMjhiaEY=
|
||||
github.com/Arvintian/go-utils v0.0.0-20221012040808-2e61c0c3eece/go.mod h1:EM4VUepvcCPF4HFKf2Baq9nlNReRTJI4jKw2+rCvsx4=
|
||||
github.com/bytedance/sonic v1.5.0/go.mod h1:ED5hyg4y6t3/9Ku1R6dU/4KyJ48DZ4jPhfY1O2AihPM=
|
||||
github.com/bytedance/sonic v1.8.0 h1:ea0Xadu+sHlu7x5O3gKhRpQ1IKiMrSiHttPF0ybECuA=
|
||||
github.com/bytedance/sonic v1.8.0/go.mod h1:i736AoUSYt75HyZLoJW9ERYxcy6eaN6h4BZXU064P/U=
|
||||
github.com/chenzhuoyu/base64x v0.0.0-20211019084208-fb5309c8db06/go.mod h1:DH46F32mSOjUmXrMHnKwZdA8wcEefY7UVqBKYGjpdQY=
|
||||
github.com/chenzhuoyu/base64x v0.0.0-20221115062448-fe3a3abad311 h1:qSGYFH7+jGhDF8vLC+iwCD4WpbV1EBDSzWkJODFLams=
|
||||
github.com/chenzhuoyu/base64x v0.0.0-20221115062448-fe3a3abad311/go.mod h1:b583jCggY9gE99b6G5LEC39OIiVsWj+R97kbl5odCEk=
|
||||
github.com/cpuguy83/go-md2man/v2 v2.0.2/go.mod h1:tgQtvFlXSQOSOSIRvRPT7W67SCa46tRHOmNcaadrF8o=
|
||||
github.com/davecgh/go-spew v1.1.0/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
|
||||
github.com/davecgh/go-spew v1.1.1 h1:vj9j/u1bqnvCEfJOwUhtlOARqs3+rkHYY13jYWTU97c=
|
||||
github.com/davecgh/go-spew v1.1.1/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
|
||||
github.com/gin-contrib/sse v0.1.0 h1:Y/yl/+YNO8GZSjAhjMsSuLt29uWRFHdHYUb5lYOV9qE=
|
||||
github.com/gin-contrib/sse v0.1.0/go.mod h1:RHrZQHXnP2xjPF+u1gW/2HnVO7nvIa9PG3Gm+fLHvGI=
|
||||
github.com/gin-gonic/gin v1.9.0 h1:OjyFBKICoexlu99ctXNR2gg+c5pKrKMuyjgARg9qeY8=
|
||||
github.com/gin-gonic/gin v1.9.0/go.mod h1:W1Me9+hsUSyj3CePGrd1/QrKJMSJ1Tu/0hFEH89961k=
|
||||
github.com/go-logr/logr v1.2.0/go.mod h1:jdQByPbusPIv2/zmleS9BjJVeZ6kBagPoEUsqbVz/1A=
|
||||
github.com/go-logr/logr v1.2.3 h1:2DntVwHkVopvECVRSlL5PSo9eG+cAkDCuckLubN+rq0=
|
||||
github.com/go-logr/logr v1.2.3/go.mod h1:jdQByPbusPIv2/zmleS9BjJVeZ6kBagPoEUsqbVz/1A=
|
||||
github.com/go-playground/assert/v2 v2.2.0 h1:JvknZsQTYeFEAhQwI4qEt9cyV5ONwRHC+lYKSsYSR8s=
|
||||
github.com/go-playground/locales v0.14.1 h1:EWaQ/wswjilfKLTECiXz7Rh+3BjFhfDFKv/oXslEjJA=
|
||||
github.com/go-playground/locales v0.14.1/go.mod h1:hxrqLVvrK65+Rwrd5Fc6F2O76J/NuW9t0sjnWqG1slY=
|
||||
github.com/go-playground/universal-translator v0.18.1 h1:Bcnm0ZwsGyWbCzImXv+pAJnYK9S473LQFuzCbDbfSFY=
|
||||
github.com/go-playground/universal-translator v0.18.1/go.mod h1:xekY+UJKNuX9WP91TpwSH2VMlDf28Uj24BCp08ZFTUY=
|
||||
github.com/go-playground/validator/v10 v10.11.2 h1:q3SHpufmypg+erIExEKUmsgmhDTyhcJ38oeKGACXohU=
|
||||
github.com/go-playground/validator/v10 v10.11.2/go.mod h1:NieE624vt4SCTJtD87arVLvdmjPAeV8BQlHtMnw9D7s=
|
||||
github.com/goccy/go-json v0.10.0 h1:mXKd9Qw4NuzShiRlOXKews24ufknHO7gx30lsDyokKA=
|
||||
github.com/goccy/go-json v0.10.0/go.mod h1:6MelG93GURQebXPDq3khkgXZkazVtN9CRI+MGFi0w8I=
|
||||
github.com/golang/protobuf v1.5.0/go.mod h1:FsONVRAS9T7sI+LIUmWTfcYkHO4aIWwzhcaSAoJOfIk=
|
||||
github.com/google/go-cmp v0.5.5 h1:Khx7svrCpmxxtHBq5j2mp/xVjsi8hQMfNLvJFAlrGgU=
|
||||
github.com/google/go-cmp v0.5.5/go.mod h1:v8dTdLbMG2kIc/vJvl+f65V22dbkXbowE6jgT/gNBxE=
|
||||
github.com/google/gofuzz v1.0.0/go.mod h1:dBl0BpW6vV/+mYPU4Po3pmUjxk6FQPldtuIdl/M65Eg=
|
||||
github.com/google/uuid v1.3.0 h1:t6JiXgmwXMjEs8VusXIJk2BXHsn+wx8BZdTaoZ5fu7I=
|
||||
github.com/google/uuid v1.3.0/go.mod h1:TIyPZe4MgqvfeYDBFedMoGGpEw/LqOeaOT+nhxU+yHo=
|
||||
github.com/inconshreveable/mousetrap v1.0.1 h1:U3uMjPSQEBMNp1lFxmllqCPM6P5u/Xq7Pgzkat/bFNc=
|
||||
github.com/inconshreveable/mousetrap v1.0.1/go.mod h1:vpF70FUmC8bwa3OWnCshd2FqLfsEA9PFc4w1p2J65bw=
|
||||
github.com/json-iterator/go v1.1.12 h1:PV8peI4a0ysnczrg+LtxykD8LfKY9ML6u2jnxaEnrnM=
|
||||
github.com/json-iterator/go v1.1.12/go.mod h1:e30LSqwooZae/UwlEbR2852Gd8hjQvJoHmT4TnhNGBo=
|
||||
github.com/karlseguin/ccache/v3 v3.0.3 h1:cz+3tSdTrovp00xHPP3Y6ca/YuSl5kchhYG83wUPYN0=
|
||||
github.com/karlseguin/ccache/v3 v3.0.3/go.mod h1:qxC372+Qn+IBj8Pe3KvGjHPj0sWwEF7AeZVhsNPZ6uY=
|
||||
github.com/klauspost/cpuid/v2 v2.0.9 h1:lgaqFMSdTdQYdZ04uHyN2d/eKdOMyi2YLSvlQIBFYa4=
|
||||
github.com/klauspost/cpuid/v2 v2.0.9/go.mod h1:FInQzS24/EEf25PyTYn52gqo7WaD8xa0213Md/qVLRg=
|
||||
github.com/kr/pretty v0.3.0 h1:WgNl7dwNpEZ6jJ9k1snq4pZsg7DOEN8hP9Xw0Tsjwk0=
|
||||
github.com/kr/text v0.2.0 h1:5Nx0Ya0ZqY2ygV366QzturHI13Jq95ApcVaJBhpS+AY=
|
||||
github.com/leodido/go-urn v1.2.1 h1:BqpAaACuzVSgi/VLzGZIobT2z4v53pjosyNd9Yv6n/w=
|
||||
github.com/leodido/go-urn v1.2.1/go.mod h1:zt4jvISO2HfUBqxjfIshjdMTYS56ZS/qv49ictyFfxY=
|
||||
github.com/mattn/go-isatty v0.0.17 h1:BTarxUcIeDqL27Mc+vyvdWYSL28zpIhv3RoTdsLMPng=
|
||||
github.com/mattn/go-isatty v0.0.17/go.mod h1:kYGgaQfpe5nmfYZH+SKPsOc2e4SrIfOl2e/yFXSvRLM=
|
||||
github.com/modern-go/concurrent v0.0.0-20180228061459-e0a39a4cb421/go.mod h1:6dJC0mAP4ikYIbvyc7fijjWJddQyLn8Ig3JB5CqoB9Q=
|
||||
github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd h1:TRLaZ9cD/w8PVh93nsPXa1VrQ6jlwL5oN8l14QlcNfg=
|
||||
github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd/go.mod h1:6dJC0mAP4ikYIbvyc7fijjWJddQyLn8Ig3JB5CqoB9Q=
|
||||
github.com/modern-go/reflect2 v1.0.2 h1:xBagoLtFs94CBntxluKeaWgTMpvLxC4ur3nMaC9Gz0M=
|
||||
github.com/modern-go/reflect2 v1.0.2/go.mod h1:yWuevngMOJpCy52FWWMvUC8ws7m/LJsjYzDa0/r8luk=
|
||||
github.com/pelletier/go-toml/v2 v2.0.6 h1:nrzqCb7j9cDFj2coyLNLaZuJTLjWjlaz6nvTvIwycIU=
|
||||
github.com/pelletier/go-toml/v2 v2.0.6/go.mod h1:eumQOmlWiOPt5WriQQqoM5y18pDHwha2N+QD+EUNTek=
|
||||
github.com/pmezard/go-difflib v1.0.0 h1:4DBwDE0NGyQoBHbLQYPwSUPoCMWR5BEzIk/f1lZbAQM=
|
||||
github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4=
|
||||
github.com/rogpeppe/go-internal v1.8.0 h1:FCbCCtXNOY3UtUuHUYaghJg4y7Fd14rXifAYUAtL9R8=
|
||||
github.com/russross/blackfriday/v2 v2.1.0/go.mod h1:+Rmxgy9KzJVeS9/2gXHxylqXiyQDYRxCVz55jmeOWTM=
|
||||
github.com/sashabaranov/go-openai v1.4.2 h1:IhacPY7O+ljlBoZRQe9VpsLNm0b4PHa6fOBGA9O4vfc=
|
||||
github.com/sashabaranov/go-openai v1.4.2/go.mod h1:lj5b/K+zjTSFxVLijLSTDZuP7adOgerWeFyZLUhAKRg=
|
||||
github.com/spf13/cobra v1.6.0 h1:42a0n6jwCot1pUmomAp4T7DeMD+20LFv4Q54pxLf2LI=
|
||||
github.com/spf13/cobra v1.6.0/go.mod h1:IOw/AERYS7UzyrGinqmz6HLUo219MORXGxhbaJUqzrY=
|
||||
github.com/spf13/pflag v1.0.5 h1:iy+VFUOCP1a+8yFto/drg2CJ5u0yRoB7fZw3DKv/JXA=
|
||||
github.com/spf13/pflag v1.0.5/go.mod h1:McXfInJRrz4CZXVZOBLb0bTZqETkiAhM9Iw0y3An2Bg=
|
||||
github.com/stretchr/objx v0.1.0/go.mod h1:HFkY916IF+rwdDfMAkV7OtwuqBVzrE8GR6GFx+wExME=
|
||||
github.com/stretchr/objx v0.4.0/go.mod h1:YvHI0jy2hoMjB+UWwv71VJQ9isScKT/TqJzVSSt89Yw=
|
||||
github.com/stretchr/objx v0.5.0/go.mod h1:Yh+to48EsGEfYuaHDzXPcE3xhTkx73EhmCGUpEOglKo=
|
||||
github.com/stretchr/testify v1.3.0/go.mod h1:M5WIy9Dh21IEIfnGCwXGc5bZfKNJtfHm1UVUgZn+9EI=
|
||||
github.com/stretchr/testify v1.6.1/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg=
|
||||
github.com/stretchr/testify v1.7.0/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg=
|
||||
github.com/stretchr/testify v1.7.1/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg=
|
||||
github.com/stretchr/testify v1.8.0/go.mod h1:yNjHg4UonilssWZ8iaSj1OCr/vHnekPRkoO+kdMU+MU=
|
||||
github.com/stretchr/testify v1.8.1 h1:w7B6lhMri9wdJUVmEZPGGhZzrYTPvgJArz7wNPgYKsk=
|
||||
github.com/stretchr/testify v1.8.1/go.mod h1:w2LPCIKwWwSfY2zedu0+kehJoqGctiVI29o6fzry7u4=
|
||||
github.com/twitchyliquid64/golang-asm v0.15.1 h1:SU5vSMR7hnwNxj24w34ZyCi/FmDZTkS4MhqMhdFk5YI=
|
||||
github.com/twitchyliquid64/golang-asm v0.15.1/go.mod h1:a1lVb/DtPvCB8fslRZhAngC2+aY1QWCk3Cedj/Gdt08=
|
||||
github.com/ugorji/go/codec v1.2.9 h1:rmenucSohSTiyL09Y+l2OCk+FrMxGMzho2+tjr5ticU=
|
||||
github.com/ugorji/go/codec v1.2.9/go.mod h1:UNopzCgEMSXjBc6AOMqYvWC1ktqTAfzJZUZgYf6w6lg=
|
||||
golang.org/x/arch v0.0.0-20210923205945-b76863e36670 h1:18EFjUmQOcUvxNYSkA6jO9VAiXCnxFY6NyDX0bHDmkU=
|
||||
golang.org/x/arch v0.0.0-20210923205945-b76863e36670/go.mod h1:5om86z9Hs0C8fWVUuoMHwpExlXzs5Tkyp9hOrfG7pp8=
|
||||
golang.org/x/crypto v0.5.0 h1:U/0M97KRkSFvyD/3FSmdP5W5swImpNgle/EHFhOsQPE=
|
||||
golang.org/x/crypto v0.5.0/go.mod h1:NK/OQwhpMQP3MwtdjgLlYHnH9ebylxKWv3e0fK+mkQU=
|
||||
golang.org/x/net v0.7.0 h1:rJrUqqhjsgNp7KqAIc25s9pZnjU7TUcSY7HcVZjdn1g=
|
||||
golang.org/x/net v0.7.0/go.mod h1:2Tu9+aMcznHK/AK1HMvgo6xiTLG5rD5rZLDS+rp2Bjs=
|
||||
golang.org/x/sys v0.0.0-20220811171246-fbc7d0a398ab/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
|
||||
golang.org/x/sys v0.5.0 h1:MUK/U/4lj1t1oPg0HfuXDN/Z1wv31ZJ/YcPiGccS4DU=
|
||||
golang.org/x/sys v0.5.0/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
|
||||
golang.org/x/text v0.7.0 h1:4BRB4x83lYWy72KwLD/qYDuTu7q9PjSagHvijDw7cLo=
|
||||
golang.org/x/text v0.7.0/go.mod h1:mrYo+phRRbMaCq/xk9113O4dZlRixOauAjOtrjsXDZ8=
|
||||
golang.org/x/time v0.3.0 h1:rg5rLMjNzMS1RkNLzCG38eapWhnYLFYXDXj2gOlr8j4=
|
||||
golang.org/x/time v0.3.0/go.mod h1:tRJNPiyCQ0inRvYxbN9jk5I+vvW/OXSQhTDSoE431IQ=
|
||||
golang.org/x/xerrors v0.0.0-20191204190536-9bdfabe68543 h1:E7g+9GITq07hpfrRu66IVDexMakfv52eLZ2CXBWiKr4=
|
||||
golang.org/x/xerrors v0.0.0-20191204190536-9bdfabe68543/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
|
||||
google.golang.org/protobuf v1.26.0-rc.1/go.mod h1:jlhhOSvTdKEhbULTjvd4ARK9grFBp09yW+WbY/TyQbw=
|
||||
google.golang.org/protobuf v1.28.1 h1:d0NfwRgPtno5B1Wa6L2DAG+KivqkdutMf1UhdNx175w=
|
||||
google.golang.org/protobuf v1.28.1/go.mod h1:HV8QOd/L58Z+nl8r43ehVNZIU/HEI6OcFqwMG9pJV4I=
|
||||
gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0=
|
||||
gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c h1:Hei/4ADfdWqJk1ZMxUNpqntNwaWcugrBjAiHlqqRiVk=
|
||||
gopkg.in/yaml.v3 v3.0.0-20200313102051-9f266ea9e77c/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM=
|
||||
gopkg.in/yaml.v3 v3.0.1 h1:fxVm/GzAzEWqLHuvctI91KS9hhNmmWOoWu0XTYJS7CA=
|
||||
gopkg.in/yaml.v3 v3.0.1/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM=
|
||||
k8s.io/klog/v2 v2.60.1 h1:VW25q3bZx9uE3vvdL6M8ezOX79vA2Aq1nEWLqNQclHc=
|
||||
k8s.io/klog/v2 v2.60.1/go.mod h1:y1WjHnz7Dj687irZUWR/WLkLc5N1YHtjLdmgWjndZn0=
|
||||
rsc.io/pdf v0.1.1/go.mod h1:n8OzWcQ6Sp37PL01nO98y4iUCRdTGarVfzxY20ICaU4=
|
||||
BIN
chatgpt-web-backend/main
Executable file
BIN
chatgpt-web-backend/main
Executable file
Binary file not shown.
295
chatgpt-web-backend/pkg/controllers/chat.go
Normal file
295
chatgpt-web-backend/pkg/controllers/chat.go
Normal file
@@ -0,0 +1,295 @@
|
||||
package controllers
|
||||
|
||||
import (
|
||||
"encoding/json"
|
||||
"errors"
|
||||
"fmt"
|
||||
"io"
|
||||
"net/http"
|
||||
"net/url"
|
||||
"strings"
|
||||
"time"
|
||||
|
||||
"github.com/Arvintian/chatgpt-web/pkg/tokenizer"
|
||||
"github.com/Arvintian/chatgpt-web/pkg/utils"
|
||||
"github.com/gin-gonic/gin"
|
||||
"github.com/google/uuid"
|
||||
ccache "github.com/karlseguin/ccache/v3"
|
||||
openai "github.com/sashabaranov/go-openai"
|
||||
"k8s.io/klog/v2"
|
||||
)
|
||||
|
||||
const (
|
||||
ChatPrimedTokens = 2
|
||||
KimiTopP = 0.95
|
||||
)
|
||||
|
||||
type ChatService struct {
|
||||
client *openai.Client
|
||||
store *ccache.Cache[ChatMessage]
|
||||
params ChatCompletionParams
|
||||
}
|
||||
|
||||
type ChatCompletionParams struct {
|
||||
Model string `json:"model"`
|
||||
MaxTokens int `json:"max_tokens,omitempty"`
|
||||
Temperature float32 `json:"temperature,omitempty"`
|
||||
PresencePenalty float32 `json:"presence_penalty,omitempty"`
|
||||
FrequencyPenalty float32 `json:"frequency_penalty,omitempty"`
|
||||
ChatSessionTTL time.Duration `json:"chat_session_ttl"`
|
||||
ChatMinResponseTokens int `json:"chat_min_response_tokens"`
|
||||
}
|
||||
|
||||
type ChatMessageRequest struct {
|
||||
Prompt string `json:"prompt"`
|
||||
Options ChatMessageRequestOptions `json:"options"`
|
||||
}
|
||||
|
||||
type ChatMessageRequestOptions struct {
|
||||
Name string `json:"name"`
|
||||
ParentMessageId string `json:"parentMessageId"`
|
||||
}
|
||||
|
||||
type ChatMessage struct {
|
||||
ID string `json:"id"`
|
||||
Text string `json:"text"`
|
||||
Role string `json:"role"`
|
||||
Name string `json:"name"`
|
||||
Delta string `json:"delta"`
|
||||
Detail openai.ChatCompletionStreamResponse `json:"detail"`
|
||||
TokenCount int `json:"tokenCount"`
|
||||
ParentMessageId string `json:"parentMessageId"`
|
||||
}
|
||||
|
||||
func NewChatService(apiKey string, baseURL string, socksProxy string, params ChatCompletionParams) (*ChatService, error) {
|
||||
config := openai.DefaultConfig(apiKey)
|
||||
if baseURL != "" {
|
||||
config.BaseURL = baseURL
|
||||
}
|
||||
klog.Infof("use openai base url: %s", config.BaseURL)
|
||||
if socksProxy != "" {
|
||||
proxyUrl, err := url.Parse(socksProxy) //socks5://user:password@127.0.0.1:1080
|
||||
if err != nil {
|
||||
return nil, err
|
||||
}
|
||||
config.HTTPClient = &http.Client{
|
||||
Transport: &http.Transport{
|
||||
Proxy: http.ProxyURL(proxyUrl),
|
||||
},
|
||||
}
|
||||
klog.Infof("use sock proxy: %s", proxyUrl)
|
||||
}
|
||||
chat := ChatService{
|
||||
client: openai.NewClientWithConfig(config),
|
||||
params: params,
|
||||
store: ccache.New(ccache.Configure[ChatMessage]()),
|
||||
}
|
||||
return &chat, nil
|
||||
}
|
||||
|
||||
func (chat *ChatService) ChatProcess(ctx *gin.Context) {
|
||||
payload := ChatMessageRequest{}
|
||||
if err := ctx.BindJSON(&payload); err != nil {
|
||||
klog.Error(err)
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Fail",
|
||||
"message": fmt.Sprintf("%v", err),
|
||||
"data": nil,
|
||||
})
|
||||
return
|
||||
}
|
||||
|
||||
messageID := uuid.New().String()
|
||||
|
||||
message := ChatMessage{
|
||||
ID: messageID,
|
||||
Role: openai.ChatMessageRoleUser,
|
||||
Text: payload.Prompt,
|
||||
ParentMessageId: payload.Options.ParentMessageId,
|
||||
}
|
||||
|
||||
result := ChatMessage{
|
||||
ID: uuid.New().String(),
|
||||
Role: openai.ChatMessageRoleAssistant,
|
||||
Text: "",
|
||||
ParentMessageId: messageID,
|
||||
}
|
||||
|
||||
messages, numTokens, tokenCount, err := chat.buildMessage(payload)
|
||||
if err != nil {
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Fail",
|
||||
"message": fmt.Sprintf("%v", err),
|
||||
"data": nil,
|
||||
})
|
||||
return
|
||||
}
|
||||
|
||||
message.TokenCount = tokenCount
|
||||
chat.store.Set(messageID, message, chat.params.ChatSessionTTL)
|
||||
|
||||
//klog.Infof("send message %d tokens, set completion %d max tokens", numTokens, chat.params.MaxTokens-numTokens)
|
||||
|
||||
stream, err := chat.client.CreateChatCompletionStream(ctx, openai.ChatCompletionRequest{
|
||||
Model: chat.params.Model,
|
||||
Messages: messages,
|
||||
MaxTokens: chat.params.MaxTokens - numTokens,
|
||||
Temperature: chat.params.Temperature,
|
||||
PresencePenalty: chat.params.PresencePenalty,
|
||||
FrequencyPenalty: chat.params.FrequencyPenalty,
|
||||
TopP: chat.topP(),
|
||||
Stream: true,
|
||||
})
|
||||
if err != nil {
|
||||
klog.Error(err)
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Fail",
|
||||
"message": fmt.Sprintf("%v", err),
|
||||
"data": nil,
|
||||
})
|
||||
return
|
||||
}
|
||||
defer stream.Close()
|
||||
|
||||
resp := stream.GetResponse()
|
||||
if resp.StatusCode != 200 {
|
||||
bts, _ := io.ReadAll(resp.Body)
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Fail",
|
||||
"message": fmt.Sprintf("%v", string(bts)),
|
||||
"data": nil,
|
||||
})
|
||||
return
|
||||
}
|
||||
|
||||
firstChunk := true
|
||||
ctx.Header("Content-type", "application/octet-stream")
|
||||
for {
|
||||
rsp, err := stream.Recv()
|
||||
if errors.Is(err, io.EOF) {
|
||||
go func() {
|
||||
tokenCount, err := tokenizer.GetTokenCount(openai.ChatCompletionMessage{
|
||||
Role: result.Role,
|
||||
Content: result.Text,
|
||||
Name: result.Name,
|
||||
}, chat.params.Model)
|
||||
if err != nil {
|
||||
klog.Error(err)
|
||||
}
|
||||
result.TokenCount = tokenCount
|
||||
chat.store.Set(result.ID, result, chat.params.ChatSessionTTL)
|
||||
}()
|
||||
return
|
||||
}
|
||||
|
||||
if err != nil {
|
||||
klog.Error(err)
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Fail",
|
||||
"message": fmt.Sprintf("OpenAI Event Error %v", err),
|
||||
"data": nil,
|
||||
})
|
||||
return
|
||||
}
|
||||
|
||||
if rsp.ID != "" {
|
||||
result.ID = rsp.ID
|
||||
}
|
||||
|
||||
if len(rsp.Choices) > 0 {
|
||||
content := rsp.Choices[0].Delta.Content
|
||||
result.Delta = content
|
||||
if len(content) > 0 {
|
||||
result.Text += content
|
||||
}
|
||||
result.Detail = rsp
|
||||
}
|
||||
|
||||
bts, err := json.Marshal(result)
|
||||
if err != nil {
|
||||
klog.Error(err)
|
||||
ctx.JSON(200, gin.H{
|
||||
"status": "Fail",
|
||||
"message": fmt.Sprintf("OpenAI Event Marshal Error %v", err),
|
||||
"data": nil,
|
||||
})
|
||||
return
|
||||
}
|
||||
|
||||
if !firstChunk {
|
||||
ctx.Writer.Write([]byte("\n"))
|
||||
} else {
|
||||
firstChunk = false
|
||||
}
|
||||
|
||||
if _, err := ctx.Writer.Write(bts); err != nil {
|
||||
klog.Error(err)
|
||||
return
|
||||
}
|
||||
|
||||
ctx.Writer.Flush()
|
||||
}
|
||||
}
|
||||
|
||||
func (chat *ChatService) topP() float32 {
|
||||
if strings.HasPrefix(chat.params.Model, "kimi-") || strings.HasPrefix(chat.params.Model, "moonshot-") {
|
||||
return KimiTopP
|
||||
}
|
||||
return 1
|
||||
}
|
||||
|
||||
func (chat *ChatService) buildMessage(payload ChatMessageRequest) ([]openai.ChatCompletionMessage, int, int, error) {
|
||||
parentMessageId := payload.Options.ParentMessageId
|
||||
messages := []openai.ChatCompletionMessage{}
|
||||
tokenCount := 0
|
||||
var err error
|
||||
if len(payload.Prompt) > 0 {
|
||||
chatMessage := openai.ChatCompletionMessage{
|
||||
Role: openai.ChatMessageRoleUser,
|
||||
Content: payload.Prompt,
|
||||
Name: payload.Options.Name,
|
||||
}
|
||||
messages = append(messages, chatMessage)
|
||||
tokenCount, err = tokenizer.GetTokenCount(chatMessage, chat.params.Model)
|
||||
if err != nil {
|
||||
return nil, 0, 0, err
|
||||
}
|
||||
if tokenCount >= (chat.params.MaxTokens - chat.params.ChatMinResponseTokens) {
|
||||
return nil, 0, 0, fmt.Errorf("this model's maximum context length is %d tokens. you requested %d tokens in the messages", chat.params.MaxTokens, tokenCount)
|
||||
}
|
||||
}
|
||||
numTokens := tokenCount + ChatPrimedTokens
|
||||
for {
|
||||
if parentMessageId == "" {
|
||||
break
|
||||
}
|
||||
parentMessage, ok := chat.getMessageByID(parentMessageId)
|
||||
if !ok {
|
||||
break
|
||||
}
|
||||
parentCompletioMessage := openai.ChatCompletionMessage{
|
||||
Role: parentMessage.Role,
|
||||
Content: parentMessage.Text,
|
||||
Name: parentMessage.Name,
|
||||
}
|
||||
if (numTokens + parentMessage.TokenCount) >= (chat.params.MaxTokens - chat.params.ChatMinResponseTokens) {
|
||||
break
|
||||
}
|
||||
numTokens += parentMessage.TokenCount
|
||||
messages = append(messages, parentCompletioMessage)
|
||||
parentMessageId = parentMessage.ParentMessageId
|
||||
}
|
||||
utils.Reverse(messages)
|
||||
return messages, numTokens, tokenCount, nil
|
||||
}
|
||||
|
||||
func (chat *ChatService) getMessageByID(id string) (ChatMessage, bool) {
|
||||
item := chat.store.Get(id)
|
||||
if item == nil {
|
||||
return ChatMessage{}, false
|
||||
}
|
||||
if item.Expired() {
|
||||
return ChatMessage{}, false
|
||||
}
|
||||
return item.Value(), true
|
||||
}
|
||||
23
chatgpt-web-backend/pkg/middlewares/rate_limit.go
Normal file
23
chatgpt-web-backend/pkg/middlewares/rate_limit.go
Normal file
@@ -0,0 +1,23 @@
|
||||
package middlewares
|
||||
|
||||
import (
|
||||
"github.com/gin-gonic/gin"
|
||||
"golang.org/x/time/rate"
|
||||
)
|
||||
|
||||
func RateLimitMiddleware(r rate.Limit, b int) gin.HandlerFunc {
|
||||
limiter := rate.NewLimiter(r, b)
|
||||
return func(c *gin.Context) {
|
||||
if !limiter.Allow() {
|
||||
// 请求被限制,返回错误信息
|
||||
c.JSON(429, gin.H{
|
||||
"status": "Fail",
|
||||
"message": "Too many requests, please try again later",
|
||||
"data": nil,
|
||||
})
|
||||
c.Abort()
|
||||
return
|
||||
}
|
||||
c.Next()
|
||||
}
|
||||
}
|
||||
43
chatgpt-web-backend/pkg/tokenizer/tokenizer.go
Normal file
43
chatgpt-web-backend/pkg/tokenizer/tokenizer.go
Normal file
@@ -0,0 +1,43 @@
|
||||
package tokenizer
|
||||
|
||||
import (
|
||||
"bytes"
|
||||
"encoding/json"
|
||||
"fmt"
|
||||
"net/http"
|
||||
|
||||
"github.com/sashabaranov/go-openai"
|
||||
)
|
||||
|
||||
type tokenInfo struct {
|
||||
Code int `json:"code"`
|
||||
Count int `json:"num_tokens"`
|
||||
Msg string `json:"msg"`
|
||||
}
|
||||
|
||||
func GetTokenCount(message openai.ChatCompletionMessage, model string) (int, error) {
|
||||
url := fmt.Sprintf("http://127.0.0.1:5000/tokenizer/%s", model)
|
||||
info := tokenInfo{}
|
||||
if err := postJSON(url, &message, &info); err != nil {
|
||||
return 0, err
|
||||
}
|
||||
if info.Code != 200 {
|
||||
return 0, fmt.Errorf("%v", info.Msg)
|
||||
}
|
||||
return info.Count, nil
|
||||
}
|
||||
|
||||
func postJSON(url string, requestData *openai.ChatCompletionMessage, responseData *tokenInfo) error {
|
||||
requestBody, err := json.Marshal(requestData)
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
|
||||
resp, err := http.Post(url, "application/json", bytes.NewBuffer(requestBody))
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
defer resp.Body.Close()
|
||||
|
||||
return json.NewDecoder(resp.Body).Decode(responseData)
|
||||
}
|
||||
65
chatgpt-web-backend/pkg/utils/utils.go
Normal file
65
chatgpt-web-backend/pkg/utils/utils.go
Normal file
@@ -0,0 +1,65 @@
|
||||
package utils
|
||||
|
||||
import (
|
||||
"io/ioutil"
|
||||
"os"
|
||||
"path/filepath"
|
||||
"strings"
|
||||
|
||||
"k8s.io/klog/v2"
|
||||
)
|
||||
|
||||
func ReplaceInFile(filePath string, targetStr string, replaceStr string) error {
|
||||
// 读取文件内容
|
||||
content, err := ioutil.ReadFile(filePath)
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
// 判断是否需要替换
|
||||
if !strings.Contains(string(content), targetStr) {
|
||||
return nil
|
||||
}
|
||||
|
||||
// 替换字符串并写回文件,保持原有 filemode
|
||||
info, err := os.Stat(filePath)
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
newContent := strings.ReplaceAll(string(content), targetStr, replaceStr)
|
||||
err = ioutil.WriteFile(filePath, []byte(newContent), info.Mode())
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
klog.Infof("Replaced in file: %s\n", filePath)
|
||||
return nil
|
||||
}
|
||||
|
||||
func ReplaceFiles(rootDir string, replacePairs map[string]string) error {
|
||||
err := filepath.Walk(rootDir, func(path string, info os.FileInfo, err error) error {
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
// 如果当前路径是目录,则继续遍历
|
||||
if info.IsDir() {
|
||||
return nil
|
||||
}
|
||||
// 处理文件
|
||||
for targetStr, replaceStr := range replacePairs {
|
||||
err = ReplaceInFile(path, targetStr, replaceStr)
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
}
|
||||
return nil
|
||||
})
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
return nil
|
||||
}
|
||||
|
||||
func Reverse[S ~[]E, E any](s S) {
|
||||
for i, j := 0, len(s)-1; i < j; i, j = i+1, j-1 {
|
||||
s[i], s[j] = s[j], s[i]
|
||||
}
|
||||
}
|
||||
2
chatgpt-web-backend/requirements.txt
Normal file
2
chatgpt-web-backend/requirements.txt
Normal file
@@ -0,0 +1,2 @@
|
||||
nuxt>=0.2.0
|
||||
tiktoken>=0.3.3
|
||||
1
chatgpt-web-backend/tests/test.txt
Normal file
1
chatgpt-web-backend/tests/test.txt
Normal file
@@ -0,0 +1 @@
|
||||
{avatar:"https://raw.githubusercontent.com/Chanzhaoyu/chatgpt-web/main/src/assets/avatar.jpg",name:"ChatGPT",description:'知之为知之'}
|
||||
65
chatgpt-web-backend/tokenizer.py
Normal file
65
chatgpt-web-backend/tokenizer.py
Normal file
@@ -0,0 +1,65 @@
|
||||
from nuxt import route, logger, Request
|
||||
from nuxt.repositorys.validation import fields, use_args
|
||||
import traceback
|
||||
import tiktoken
|
||||
|
||||
encoding_cache = {}
|
||||
|
||||
support_models = set(["kimi-k2.5",
|
||||
"gpt-3.5-turbo",
|
||||
"gpt-3.5-turbo-16k",
|
||||
"gpt-4",
|
||||
"gpt-4-32k"])
|
||||
|
||||
support_model_prefixes = (
|
||||
"gpt-3.5-turbo-",
|
||||
"gpt-4-",
|
||||
"moonshot-",
|
||||
"kimi-",
|
||||
)
|
||||
|
||||
|
||||
@route("/tokenizer/<str:model_name>", methods=["POST"])
|
||||
@use_args({
|
||||
"role": fields.Str(required=True),
|
||||
"content": fields.Str(required=True),
|
||||
"name": fields.Str(required=False)
|
||||
}, location="json")
|
||||
def get_num_tokens(req: Request, message: dict, model_name: str):
|
||||
try:
|
||||
return {
|
||||
"code": 200,
|
||||
"num_tokens": num_tokens_from_messages([message], model=model_name)
|
||||
}
|
||||
except Exception as e:
|
||||
logger.error(traceback.format_exc())
|
||||
return {
|
||||
"code": 500,
|
||||
"msg": "{}".format(e)
|
||||
}
|
||||
|
||||
|
||||
def num_tokens_from_messages(messages, model="gpt-3.5-turbo"):
|
||||
"""Returns the number of tokens used by a list of messages."""
|
||||
encoding = None
|
||||
if model in encoding_cache:
|
||||
encoding = encoding_cache.get(model)
|
||||
else:
|
||||
try:
|
||||
encoding = tiktoken.encoding_for_model(model)
|
||||
except KeyError:
|
||||
encoding = tiktoken.get_encoding("cl100k_base")
|
||||
encoding_cache[model] = encoding
|
||||
if model in support_models or model.startswith(support_model_prefixes):
|
||||
num_tokens = 0
|
||||
for message in messages:
|
||||
num_tokens += 4 # every message follows <im_start>{role/name}\n{content}<im_end>\n
|
||||
for key, value in message.items():
|
||||
num_tokens += len(encoding.encode(value))
|
||||
if key == "name": # if there's a name, the role is omitted
|
||||
num_tokens += -1 # role is always required and always 1 token
|
||||
num_tokens += 3 # every reply is primed with <im_start>assistant
|
||||
return num_tokens
|
||||
else:
|
||||
raise NotImplementedError(f"""num_tokens_from_messages() is not presently implemented for model {model}.
|
||||
See https://github.com/openai/openai-python/blob/main/chatml.md for information on how messages are converted to tokens.""")
|
||||
Reference in New Issue
Block a user