2024-07-25 11:30:49 +02:00
|
|
|
// Copyright 2024, Command Line Inc.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0
|
|
|
|
|
|
|
|
package waveai
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"encoding/json"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
"log"
|
|
|
|
"os"
|
2024-10-09 22:36:02 +02:00
|
|
|
"regexp"
|
|
|
|
"strings"
|
2024-07-25 11:30:49 +02:00
|
|
|
"time"
|
|
|
|
|
|
|
|
openaiapi "github.com/sashabaranov/go-openai"
|
2024-09-05 23:25:45 +02:00
|
|
|
"github.com/wavetermdev/waveterm/pkg/wavebase"
|
|
|
|
"github.com/wavetermdev/waveterm/pkg/wcloud"
|
|
|
|
"github.com/wavetermdev/waveterm/pkg/wshrpc"
|
2024-07-25 11:30:49 +02:00
|
|
|
|
|
|
|
"github.com/gorilla/websocket"
|
|
|
|
)
|
|
|
|
|
|
|
|
// Wire-level identifiers and defaults shared by the AI request code.
const (
	// OpenAIPacketStr is the Type value stamped on packets built by
	// MakeOpenAIPacket.
	OpenAIPacketStr = "openai"

	// OpenAICloudReqStr is the Type value stamped on packets built by
	// MakeOpenAICloudReqPacket.
	OpenAICloudReqStr = "openai-cloudreq"

	// PacketEOFStr is the sentinel carried in a packet's Error field to
	// mark the end of a cloud response stream.
	PacketEOFStr = "EOF"

	// DefaultAzureAPIVersion is the API version assigned to the client
	// config when an Azure-flavored API type is selected.
	DefaultAzureAPIVersion = "2023-05-15"
)
|
2024-07-25 11:30:49 +02:00
|
|
|
|
|
|
|
// OpenAICmdInfoPacketOutputType is the JSON shape of an assistant reply.
// Every field is optional and is left out of the encoded form when it holds
// its zero value.
type OpenAICmdInfoPacketOutputType struct {
	Model        string `json:"model,omitempty"`         // model name
	Created      int64  `json:"created,omitempty"`       // creation timestamp
	FinishReason string `json:"finish_reason,omitempty"` // finish reason, if any
	Message      string `json:"message,omitempty"`       // reply text
	Error        string `json:"error,omitempty"`         // error text, if any
}
|
|
|
|
|
2024-07-26 22:30:11 +02:00
|
|
|
func MakeOpenAIPacket() *wshrpc.OpenAIPacketType {
|
|
|
|
return &wshrpc.OpenAIPacketType{Type: OpenAIPacketStr}
|
2024-07-25 11:30:49 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
type OpenAICmdInfoChatMessage struct {
|
|
|
|
MessageID int `json:"messageid"`
|
|
|
|
IsAssistantResponse bool `json:"isassistantresponse,omitempty"`
|
|
|
|
AssistantResponse *OpenAICmdInfoPacketOutputType `json:"assistantresponse,omitempty"`
|
|
|
|
UserQuery string `json:"userquery,omitempty"`
|
|
|
|
UserEngineeredQuery string `json:"userengineeredquery,omitempty"`
|
|
|
|
}
|
|
|
|
|
|
|
|
type OpenAICloudReqPacketType struct {
|
2024-07-26 22:30:11 +02:00
|
|
|
Type string `json:"type"`
|
|
|
|
ClientId string `json:"clientid"`
|
|
|
|
Prompt []wshrpc.OpenAIPromptMessageType `json:"prompt"`
|
|
|
|
MaxTokens int `json:"maxtokens,omitempty"`
|
|
|
|
MaxChoices int `json:"maxchoices,omitempty"`
|
2024-07-25 11:30:49 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
func MakeOpenAICloudReqPacket() *OpenAICloudReqPacketType {
|
|
|
|
return &OpenAICloudReqPacketType{
|
|
|
|
Type: OpenAICloudReqStr,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func GetWSEndpoint() string {
|
|
|
|
if !wavebase.IsDevMode() {
|
2024-10-09 22:36:02 +02:00
|
|
|
return WCloudWSEndpoint
|
2024-07-25 11:30:49 +02:00
|
|
|
} else {
|
2024-10-09 22:36:02 +02:00
|
|
|
endpoint := os.Getenv(WCloudWSEndpointVarName)
|
2024-07-25 11:30:49 +02:00
|
|
|
if endpoint == "" {
|
2024-10-09 22:36:02 +02:00
|
|
|
panic("Invalid WCloud websocket dev endpoint, WCLOUD_WS_ENDPOINT not set or invalid")
|
2024-07-25 11:30:49 +02:00
|
|
|
}
|
|
|
|
return endpoint
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-10-09 22:36:02 +02:00
|
|
|
// Defaults and endpoint settings for AI requests.
const (
	// DefaultMaxTokens is the default token limit.
	DefaultMaxTokens = 2048

	// DefaultModel is the default model name.
	DefaultModel = "gpt-4o-mini"

	// WCloudWSEndpoint is the production cloud websocket URL returned by
	// GetWSEndpoint outside of dev mode.
	WCloudWSEndpoint = "wss://wsapi.waveterm.dev/"

	// WCloudWSEndpointVarName names the environment variable that
	// GetWSEndpoint reads in dev mode.
	WCloudWSEndpointVarName = "WCLOUD_WS_ENDPOINT"

	// CloudWebsocketConnectTimeout bounds how long
	// RunCloudCompletionStream waits for the websocket dial.
	CloudWebsocketConnectTimeout = 1 * time.Minute
)
|
|
|
|
|
2024-10-09 22:36:02 +02:00
|
|
|
func IsCloudAIRequest(opts *wshrpc.OpenAIOptsType) bool {
|
|
|
|
if opts == nil {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
return opts.BaseURL == "" && opts.APIToken == ""
|
|
|
|
}
|
|
|
|
|
2024-07-26 22:30:11 +02:00
|
|
|
func convertUsage(resp openaiapi.ChatCompletionResponse) *wshrpc.OpenAIUsageType {
|
2024-07-25 11:30:49 +02:00
|
|
|
if resp.Usage.TotalTokens == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
2024-07-26 22:30:11 +02:00
|
|
|
return &wshrpc.OpenAIUsageType{
|
2024-07-25 11:30:49 +02:00
|
|
|
PromptTokens: resp.Usage.PromptTokens,
|
|
|
|
CompletionTokens: resp.Usage.CompletionTokens,
|
|
|
|
TotalTokens: resp.Usage.TotalTokens,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-07-26 22:30:11 +02:00
|
|
|
func ConvertPrompt(prompt []wshrpc.OpenAIPromptMessageType) []openaiapi.ChatCompletionMessage {
|
2024-07-25 11:30:49 +02:00
|
|
|
var rtn []openaiapi.ChatCompletionMessage
|
|
|
|
for _, p := range prompt {
|
|
|
|
msg := openaiapi.ChatCompletionMessage{Role: p.Role, Content: p.Content, Name: p.Name}
|
|
|
|
rtn = append(rtn, msg)
|
|
|
|
}
|
|
|
|
return rtn
|
|
|
|
}
|
|
|
|
|
2024-08-09 03:24:54 +02:00
|
|
|
func makeAIError(err error) wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
|
|
|
|
return wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: err}
|
|
|
|
}
|
|
|
|
|
2024-10-09 22:36:02 +02:00
|
|
|
func RunAICommand(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
|
|
|
|
if IsCloudAIRequest(request.Opts) {
|
|
|
|
log.Print("sending ai chat message to default waveterm cloud endpoint\n")
|
|
|
|
return RunCloudCompletionStream(ctx, request)
|
|
|
|
}
|
|
|
|
log.Printf("sending ai chat message to user-configured endpoint %s\n", request.Opts.BaseURL)
|
|
|
|
return RunLocalCompletionStream(ctx, request)
|
|
|
|
}
|
|
|
|
|
2024-07-26 22:30:11 +02:00
|
|
|
func RunCloudCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
|
|
|
|
rtn := make(chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType])
|
2024-08-09 03:24:54 +02:00
|
|
|
wsEndpoint := wcloud.GetWSEndpoint()
|
2024-07-25 11:30:49 +02:00
|
|
|
go func() {
|
|
|
|
defer close(rtn)
|
2024-08-09 03:24:54 +02:00
|
|
|
if wsEndpoint == "" {
|
|
|
|
rtn <- makeAIError(fmt.Errorf("no cloud ws endpoint found"))
|
|
|
|
return
|
|
|
|
}
|
2024-07-25 11:30:49 +02:00
|
|
|
if request.Opts == nil {
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("no openai opts found"))
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
|
|
|
websocketContext, dialCancelFn := context.WithTimeout(context.Background(), CloudWebsocketConnectTimeout)
|
|
|
|
defer dialCancelFn()
|
2024-08-09 03:24:54 +02:00
|
|
|
conn, _, err := websocket.DefaultDialer.DialContext(websocketContext, wsEndpoint, nil)
|
2024-07-25 11:30:49 +02:00
|
|
|
if err == context.DeadlineExceeded {
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("OpenAI request, timed out connecting to cloud server: %v", err))
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
} else if err != nil {
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("OpenAI request, websocket connect error: %v", err))
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
2024-07-26 22:30:11 +02:00
|
|
|
defer func() {
|
|
|
|
err = conn.Close()
|
|
|
|
if err != nil {
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("unable to close openai channel: %v", err))
|
2024-07-26 22:30:11 +02:00
|
|
|
}
|
|
|
|
}()
|
2024-10-09 23:50:56 +02:00
|
|
|
var sendablePromptMsgs []wshrpc.OpenAIPromptMessageType
|
|
|
|
for _, promptMsg := range request.Prompt {
|
|
|
|
if promptMsg.Role == "error" {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
sendablePromptMsgs = append(sendablePromptMsgs, promptMsg)
|
|
|
|
}
|
2024-07-25 11:30:49 +02:00
|
|
|
reqPk := MakeOpenAICloudReqPacket()
|
|
|
|
reqPk.ClientId = request.ClientId
|
2024-10-09 23:50:56 +02:00
|
|
|
reqPk.Prompt = sendablePromptMsgs
|
2024-07-25 11:30:49 +02:00
|
|
|
reqPk.MaxTokens = request.Opts.MaxTokens
|
|
|
|
reqPk.MaxChoices = request.Opts.MaxChoices
|
|
|
|
configMessageBuf, err := json.Marshal(reqPk)
|
|
|
|
if err != nil {
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("OpenAI request, packet marshal error: %v", err))
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
|
|
|
err = conn.WriteMessage(websocket.TextMessage, configMessageBuf)
|
|
|
|
if err != nil {
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("OpenAI request, websocket write config error: %v", err))
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
|
|
|
for {
|
|
|
|
_, socketMessage, err := conn.ReadMessage()
|
|
|
|
if err == io.EOF {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
log.Printf("err received: %v", err)
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("OpenAI request, websocket error reading message: %v", err))
|
2024-07-25 11:30:49 +02:00
|
|
|
break
|
|
|
|
}
|
2024-07-26 22:30:11 +02:00
|
|
|
var streamResp *wshrpc.OpenAIPacketType
|
2024-07-25 11:30:49 +02:00
|
|
|
err = json.Unmarshal(socketMessage, &streamResp)
|
|
|
|
if err != nil {
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("OpenAI request, websocket response json decode error: %v", err))
|
2024-07-25 11:30:49 +02:00
|
|
|
break
|
|
|
|
}
|
|
|
|
if streamResp.Error == PacketEOFStr {
|
|
|
|
// got eof packet from socket
|
|
|
|
break
|
|
|
|
} else if streamResp.Error != "" {
|
|
|
|
// use error from server directly
|
2024-08-09 03:24:54 +02:00
|
|
|
rtn <- makeAIError(fmt.Errorf("%v", streamResp.Error))
|
2024-07-25 11:30:49 +02:00
|
|
|
break
|
|
|
|
}
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Response: *streamResp}
|
2024-07-25 11:30:49 +02:00
|
|
|
}
|
|
|
|
}()
|
|
|
|
return rtn
|
|
|
|
}
|
|
|
|
|
2024-10-09 22:36:02 +02:00
|
|
|
// azureModelNameStripRe matches the characters removed from a model name by
// defaultAzureMapperFn. It is compiled once at package initialization instead
// of on every call.
var azureModelNameStripRe = regexp.MustCompile(`[.:]`)

// defaultAzureMapperFn returns model with every '.' and ':' character
// removed, e.g. "gpt-3.5-turbo" becomes "gpt-35-turbo". setApiType installs
// it as the Azure model mapper.
//
// copied from go-openai/config.go
func defaultAzureMapperFn(model string) string {
	return azureModelNameStripRe.ReplaceAllString(model, "")
}
|
|
|
|
|
2024-10-09 23:50:56 +02:00
|
|
|
func setApiType(opts *wshrpc.OpenAIOptsType, clientConfig *openaiapi.ClientConfig) error {
|
2024-10-09 22:36:02 +02:00
|
|
|
ourApiType := strings.ToLower(opts.APIType)
|
2024-10-09 23:50:56 +02:00
|
|
|
if ourApiType == "" || ourApiType == strings.ToLower(string(openaiapi.APITypeOpenAI)) {
|
|
|
|
clientConfig.APIType = openaiapi.APITypeOpenAI
|
2024-10-09 22:36:02 +02:00
|
|
|
return nil
|
2024-10-09 23:50:56 +02:00
|
|
|
} else if ourApiType == strings.ToLower(string(openaiapi.APITypeAzure)) {
|
|
|
|
clientConfig.APIType = openaiapi.APITypeAzure
|
2024-10-09 22:36:02 +02:00
|
|
|
clientConfig.APIVersion = DefaultAzureAPIVersion
|
|
|
|
clientConfig.AzureModelMapperFunc = defaultAzureMapperFn
|
|
|
|
return nil
|
2024-10-09 23:50:56 +02:00
|
|
|
} else if ourApiType == strings.ToLower(string(openaiapi.APITypeAzureAD)) {
|
|
|
|
clientConfig.APIType = openaiapi.APITypeAzureAD
|
2024-10-09 22:36:02 +02:00
|
|
|
clientConfig.APIVersion = DefaultAzureAPIVersion
|
|
|
|
clientConfig.AzureModelMapperFunc = defaultAzureMapperFn
|
|
|
|
return nil
|
2024-10-09 23:50:56 +02:00
|
|
|
} else if ourApiType == strings.ToLower(string(openaiapi.APITypeCloudflareAzure)) {
|
|
|
|
clientConfig.APIType = openaiapi.APITypeCloudflareAzure
|
2024-10-09 22:36:02 +02:00
|
|
|
clientConfig.APIVersion = DefaultAzureAPIVersion
|
|
|
|
clientConfig.AzureModelMapperFunc = defaultAzureMapperFn
|
|
|
|
return nil
|
|
|
|
} else {
|
|
|
|
return fmt.Errorf("invalid api type %q", opts.APIType)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-07-26 22:30:11 +02:00
|
|
|
func RunLocalCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
|
|
|
|
rtn := make(chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType])
|
2024-07-25 11:30:49 +02:00
|
|
|
go func() {
|
|
|
|
defer close(rtn)
|
|
|
|
if request.Opts == nil {
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: fmt.Errorf("no openai opts found")}
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
|
|
|
if request.Opts.Model == "" {
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: fmt.Errorf("no openai model specified")}
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
|
|
|
if request.Opts.BaseURL == "" && request.Opts.APIToken == "" {
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: fmt.Errorf("no api token")}
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
|
|
|
clientConfig := openaiapi.DefaultConfig(request.Opts.APIToken)
|
|
|
|
if request.Opts.BaseURL != "" {
|
|
|
|
clientConfig.BaseURL = request.Opts.BaseURL
|
|
|
|
}
|
2024-10-09 22:36:02 +02:00
|
|
|
err := setApiType(request.Opts, &clientConfig)
|
|
|
|
if err != nil {
|
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: err}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if request.Opts.OrgID != "" {
|
|
|
|
clientConfig.OrgID = request.Opts.OrgID
|
|
|
|
}
|
|
|
|
if request.Opts.APIVersion != "" {
|
|
|
|
clientConfig.APIVersion = request.Opts.APIVersion
|
|
|
|
}
|
2024-07-25 11:30:49 +02:00
|
|
|
client := openaiapi.NewClientWithConfig(clientConfig)
|
|
|
|
req := openaiapi.ChatCompletionRequest{
|
|
|
|
Model: request.Opts.Model,
|
|
|
|
Messages: ConvertPrompt(request.Prompt),
|
|
|
|
MaxTokens: request.Opts.MaxTokens,
|
|
|
|
Stream: true,
|
|
|
|
}
|
|
|
|
if request.Opts.MaxChoices > 1 {
|
|
|
|
req.N = request.Opts.MaxChoices
|
|
|
|
}
|
|
|
|
apiResp, err := client.CreateChatCompletionStream(ctx, req)
|
|
|
|
if err != nil {
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: fmt.Errorf("error calling openai API: %v", err)}
|
2024-07-25 11:30:49 +02:00
|
|
|
return
|
|
|
|
}
|
|
|
|
sentHeader := false
|
|
|
|
for {
|
|
|
|
streamResp, err := apiResp.Recv()
|
|
|
|
if err == io.EOF {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
log.Printf("err received2: %v", err)
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: fmt.Errorf("OpenAI request, websocket error reading message: %v", err)}
|
2024-07-25 11:30:49 +02:00
|
|
|
break
|
|
|
|
}
|
|
|
|
if streamResp.Model != "" && !sentHeader {
|
|
|
|
pk := MakeOpenAIPacket()
|
|
|
|
pk.Model = streamResp.Model
|
|
|
|
pk.Created = streamResp.Created
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Response: *pk}
|
2024-07-25 11:30:49 +02:00
|
|
|
sentHeader = true
|
|
|
|
}
|
|
|
|
for _, choice := range streamResp.Choices {
|
|
|
|
pk := MakeOpenAIPacket()
|
|
|
|
pk.Index = choice.Index
|
|
|
|
pk.Text = choice.Delta.Content
|
|
|
|
pk.FinishReason = string(choice.FinishReason)
|
2024-07-26 22:30:11 +02:00
|
|
|
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Response: *pk}
|
2024-07-25 11:30:49 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
return rtn
|
|
|
|
}
|