azure ai support (#997)

This commit is contained in:
Mike Sawka 2024-10-09 13:36:02 -07:00 committed by GitHub
parent b81ab63ddc
commit f33028af1d
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
8 changed files with 100 additions and 68 deletions

View File

@ -194,12 +194,15 @@ export class WaveAiModel implements ViewModel {
}; };
addMessage(newMessage); addMessage(newMessage);
// send message to backend and get response // send message to backend and get response
const settings = globalStore.get(atoms.settingsAtom); const settings = globalStore.get(atoms.settingsAtom) ?? {};
const opts: OpenAIOptsType = { const opts: OpenAIOptsType = {
model: settings["ai:model"], model: settings["ai:model"],
apitype: settings["ai:apitype"],
orgid: settings["ai:orgid"],
apitoken: settings["ai:apitoken"], apitoken: settings["ai:apitoken"],
apiversion: settings["ai:apiversion"],
maxtokens: settings["ai:maxtokens"], maxtokens: settings["ai:maxtokens"],
timeout: settings["ai:timeoutms"] / 1000, timeoutms: settings["ai:timeoutms"] ?? 60000,
baseurl: settings["ai:baseurl"], baseurl: settings["ai:baseurl"],
}; };
const newPrompt: OpenAIPromptMessageType = { const newPrompt: OpenAIPromptMessageType = {
@ -222,7 +225,7 @@ export class WaveAiModel implements ViewModel {
opts: opts, opts: opts,
prompt: [...history, newPrompt], prompt: [...history, newPrompt],
}; };
const aiGen = RpcApi.StreamWaveAiCommand(WindowRpcClient, beMsg, { timeout: 60000 }); const aiGen = RpcApi.StreamWaveAiCommand(WindowRpcClient, beMsg, { timeout: opts.timeoutms });
let fullMsg = ""; let fullMsg = "";
for await (const msg of aiGen) { for await (const msg of aiGen) {
fullMsg += msg.text ?? ""; fullMsg += msg.text ?? "";

View File

@ -329,11 +329,14 @@ declare global {
// wshrpc.OpenAIOptsType // wshrpc.OpenAIOptsType
type OpenAIOptsType = { type OpenAIOptsType = {
model: string; model: string;
apitype?: string;
apitoken: string; apitoken: string;
orgid?: string;
apiversion?: string;
baseurl?: string; baseurl?: string;
maxtokens?: number; maxtokens?: number;
maxchoices?: number; maxchoices?: number;
timeout?: number; timeoutms?: number;
}; };
// wshrpc.OpenAIPacketType // wshrpc.OpenAIPacketType
@ -413,10 +416,13 @@ declare global {
// wconfig.SettingsType // wconfig.SettingsType
type SettingsType = { type SettingsType = {
"ai:*"?: boolean; "ai:*"?: boolean;
"ai:apitype"?: string;
"ai:baseurl"?: string; "ai:baseurl"?: string;
"ai:apitoken"?: string; "ai:apitoken"?: string;
"ai:name"?: string; "ai:name"?: string;
"ai:model"?: string; "ai:model"?: string;
"ai:orgid"?: string;
"ai:apiversion"?: string;
"ai:maxtokens"?: number; "ai:maxtokens"?: number;
"ai:timeoutms"?: number; "ai:timeoutms"?: number;
"term:*"?: boolean; "term:*"?: boolean;

View File

@ -10,8 +10,11 @@ import (
"io" "io"
"log" "log"
"os" "os"
"regexp"
"strings"
"time" "time"
"github.com/sashabaranov/go-openai"
openaiapi "github.com/sashabaranov/go-openai" openaiapi "github.com/sashabaranov/go-openai"
"github.com/wavetermdev/waveterm/pkg/wavebase" "github.com/wavetermdev/waveterm/pkg/wavebase"
"github.com/wavetermdev/waveterm/pkg/wcloud" "github.com/wavetermdev/waveterm/pkg/wcloud"
@ -23,6 +26,7 @@ import (
const OpenAIPacketStr = "openai" const OpenAIPacketStr = "openai"
const OpenAICloudReqStr = "openai-cloudreq" const OpenAICloudReqStr = "openai-cloudreq"
const PacketEOFStr = "EOF" const PacketEOFStr = "EOF"
const DefaultAzureAPIVersion = "2023-05-15"
type OpenAICmdInfoPacketOutputType struct { type OpenAICmdInfoPacketOutputType struct {
Model string `json:"model,omitempty"` Model string `json:"model,omitempty"`
@ -52,16 +56,6 @@ type OpenAICloudReqPacketType struct {
MaxChoices int `json:"maxchoices,omitempty"` MaxChoices int `json:"maxchoices,omitempty"`
} }
// OpenAIOptsType holds the per-request AI client configuration carried in
// packets (model selection, credentials, endpoint, and generation limits).
type OpenAIOptsType struct {
Model string `json:"model"` // model name sent to the completion API
APIToken string `json:"apitoken"` // API key; empty means no user-configured auth
BaseURL string `json:"baseurl,omitempty"` // custom endpoint; empty means provider default
MaxTokens int `json:"maxtokens,omitempty"` // cap on generated tokens (0 = provider default)
MaxChoices int `json:"maxchoices,omitempty"` // number of completion choices requested
Timeout int `json:"timeout,omitempty"` // request timeout (units set by caller — presumably seconds; TODO confirm)
BlockId string `json:"blockid"` // id of the UI block this request belongs to
}
func MakeOpenAICloudReqPacket() *OpenAICloudReqPacketType { func MakeOpenAICloudReqPacket() *OpenAICloudReqPacketType {
return &OpenAICloudReqPacketType{ return &OpenAICloudReqPacketType{
Type: OpenAICloudReqStr, Type: OpenAICloudReqStr,
@ -69,26 +63,31 @@ func MakeOpenAICloudReqPacket() *OpenAICloudReqPacketType {
} }
func GetWSEndpoint() string { func GetWSEndpoint() string {
return PCloudWSEndpoint
if !wavebase.IsDevMode() { if !wavebase.IsDevMode() {
return PCloudWSEndpoint return WCloudWSEndpoint
} else { } else {
endpoint := os.Getenv(PCloudWSEndpointVarName) endpoint := os.Getenv(WCloudWSEndpointVarName)
if endpoint == "" { if endpoint == "" {
panic("Invalid PCloud ws dev endpoint, PCLOUD_WS_ENDPOINT not set or invalid") panic("Invalid WCloud websocket dev endpoint, WCLOUD_WS_ENDPOINT not set or invalid")
} }
return endpoint return endpoint
} }
} }
const DefaultMaxTokens = 1000 const DefaultMaxTokens = 2048
const DefaultModel = "gpt-4o-mini" const DefaultModel = "gpt-4o-mini"
const DefaultStreamChanSize = 10 const WCloudWSEndpoint = "wss://wsapi.waveterm.dev/"
const PCloudWSEndpoint = "wss://wsapi.waveterm.dev/" const WCloudWSEndpointVarName = "WCLOUD_WS_ENDPOINT"
const PCloudWSEndpointVarName = "PCLOUD_WS_ENDPOINT"
const CloudWebsocketConnectTimeout = 1 * time.Minute const CloudWebsocketConnectTimeout = 1 * time.Minute
// IsCloudAIRequest reports whether the request should be routed to the default
// Wave cloud endpoint. That is the case when opts is nil, or when the user has
// configured neither a base URL nor an API token.
func IsCloudAIRequest(opts *wshrpc.OpenAIOptsType) bool {
	if opts != nil && (opts.BaseURL != "" || opts.APIToken != "") {
		// A user-configured endpoint or credential is present: not a cloud request.
		return false
	}
	return true
}
func convertUsage(resp openaiapi.ChatCompletionResponse) *wshrpc.OpenAIUsageType { func convertUsage(resp openaiapi.ChatCompletionResponse) *wshrpc.OpenAIUsageType {
if resp.Usage.TotalTokens == 0 { if resp.Usage.TotalTokens == 0 {
return nil return nil
@ -113,6 +112,15 @@ func makeAIError(err error) wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
return wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: err} return wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: err}
} }
// RunAICommand dispatches an AI chat request to the appropriate backend: the
// user-configured OpenAI-compatible endpoint when one is set, otherwise the
// default Wave cloud endpoint. It returns the streaming response channel.
func RunAICommand(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
	if !IsCloudAIRequest(request.Opts) {
		log.Printf("sending ai chat message to user-configured endpoint %s\n", request.Opts.BaseURL)
		return RunLocalCompletionStream(ctx, request)
	}
	log.Print("sending ai chat message to default waveterm cloud endpoint\n")
	return RunCloudCompletionStream(ctx, request)
}
func RunCloudCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] { func RunCloudCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
rtn := make(chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]) rtn := make(chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType])
wsEndpoint := wcloud.GetWSEndpoint() wsEndpoint := wcloud.GetWSEndpoint()
@ -187,6 +195,36 @@ func RunCloudCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRe
return rtn return rtn
} }
// azureModelCharRe matches the characters that must be stripped from a model
// name to form an Azure deployment name. Compiled once at package scope so the
// mapper does not recompile the pattern on every call.
var azureModelCharRe = regexp.MustCompile(`[.:]`)

// defaultAzureMapperFn converts an OpenAI model name into an Azure deployment
// name by removing '.' and ':' (e.g. "gpt-3.5-turbo" -> "gpt-35-turbo").
// copied from go-openai/config.go
func defaultAzureMapperFn(model string) string {
	return azureModelCharRe.ReplaceAllString(model, "")
}
// setApiType validates opts.APIType (matched case-insensitively) and applies
// the corresponding go-openai client configuration. An empty value defaults to
// the plain OpenAI API. All Azure-family API types additionally receive a
// default API version and the Azure model-name mapper. An unrecognized value
// is rejected with an error.
func setApiType(opts *wshrpc.OpenAIOptsType, clientConfig *openai.ClientConfig) error {
	// configureAzure applies the settings shared by every Azure-style API type.
	configureAzure := func(apiType openai.APIType) {
		clientConfig.APIType = apiType
		clientConfig.APIVersion = DefaultAzureAPIVersion
		clientConfig.AzureModelMapperFunc = defaultAzureMapperFn
	}
	switch strings.ToLower(opts.APIType) {
	case "", strings.ToLower(string(openai.APITypeOpenAI)):
		clientConfig.APIType = openai.APITypeOpenAI
	case strings.ToLower(string(openai.APITypeAzure)):
		configureAzure(openai.APITypeAzure)
	case strings.ToLower(string(openai.APITypeAzureAD)):
		configureAzure(openai.APITypeAzureAD)
	case strings.ToLower(string(openai.APITypeCloudflareAzure)):
		configureAzure(openai.APITypeCloudflareAzure)
	default:
		return fmt.Errorf("invalid api type %q", opts.APIType)
	}
	return nil
}
func RunLocalCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] { func RunLocalCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
rtn := make(chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]) rtn := make(chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType])
go func() { go func() {
@ -207,6 +245,17 @@ func RunLocalCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRe
if request.Opts.BaseURL != "" { if request.Opts.BaseURL != "" {
clientConfig.BaseURL = request.Opts.BaseURL clientConfig.BaseURL = request.Opts.BaseURL
} }
err := setApiType(request.Opts, &clientConfig)
if err != nil {
rtn <- wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType]{Error: err}
return
}
if request.Opts.OrgID != "" {
clientConfig.OrgID = request.Opts.OrgID
}
if request.Opts.APIVersion != "" {
clientConfig.APIVersion = request.Opts.APIVersion
}
client := openaiapi.NewClientWithConfig(clientConfig) client := openaiapi.NewClientWithConfig(clientConfig)
req := openaiapi.ChatCompletionRequest{ req := openaiapi.ChatCompletionRequest{
Model: request.Opts.Model, Model: request.Opts.Model,
@ -251,33 +300,3 @@ func RunLocalCompletionStream(ctx context.Context, request wshrpc.OpenAiStreamRe
}() }()
return rtn return rtn
} }
// marshalResponse converts a non-streaming chat completion response into the
// packet sequence used by the wsh RPC layer: one header packet carrying the
// model, creation time, and token usage, followed by one packet per choice.
func marshalResponse(resp openaiapi.ChatCompletionResponse) []*wshrpc.OpenAIPacketType {
	packets := make([]*wshrpc.OpenAIPacketType, 0, len(resp.Choices)+1)
	header := MakeOpenAIPacket()
	header.Model = resp.Model
	header.Created = resp.Created
	header.Usage = convertUsage(resp)
	packets = append(packets, header)
	for idx := range resp.Choices {
		choice := &resp.Choices[idx]
		pk := MakeOpenAIPacket()
		pk.Index = choice.Index
		pk.Text = choice.Message.Content
		pk.FinishReason = string(choice.FinishReason)
		packets = append(packets, pk)
	}
	return packets
}
// CreateErrorPacket builds an OpenAI packet carrying the given error message,
// with the finish reason set to "error" to terminate the stream.
func CreateErrorPacket(errStr string) *wshrpc.OpenAIPacketType {
	pk := MakeOpenAIPacket()
	pk.FinishReason = "error"
	pk.Error = errStr
	return pk
}
// CreateTextPacket builds an OpenAI packet containing a single chunk of
// response text.
func CreateTextPacket(text string) *wshrpc.OpenAIPacketType {
	packet := MakeOpenAIPacket()
	packet.Text = text
	return packet
}

View File

@ -1,7 +1,7 @@
{ {
"ai:model": "gpt-4o-mini", "ai:model": "gpt-4o-mini",
"ai:maxtokens": 1000, "ai:maxtokens": 2048,
"ai:timeoutms": 10000, "ai:timeoutms": 60000,
"autoupdate:enabled": true, "autoupdate:enabled": true,
"autoupdate:installonquit": true, "autoupdate:installonquit": true,
"autoupdate:intervalms": 3600000, "autoupdate:intervalms": 3600000,

View File

@ -7,10 +7,13 @@ package wconfig
const ( const (
ConfigKey_AiClear = "ai:*" ConfigKey_AiClear = "ai:*"
ConfigKey_AiApiType = "ai:apitype"
ConfigKey_AiBaseURL = "ai:baseurl" ConfigKey_AiBaseURL = "ai:baseurl"
ConfigKey_AiApiToken = "ai:apitoken" ConfigKey_AiApiToken = "ai:apitoken"
ConfigKey_AiName = "ai:name" ConfigKey_AiName = "ai:name"
ConfigKey_AiModel = "ai:model" ConfigKey_AiModel = "ai:model"
ConfigKey_AiOrgID = "ai:orgid"
ConfigKey_AIApiVersion = "ai:apiversion"
ConfigKey_AiMaxTokens = "ai:maxtokens" ConfigKey_AiMaxTokens = "ai:maxtokens"
ConfigKey_AiTimeoutMs = "ai:timeoutms" ConfigKey_AiTimeoutMs = "ai:timeoutms"

View File

@ -41,10 +41,13 @@ func (m MetaSettingsType) MarshalJSON() ([]byte, error) {
type SettingsType struct { type SettingsType struct {
AiClear bool `json:"ai:*,omitempty"` AiClear bool `json:"ai:*,omitempty"`
AiApiType string `json:"ai:apitype,omitempty"`
AiBaseURL string `json:"ai:baseurl,omitempty"` AiBaseURL string `json:"ai:baseurl,omitempty"`
AiApiToken string `json:"ai:apitoken,omitempty"` AiApiToken string `json:"ai:apitoken,omitempty"`
AiName string `json:"ai:name,omitempty"` AiName string `json:"ai:name,omitempty"`
AiModel string `json:"ai:model,omitempty"` AiModel string `json:"ai:model,omitempty"`
AiOrgID string `json:"ai:orgid,omitempty"`
AIApiVersion string `json:"ai:apiversion,omitempty"`
AiMaxTokens float64 `json:"ai:maxtokens,omitempty"` AiMaxTokens float64 `json:"ai:maxtokens,omitempty"`
AiTimeoutMs float64 `json:"ai:timeoutms,omitempty"` AiTimeoutMs float64 `json:"ai:timeoutms,omitempty"`

View File

@ -275,11 +275,14 @@ type OpenAIPromptMessageType struct {
type OpenAIOptsType struct { type OpenAIOptsType struct {
Model string `json:"model"` Model string `json:"model"`
APIType string `json:"apitype,omitempty"`
APIToken string `json:"apitoken"` APIToken string `json:"apitoken"`
OrgID string `json:"orgid,omitempty"`
APIVersion string `json:"apiversion,omitempty"`
BaseURL string `json:"baseurl,omitempty"` BaseURL string `json:"baseurl,omitempty"`
MaxTokens int `json:"maxtokens,omitempty"` MaxTokens int `json:"maxtokens,omitempty"`
MaxChoices int `json:"maxchoices,omitempty"` MaxChoices int `json:"maxchoices,omitempty"`
Timeout int `json:"timeout,omitempty"` TimeoutMs int `json:"timeoutms,omitempty"`
} }
type OpenAIPacketType struct { type OpenAIPacketType struct {

View File

@ -74,12 +74,7 @@ func (ws *WshServer) StreamTestCommand(ctx context.Context) chan wshrpc.RespOrEr
} }
func (ws *WshServer) StreamWaveAiCommand(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] { func (ws *WshServer) StreamWaveAiCommand(ctx context.Context, request wshrpc.OpenAiStreamRequest) chan wshrpc.RespOrErrorUnion[wshrpc.OpenAIPacketType] {
if request.Opts.BaseURL == "" && request.Opts.APIToken == "" { return waveai.RunAICommand(ctx, request)
log.Print("sending ai chat message to waveterm default endpoint with openai\n")
return waveai.RunCloudCompletionStream(ctx, request)
}
log.Printf("sending ai chat message to user-configured endpoint %s\n", request.Opts.BaseURL)
return waveai.RunLocalCompletionStream(ctx, request)
} }
func MakePlotData(ctx context.Context, blockId string) error { func MakePlotData(ctx context.Context, blockId string) error {