Compare commits

...

6 Commits

Author SHA1 Message Date
aeeb7bb7f7 tui: Add --system-prompt handling
And some state handling changes
2024-05-07 08:19:45 +00:00
2b38db7db7 Update command flag handling
`lmcli chat` now supports common prompt flags (model, length, system
prompt, etc)
2024-05-07 08:18:48 +00:00
8e4ff90ab4 Multiple provider configuration
Add support for having multiple openai or anthropic compatible providers
accessible via different baseUrls
2024-05-05 08:15:17 +00:00
bdaf6204f6 Add openai response error handling 2024-05-05 07:32:35 +00:00
1b9a8f319c Split anthropic types out to types.go 2024-04-29 06:16:41 +00:00
ffe9d299ef Remove go-openai 2024-04-29 06:14:36 +00:00
21 changed files with 353 additions and 217 deletions

1
go.mod
View File

@ -9,7 +9,6 @@ require (
github.com/charmbracelet/lipgloss v0.10.0 github.com/charmbracelet/lipgloss v0.10.0
github.com/go-yaml/yaml v2.1.0+incompatible github.com/go-yaml/yaml v2.1.0+incompatible
github.com/muesli/reflow v0.3.0 github.com/muesli/reflow v0.3.0
github.com/sashabaranov/go-openai v1.17.7
github.com/spf13/cobra v1.8.0 github.com/spf13/cobra v1.8.0
github.com/sqids/sqids-go v0.4.1 github.com/sqids/sqids-go v0.4.1
gopkg.in/yaml.v2 v2.2.2 gopkg.in/yaml.v2 v2.2.2

2
go.sum
View File

@ -61,8 +61,6 @@ github.com/rivo/uniseg v0.4.7/go.mod h1:FN3SvrM+Zdj16jyLfmOkMNblXMcoc8DfTHruCPUc
github.com/rogpeppe/go-internal v1.9.0 h1:73kH8U+JUqXU8lRuOHeVHaa/SZPifC7BkcraZVejAe8= github.com/rogpeppe/go-internal v1.9.0 h1:73kH8U+JUqXU8lRuOHeVHaa/SZPifC7BkcraZVejAe8=
github.com/rogpeppe/go-internal v1.9.0/go.mod h1:WtVeX8xhTBvf0smdhujwtBcq4Qrzq/fJaraNFVN+nFs= github.com/rogpeppe/go-internal v1.9.0/go.mod h1:WtVeX8xhTBvf0smdhujwtBcq4Qrzq/fJaraNFVN+nFs=
github.com/russross/blackfriday/v2 v2.1.0/go.mod h1:+Rmxgy9KzJVeS9/2gXHxylqXiyQDYRxCVz55jmeOWTM= github.com/russross/blackfriday/v2 v2.1.0/go.mod h1:+Rmxgy9KzJVeS9/2gXHxylqXiyQDYRxCVz55jmeOWTM=
github.com/sashabaranov/go-openai v1.17.7 h1:MPcAwlwbeo7ZmhQczoOgZBHtIBY1TfZqsdx6+/ndloM=
github.com/sashabaranov/go-openai v1.17.7/go.mod h1:lj5b/K+zjTSFxVLijLSTDZuP7adOgerWeFyZLUhAKRg=
github.com/spf13/cobra v1.8.0 h1:7aJaZx1B85qltLMc546zn58BxxfZdR/W22ej9CFoEf0= github.com/spf13/cobra v1.8.0 h1:7aJaZx1B85qltLMc546zn58BxxfZdR/W22ej9CFoEf0=
github.com/spf13/cobra v1.8.0/go.mod h1:WXLWApfZ71AjXPya3WOlMsY9yMs7YeiHhFVlvLyhcho= github.com/spf13/cobra v1.8.0/go.mod h1:WXLWApfZ71AjXPya3WOlMsY9yMs7YeiHhFVlvLyhcho=
github.com/spf13/pflag v1.0.5 h1:iy+VFUOCP1a+8yFto/drg2CJ5u0yRoB7fZw3DKv/JXA= github.com/spf13/pflag v1.0.5 h1:iy+VFUOCP1a+8yFto/drg2CJ5u0yRoB7fZw3DKv/JXA=

View File

@ -33,5 +33,6 @@ func ChatCmd(ctx *lmcli.Context) *cobra.Command {
return ctx.Store.ConversationShortNameCompletions(toComplete), compMode return ctx.Store.ConversationShortNameCompletions(toComplete), compMode
}, },
} }
applyPromptFlags(ctx, cmd)
return cmd return cmd
} }

View File

@ -8,10 +8,6 @@ import (
"github.com/spf13/cobra" "github.com/spf13/cobra"
) )
var (
systemPromptFile string
)
func RootCmd(ctx *lmcli.Context) *cobra.Command { func RootCmd(ctx *lmcli.Context) *cobra.Command {
var root = &cobra.Command{ var root = &cobra.Command{
Use: "lmcli <command> [flags]", Use: "lmcli <command> [flags]",
@ -23,58 +19,43 @@ func RootCmd(ctx *lmcli.Context) *cobra.Command {
}, },
} }
chatCmd := ChatCmd(ctx)
continueCmd := ContinueCmd(ctx)
cloneCmd := CloneCmd(ctx)
editCmd := EditCmd(ctx)
listCmd := ListCmd(ctx)
newCmd := NewCmd(ctx)
promptCmd := PromptCmd(ctx)
renameCmd := RenameCmd(ctx)
replyCmd := ReplyCmd(ctx)
retryCmd := RetryCmd(ctx)
rmCmd := RemoveCmd(ctx)
viewCmd := ViewCmd(ctx)
inputCmds := []*cobra.Command{newCmd, promptCmd, replyCmd, retryCmd, continueCmd, editCmd}
for _, cmd := range inputCmds {
cmd.Flags().StringVar(ctx.Config.Defaults.Model, "model", *ctx.Config.Defaults.Model, "Which model to use")
cmd.RegisterFlagCompletionFunc("model", func(*cobra.Command, []string, string) ([]string, cobra.ShellCompDirective) {
return ctx.GetModels(), cobra.ShellCompDirectiveDefault
})
cmd.Flags().IntVar(ctx.Config.Defaults.MaxTokens, "length", *ctx.Config.Defaults.MaxTokens, "Maximum response tokens")
cmd.Flags().StringVar(ctx.Config.Defaults.SystemPrompt, "system-prompt", *ctx.Config.Defaults.SystemPrompt, "System prompt")
cmd.Flags().StringVar(&systemPromptFile, "system-prompt-file", "", "A path to a file containing the system prompt")
cmd.MarkFlagsMutuallyExclusive("system-prompt", "system-prompt-file")
}
root.AddCommand( root.AddCommand(
chatCmd, ChatCmd(ctx),
cloneCmd, ContinueCmd(ctx),
continueCmd, CloneCmd(ctx),
editCmd, EditCmd(ctx),
listCmd, ListCmd(ctx),
newCmd, NewCmd(ctx),
promptCmd, PromptCmd(ctx),
renameCmd, RenameCmd(ctx),
replyCmd, ReplyCmd(ctx),
retryCmd, RetryCmd(ctx),
rmCmd, RemoveCmd(ctx),
viewCmd, ViewCmd(ctx),
) )
return root return root
} }
func getSystemPrompt(ctx *lmcli.Context) string { func applyPromptFlags(ctx *lmcli.Context, cmd *cobra.Command) {
if systemPromptFile != "" { f := cmd.Flags()
content, err := util.ReadFileContents(systemPromptFile)
if err != nil { f.StringVarP(
lmcli.Fatal("Could not read file contents at %s: %v\n", systemPromptFile, err) ctx.Config.Defaults.Model,
} "model", "m",
return content *ctx.Config.Defaults.Model,
} "The model to generate a response with",
return *ctx.Config.Defaults.SystemPrompt )
cmd.RegisterFlagCompletionFunc("model", func(*cobra.Command, []string, string) ([]string, cobra.ShellCompDirective) {
return ctx.GetModels(), cobra.ShellCompDirectiveDefault
})
f.IntVar(ctx.Config.Defaults.MaxTokens, "max-length", *ctx.Config.Defaults.MaxTokens, "Maximum response tokens")
f.Float32VarP(ctx.Config.Defaults.Temperature, "temperature", "t", *ctx.Config.Defaults.Temperature, "Sampling temperature")
f.StringVar(ctx.Config.Defaults.SystemPrompt, "system-prompt", *ctx.Config.Defaults.SystemPrompt, "System prompt")
f.StringVar(&ctx.SystemPromptFile, "system-prompt-file", "", "A path to a file containing the system prompt")
cmd.MarkFlagsMutuallyExclusive("system-prompt", "system-prompt-file")
} }
// inputFromArgsOrEditor returns either the provided input from the args slice // inputFromArgsOrEditor returns either the provided input from the args slice

View File

@ -44,7 +44,7 @@ func ContinueCmd(ctx *lmcli.Context) *cobra.Command {
fmt.Print(lastMessage.Content) fmt.Print(lastMessage.Content)
// Submit the LLM request, allowing it to continue the last message // Submit the LLM request, allowing it to continue the last message
continuedOutput, err := cmdutil.FetchAndShowCompletion(ctx, messages, nil) continuedOutput, err := cmdutil.Prompt(ctx, messages, nil)
if err != nil { if err != nil {
return fmt.Errorf("error fetching LLM response: %v", err) return fmt.Errorf("error fetching LLM response: %v", err)
} }
@ -68,5 +68,6 @@ func ContinueCmd(ctx *lmcli.Context) *cobra.Command {
return ctx.Store.ConversationShortNameCompletions(toComplete), compMode return ctx.Store.ConversationShortNameCompletions(toComplete), compMode
}, },
} }
applyPromptFlags(ctx, cmd)
return cmd return cmd
} }

View File

@ -30,7 +30,7 @@ func NewCmd(ctx *lmcli.Context) *cobra.Command {
{ {
ConversationID: conversation.ID, ConversationID: conversation.ID,
Role: model.MessageRoleSystem, Role: model.MessageRoleSystem,
Content: getSystemPrompt(ctx), Content: ctx.GetSystemPrompt(),
}, },
{ {
ConversationID: conversation.ID, ConversationID: conversation.ID,
@ -56,5 +56,6 @@ func NewCmd(ctx *lmcli.Context) *cobra.Command {
}, },
} }
applyPromptFlags(ctx, cmd)
return cmd return cmd
} }

View File

@ -23,7 +23,7 @@ func PromptCmd(ctx *lmcli.Context) *cobra.Command {
messages := []model.Message{ messages := []model.Message{
{ {
Role: model.MessageRoleSystem, Role: model.MessageRoleSystem,
Content: getSystemPrompt(ctx), Content: ctx.GetSystemPrompt(),
}, },
{ {
Role: model.MessageRoleUser, Role: model.MessageRoleUser,
@ -31,12 +31,14 @@ func PromptCmd(ctx *lmcli.Context) *cobra.Command {
}, },
} }
_, err := cmdutil.FetchAndShowCompletion(ctx, messages, nil) _, err := cmdutil.Prompt(ctx, messages, nil)
if err != nil { if err != nil {
return fmt.Errorf("Error fetching LLM response: %v", err) return fmt.Errorf("Error fetching LLM response: %v", err)
} }
return nil return nil
}, },
} }
applyPromptFlags(ctx, cmd)
return cmd return cmd
} }

View File

@ -45,5 +45,7 @@ func ReplyCmd(ctx *lmcli.Context) *cobra.Command {
return ctx.Store.ConversationShortNameCompletions(toComplete), compMode return ctx.Store.ConversationShortNameCompletions(toComplete), compMode
}, },
} }
applyPromptFlags(ctx, cmd)
return cmd return cmd
} }

View File

@ -54,5 +54,7 @@ func RetryCmd(ctx *lmcli.Context) *cobra.Command {
return ctx.Store.ConversationShortNameCompletions(toComplete), compMode return ctx.Store.ConversationShortNameCompletions(toComplete), compMode
}, },
} }
applyPromptFlags(ctx, cmd)
return cmd return cmd
} }

View File

@ -13,9 +13,9 @@ import (
"github.com/charmbracelet/lipgloss" "github.com/charmbracelet/lipgloss"
) )
// fetchAndShowCompletion prompts the LLM with the given messages and streams // Prompt prompts the configured model and streams the response
// the response to stdout. Returns all model reply messages. // to stdout. Returns all model reply messages.
func FetchAndShowCompletion(ctx *lmcli.Context, messages []model.Message, callback func(model.Message)) (string, error) { func Prompt(ctx *lmcli.Context, messages []model.Message, callback func(model.Message)) (string, error) {
content := make(chan string) // receives the response from LLM content := make(chan string) // receives the response from LLM
defer close(content) defer close(content)
@ -46,7 +46,7 @@ func FetchAndShowCompletion(ctx *lmcli.Context, messages []model.Message, callba
err = nil err = nil
} }
} }
return response, nil return response, err
} }
// lookupConversation either returns the conversation found by the // lookupConversation either returns the conversation found by the
@ -109,7 +109,7 @@ func HandleConversationReply(ctx *lmcli.Context, c *model.Conversation, persist
} }
} }
_, err = FetchAndShowCompletion(ctx, allMessages, replyCallback) _, err = Prompt(ctx, allMessages, replyCallback)
if err != nil { if err != nil {
lmcli.Fatal("Error fetching LLM response: %v\n", err) lmcli.Fatal("Error fetching LLM response: %v\n", err)
} }

View File

@ -19,16 +19,14 @@ type Config struct {
TitleGenerationModel *string `yaml:"titleGenerationModel" default:"gpt-3.5-turbo"` TitleGenerationModel *string `yaml:"titleGenerationModel" default:"gpt-3.5-turbo"`
} `yaml:"conversations"` } `yaml:"conversations"`
Tools *struct { Tools *struct {
EnabledTools *[]string `yaml:"enabledTools"` EnabledTools []string `yaml:"enabledTools"`
} `yaml:"tools"` } `yaml:"tools"`
OpenAI *struct { Providers []*struct {
APIKey *string `yaml:"apiKey" default:"your_key_here"` Kind *string `yaml:"kind"`
BaseURL *string `yaml:"baseUrl"`
APIKey *string `yaml:"apiKey"`
Models *[]string `yaml:"models"` Models *[]string `yaml:"models"`
} `yaml:"openai"` } `yaml:"providers"`
Anthropic *struct {
APIKey *string `yaml:"apiKey" default:"your_key_here"`
Models *[]string `yaml:"models"`
} `yaml:"anthropic"`
Chroma *struct { Chroma *struct {
Style *string `yaml:"style" default:"onedark"` Style *string `yaml:"style" default:"onedark"`
Formatter *string `yaml:"formatter" default:"terminal16m"` Formatter *string `yaml:"formatter" default:"terminal16m"`

View File

@ -10,17 +10,20 @@ import (
"git.mlow.ca/mlow/lmcli/pkg/lmcli/provider/anthropic" "git.mlow.ca/mlow/lmcli/pkg/lmcli/provider/anthropic"
"git.mlow.ca/mlow/lmcli/pkg/lmcli/provider/openai" "git.mlow.ca/mlow/lmcli/pkg/lmcli/provider/openai"
"git.mlow.ca/mlow/lmcli/pkg/lmcli/tools" "git.mlow.ca/mlow/lmcli/pkg/lmcli/tools"
"git.mlow.ca/mlow/lmcli/pkg/util"
"git.mlow.ca/mlow/lmcli/pkg/util/tty" "git.mlow.ca/mlow/lmcli/pkg/util/tty"
"gorm.io/driver/sqlite" "gorm.io/driver/sqlite"
"gorm.io/gorm" "gorm.io/gorm"
) )
type Context struct { type Context struct {
Config *Config Config *Config // may be updated at runtime
Store ConversationStore Store ConversationStore
Chroma *tty.ChromaHighlighter Chroma *tty.ChromaHighlighter
EnabledTools []model.Tool EnabledTools []model.Tool
SystemPromptFile string
} }
func NewContext() (*Context, error) { func NewContext() (*Context, error) {
@ -43,46 +46,70 @@ func NewContext() (*Context, error) {
chroma := tty.NewChromaHighlighter("markdown", *config.Chroma.Formatter, *config.Chroma.Style) chroma := tty.NewChromaHighlighter("markdown", *config.Chroma.Formatter, *config.Chroma.Style)
var enabledTools []model.Tool var enabledTools []model.Tool
for _, toolName := range *config.Tools.EnabledTools { for _, toolName := range config.Tools.EnabledTools {
tool, ok := tools.AvailableTools[toolName] tool, ok := tools.AvailableTools[toolName]
if ok { if ok {
enabledTools = append(enabledTools, tool) enabledTools = append(enabledTools, tool)
} }
} }
return &Context{config, store, chroma, enabledTools}, nil return &Context{config, store, chroma, enabledTools, ""}, nil
} }
func (c *Context) GetModels() (models []string) { func (c *Context) GetModels() (models []string) {
for _, m := range *c.Config.Anthropic.Models { for _, p := range c.Config.Providers {
for _, m := range *p.Models {
models = append(models, m) models = append(models, m)
} }
for _, m := range *c.Config.OpenAI.Models {
models = append(models, m)
} }
return return
} }
func (c *Context) GetCompletionProvider(model string) (provider.ChatCompletionClient, error) { func (c *Context) GetCompletionProvider(model string) (provider.ChatCompletionClient, error) {
for _, m := range *c.Config.Anthropic.Models { for _, p := range c.Config.Providers {
for _, m := range *p.Models {
if m == model { if m == model {
switch *p.Kind {
case "anthropic":
url := "https://api.anthropic.com/v1"
if p.BaseURL != nil {
url = *p.BaseURL
}
anthropic := &anthropic.AnthropicClient{ anthropic := &anthropic.AnthropicClient{
APIKey: *c.Config.Anthropic.APIKey, BaseURL: url,
APIKey: *p.APIKey,
} }
return anthropic, nil return anthropic, nil
case "openai":
url := "https://api.openai.com/v1"
if p.BaseURL != nil {
url = *p.BaseURL
} }
}
for _, m := range *c.Config.OpenAI.Models {
if m == model {
openai := &openai.OpenAIClient{ openai := &openai.OpenAIClient{
APIKey: *c.Config.OpenAI.APIKey, BaseURL: url,
APIKey: *p.APIKey,
} }
return openai, nil return openai, nil
default:
return nil, fmt.Errorf("unknown provider kind: %s", *p.Kind)
}
}
} }
} }
return nil, fmt.Errorf("unknown model: %s", model) return nil, fmt.Errorf("unknown model: %s", model)
} }
func (c *Context) GetSystemPrompt() string {
if c.SystemPromptFile != "" {
content, err := util.ReadFileContents(c.SystemPromptFile)
if err != nil {
Fatal("Could not read file contents at %s: %v\n", c.SystemPromptFile, err)
}
return content
}
return *c.Config.Defaults.SystemPrompt
}
func configDir() string { func configDir() string {
var configDir string var configDir string

View File

@ -33,11 +33,11 @@ type Conversation struct {
type RequestParameters struct { type RequestParameters struct {
Model string Model string
MaxTokens int MaxTokens int
Temperature float32 Temperature float32
TopP float32 TopP float32
SystemPrompt string
ToolBag []Tool ToolBag []Tool
} }

View File

@ -15,48 +15,10 @@ import (
"git.mlow.ca/mlow/lmcli/pkg/lmcli/tools" "git.mlow.ca/mlow/lmcli/pkg/lmcli/tools"
) )
type AnthropicClient struct {
APIKey string
}
type Message struct {
Role string `json:"role"`
Content string `json:"content"`
}
type Request struct {
Model string `json:"model"`
Messages []Message `json:"messages"`
System string `json:"system,omitempty"`
MaxTokens int `json:"max_tokens,omitempty"`
StopSequences []string `json:"stop_sequences,omitempty"`
Stream bool `json:"stream,omitempty"`
Temperature float32 `json:"temperature,omitempty"`
//TopP float32 `json:"top_p,omitempty"`
//TopK float32 `json:"top_k,omitempty"`
}
type OriginalContent struct {
Type string `json:"type"`
Text string `json:"text"`
}
type Response struct {
Id string `json:"id"`
Type string `json:"type"`
Role string `json:"role"`
Content []OriginalContent `json:"content"`
StopReason string `json:"stop_reason"`
StopSequence string `json:"stop_sequence"`
}
const FUNCTION_STOP_SEQUENCE = "</function_calls>"
func buildRequest(params model.RequestParameters, messages []model.Message) Request { func buildRequest(params model.RequestParameters, messages []model.Message) Request {
requestBody := Request{ requestBody := Request{
Model: params.Model, Model: params.Model,
Messages: make([]Message, len(messages)), Messages: make([]Message, len(messages)),
System: params.SystemPrompt,
MaxTokens: params.MaxTokens, MaxTokens: params.MaxTokens,
Temperature: params.Temperature, Temperature: params.Temperature,
Stream: false, Stream: false,
@ -118,14 +80,12 @@ func buildRequest(params model.RequestParameters, messages []model.Message) Requ
} }
func sendRequest(ctx context.Context, c *AnthropicClient, r Request) (*http.Response, error) { func sendRequest(ctx context.Context, c *AnthropicClient, r Request) (*http.Response, error) {
url := "https://api.anthropic.com/v1/messages"
jsonBody, err := json.Marshal(r) jsonBody, err := json.Marshal(r)
if err != nil { if err != nil {
return nil, fmt.Errorf("failed to marshal request body: %v", err) return nil, fmt.Errorf("failed to marshal request body: %v", err)
} }
req, err := http.NewRequestWithContext(ctx, "POST", url, bytes.NewBuffer(jsonBody)) req, err := http.NewRequestWithContext(ctx, "POST", c.BaseURL+"/messages", bytes.NewBuffer(jsonBody))
if err != nil { if err != nil {
return nil, fmt.Errorf("failed to create HTTP request: %v", err) return nil, fmt.Errorf("failed to create HTTP request: %v", err)
} }

View File

@ -9,6 +9,8 @@ import (
"git.mlow.ca/mlow/lmcli/pkg/lmcli/model" "git.mlow.ca/mlow/lmcli/pkg/lmcli/model"
) )
const FUNCTION_STOP_SEQUENCE = "</function_calls>"
const TOOL_PREAMBLE = `You have access to the following tools when replying. const TOOL_PREAMBLE = `You have access to the following tools when replying.
You may call them like this: You may call them like this:

View File

@ -0,0 +1,38 @@
package anthropic
type AnthropicClient struct {
BaseURL string
APIKey string
}
type Message struct {
Role string `json:"role"`
Content string `json:"content"`
}
type Request struct {
Model string `json:"model"`
Messages []Message `json:"messages"`
System string `json:"system,omitempty"`
MaxTokens int `json:"max_tokens,omitempty"`
StopSequences []string `json:"stop_sequences,omitempty"`
Stream bool `json:"stream,omitempty"`
Temperature float32 `json:"temperature,omitempty"`
//TopP float32 `json:"top_p,omitempty"`
//TopK float32 `json:"top_k,omitempty"`
}
type OriginalContent struct {
Type string `json:"type"`
Text string `json:"text"`
}
type Response struct {
Id string `json:"id"`
Type string `json:"type"`
Role string `json:"role"`
Content []OriginalContent `json:"content"`
StopReason string `json:"stop_reason"`
StopSequence string `json:"stop_sequence"`
}

View File

@ -1,45 +1,30 @@
package openai package openai
import ( import (
"bufio"
"bytes"
"context" "context"
"encoding/json" "encoding/json"
"errors"
"fmt" "fmt"
"io" "io"
"net/http"
"strings" "strings"
"git.mlow.ca/mlow/lmcli/pkg/lmcli/model" "git.mlow.ca/mlow/lmcli/pkg/lmcli/model"
"git.mlow.ca/mlow/lmcli/pkg/lmcli/provider" "git.mlow.ca/mlow/lmcli/pkg/lmcli/provider"
"git.mlow.ca/mlow/lmcli/pkg/lmcli/tools" "git.mlow.ca/mlow/lmcli/pkg/lmcli/tools"
openai "github.com/sashabaranov/go-openai"
) )
type OpenAIClient struct { func convertTools(tools []model.Tool) []Tool {
APIKey string openaiTools := make([]Tool, len(tools))
}
type OpenAIToolParameters struct {
Type string `json:"type"`
Properties map[string]OpenAIToolParameter `json:"properties,omitempty"`
Required []string `json:"required,omitempty"`
}
type OpenAIToolParameter struct {
Type string `json:"type"`
Description string `json:"description"`
Enum []string `json:"enum,omitempty"`
}
func convertTools(tools []model.Tool) []openai.Tool {
openaiTools := make([]openai.Tool, len(tools))
for i, tool := range tools { for i, tool := range tools {
openaiTools[i].Type = "function" openaiTools[i].Type = "function"
params := make(map[string]OpenAIToolParameter) params := make(map[string]ToolParameter)
var required []string var required []string
for _, param := range tool.Parameters { for _, param := range tool.Parameters {
params[param.Name] = OpenAIToolParameter{ params[param.Name] = ToolParameter{
Type: param.Type, Type: param.Type,
Description: param.Description, Description: param.Description,
Enum: param.Enum, Enum: param.Enum,
@ -49,10 +34,10 @@ func convertTools(tools []model.Tool) []openai.Tool {
} }
} }
openaiTools[i].Function = openai.FunctionDefinition{ openaiTools[i].Function = FunctionDefinition{
Name: tool.Name, Name: tool.Name,
Description: tool.Description, Description: tool.Description,
Parameters: OpenAIToolParameters{ Parameters: ToolParameters{
Type: "object", Type: "object",
Properties: params, Properties: params,
Required: required, Required: required,
@ -62,8 +47,8 @@ func convertTools(tools []model.Tool) []openai.Tool {
return openaiTools return openaiTools
} }
func convertToolCallToOpenAI(toolCalls []model.ToolCall) []openai.ToolCall { func convertToolCallToOpenAI(toolCalls []model.ToolCall) []ToolCall {
converted := make([]openai.ToolCall, len(toolCalls)) converted := make([]ToolCall, len(toolCalls))
for i, call := range toolCalls { for i, call := range toolCalls {
converted[i].Type = "function" converted[i].Type = "function"
converted[i].ID = call.ID converted[i].ID = call.ID
@ -75,7 +60,7 @@ func convertToolCallToOpenAI(toolCalls []model.ToolCall) []openai.ToolCall {
return converted return converted
} }
func convertToolCallToAPI(toolCalls []openai.ToolCall) []model.ToolCall { func convertToolCallToAPI(toolCalls []ToolCall) []model.ToolCall {
converted := make([]model.ToolCall, len(toolCalls)) converted := make([]model.ToolCall, len(toolCalls))
for i, call := range toolCalls { for i, call := range toolCalls {
converted[i].ID = call.ID converted[i].ID = call.ID
@ -86,16 +71,15 @@ func convertToolCallToAPI(toolCalls []openai.ToolCall) []model.ToolCall {
} }
func createChatCompletionRequest( func createChatCompletionRequest(
c *OpenAIClient,
params model.RequestParameters, params model.RequestParameters,
messages []model.Message, messages []model.Message,
) openai.ChatCompletionRequest { ) ChatCompletionRequest {
requestMessages := make([]openai.ChatCompletionMessage, 0, len(messages)) requestMessages := make([]ChatCompletionMessage, 0, len(messages))
for _, m := range messages { for _, m := range messages {
switch m.Role { switch m.Role {
case "tool_call": case "tool_call":
message := openai.ChatCompletionMessage{} message := ChatCompletionMessage{}
message.Role = "assistant" message.Role = "assistant"
message.Content = m.Content message.Content = m.Content
message.ToolCalls = convertToolCallToOpenAI(m.ToolCalls) message.ToolCalls = convertToolCallToOpenAI(m.ToolCalls)
@ -103,21 +87,21 @@ func createChatCompletionRequest(
case "tool_result": case "tool_result":
// expand tool_result messages' results into multiple openAI messages // expand tool_result messages' results into multiple openAI messages
for _, result := range m.ToolResults { for _, result := range m.ToolResults {
message := openai.ChatCompletionMessage{} message := ChatCompletionMessage{}
message.Role = "tool" message.Role = "tool"
message.Content = result.Result message.Content = result.Result
message.ToolCallID = result.ToolCallID message.ToolCallID = result.ToolCallID
requestMessages = append(requestMessages, message) requestMessages = append(requestMessages, message)
} }
default: default:
message := openai.ChatCompletionMessage{} message := ChatCompletionMessage{}
message.Role = string(m.Role) message.Role = string(m.Role)
message.Content = m.Content message.Content = m.Content
requestMessages = append(requestMessages, message) requestMessages = append(requestMessages, message)
} }
} }
request := openai.ChatCompletionRequest{ request := ChatCompletionRequest{
Model: params.Model, Model: params.Model,
MaxTokens: params.MaxTokens, MaxTokens: params.MaxTokens,
Temperature: params.Temperature, Temperature: params.Temperature,
@ -136,7 +120,7 @@ func createChatCompletionRequest(
func handleToolCalls( func handleToolCalls(
params model.RequestParameters, params model.RequestParameters,
content string, content string,
toolCalls []openai.ToolCall, toolCalls []ToolCall,
callback provider.ReplyCallback, callback provider.ReplyCallback,
messages []model.Message, messages []model.Message,
) ([]model.Message, error) { ) ([]model.Message, error) {
@ -177,6 +161,21 @@ func handleToolCalls(
return messages, nil return messages, nil
} }
func (c *OpenAIClient) sendRequest(ctx context.Context, req *http.Request) (*http.Response, error) {
req.Header.Set("Content-Type", "application/json")
req.Header.Set("Authorization", "Bearer "+c.APIKey)
client := &http.Client{}
resp, err := client.Do(req.WithContext(ctx))
if resp.StatusCode != 200 {
bytes, _ := io.ReadAll(resp.Body)
return resp, fmt.Errorf("%v", string(bytes))
}
return resp, err
}
func (c *OpenAIClient) CreateChatCompletion( func (c *OpenAIClient) CreateChatCompletion(
ctx context.Context, ctx context.Context,
params model.RequestParameters, params model.RequestParameters,
@ -187,14 +186,30 @@ func (c *OpenAIClient) CreateChatCompletion(
return "", fmt.Errorf("Can't create completion from no messages") return "", fmt.Errorf("Can't create completion from no messages")
} }
client := openai.NewClient(c.APIKey) req := createChatCompletionRequest(params, messages)
req := createChatCompletionRequest(c, params, messages) jsonData, err := json.Marshal(req)
resp, err := client.CreateChatCompletion(ctx, req)
if err != nil { if err != nil {
return "", err return "", err
} }
choice := resp.Choices[0] httpReq, err := http.NewRequest("POST", c.BaseURL+"/chat/completions", bytes.NewBuffer(jsonData))
if err != nil {
return "", err
}
resp, err := c.sendRequest(ctx, httpReq)
if err != nil {
return "", err
}
defer resp.Body.Close()
var completionResp ChatCompletionResponse
err = json.NewDecoder(resp.Body).Decode(&completionResp)
if err != nil {
return "", err
}
choice := completionResp.Choices[0]
var content string var content string
lastMessage := messages[len(messages)-1] lastMessage := messages[len(messages)-1]
@ -236,36 +251,60 @@ func (c *OpenAIClient) CreateChatCompletionStream(
return "", fmt.Errorf("Can't create completion from no messages") return "", fmt.Errorf("Can't create completion from no messages")
} }
client := openai.NewClient(c.APIKey) req := createChatCompletionRequest(params, messages)
req := createChatCompletionRequest(c, params, messages) req.Stream = true
stream, err := client.CreateChatCompletionStream(ctx, req) jsonData, err := json.Marshal(req)
if err != nil { if err != nil {
return "", err return "", err
} }
defer stream.Close()
httpReq, err := http.NewRequest("POST", c.BaseURL+"/chat/completions", bytes.NewBuffer(jsonData))
if err != nil {
return "", err
}
resp, err := c.sendRequest(ctx, httpReq)
if err != nil {
return "", err
}
defer resp.Body.Close()
content := strings.Builder{} content := strings.Builder{}
toolCalls := []openai.ToolCall{} toolCalls := []ToolCall{}
lastMessage := messages[len(messages)-1] lastMessage := messages[len(messages)-1]
if lastMessage.Role.IsAssistant() { if lastMessage.Role.IsAssistant() {
content.WriteString(lastMessage.Content) content.WriteString(lastMessage.Content)
} }
// Iterate stream segments reader := bufio.NewReader(resp.Body)
for { for {
response, e := stream.Recv() line, err := reader.ReadBytes('\n')
if errors.Is(e, io.EOF) { if err != nil {
if err == io.EOF {
break
}
return "", err
}
line = bytes.TrimSpace(line)
if len(line) == 0 || !bytes.HasPrefix(line, []byte("data: ")) {
continue
}
line = bytes.TrimPrefix(line, []byte("data: "))
if bytes.Equal(line, []byte("[DONE]")) {
break break
} }
if e != nil { var streamResp ChatCompletionStreamResponse
err = e err = json.Unmarshal(line, &streamResp)
break if err != nil {
return "", err
} }
delta := response.Choices[0].Delta delta := streamResp.Choices[0].Delta
if len(delta.ToolCalls) > 0 { if len(delta.ToolCalls) > 0 {
// Construct streamed tool_call arguments // Construct streamed tool_call arguments
for _, tc := range delta.ToolCalls { for _, tc := range delta.ToolCalls {
@ -278,7 +317,8 @@ func (c *OpenAIClient) CreateChatCompletionStream(
toolCalls[*tc.Index].Function.Arguments += tc.Function.Arguments toolCalls[*tc.Index].Function.Arguments += tc.Function.Arguments
} }
} }
} else { }
if len(delta.Content) > 0 {
output <- delta.Content output <- delta.Content
content.WriteString(delta.Content) content.WriteString(delta.Content)
} }
@ -301,5 +341,5 @@ func (c *OpenAIClient) CreateChatCompletionStream(
} }
} }
return content.String(), err return content.String(), nil
} }

View File

@ -0,0 +1,71 @@
package openai
type OpenAIClient struct {
APIKey string
BaseURL string
}
type ChatCompletionMessage struct {
Role string `json:"role"`
Content string `json:"content,omitempty"`
ToolCalls []ToolCall `json:"tool_calls,omitempty"`
ToolCallID string `json:"tool_call_id,omitempty"`
}
type ToolCall struct {
Type string `json:"type"`
ID string `json:"id"`
Index *int `json:"index,omitempty"`
Function FunctionDefinition `json:"function"`
}
type FunctionDefinition struct {
Name string `json:"name"`
Description string `json:"description"`
Parameters ToolParameters `json:"parameters"`
Arguments string `json:"arguments,omitempty"`
}
type ToolParameters struct {
Type string `json:"type"`
Properties map[string]ToolParameter `json:"properties,omitempty"`
Required []string `json:"required,omitempty"`
}
type ToolParameter struct {
Type string `json:"type"`
Description string `json:"description"`
Enum []string `json:"enum,omitempty"`
}
type Tool struct {
Type string `json:"type"`
Function FunctionDefinition `json:"function"`
}
type ChatCompletionRequest struct {
Model string `json:"model"`
MaxTokens int `json:"max_tokens,omitempty"`
Temperature float32 `json:"temperature,omitempty"`
Messages []ChatCompletionMessage `json:"messages"`
N int `json:"n"`
Tools []Tool `json:"tools,omitempty"`
ToolChoice string `json:"tool_choice,omitempty"`
Stream bool `json:"stream,omitempty"`
}
type ChatCompletionChoice struct {
Message ChatCompletionMessage `json:"message"`
}
type ChatCompletionResponse struct {
Choices []ChatCompletionChoice `json:"choices"`
}
type ChatCompletionStreamChoice struct {
Delta ChatCompletionMessage `json:"delta"`
}
type ChatCompletionStreamResponse struct {
Choices []ChatCompletionStreamChoice `json:"choices"`
}

View File

@ -115,6 +115,14 @@ func newChatModel(tui *model) chatModel {
)), )),
} }
system := tui.ctx.GetSystemPrompt()
if system != "" {
m.messages = []models.Message{{
Role: models.MessageRoleSystem,
Content: system,
}}
}
m.input.Focus() m.input.Focus()
m.input.MaxHeight = 0 m.input.MaxHeight = 0
m.input.CharLimit = 0 m.input.CharLimit = 0
@ -177,16 +185,17 @@ func (m *chatModel) handleInput(msg tea.KeyMsg) (bool, tea.Cmd) {
switch msg.String() { switch msg.String() {
case "esc": case "esc":
return true, func() tea.Msg {
return msgChangeState(stateConversations)
}
case "ctrl+c":
if m.waitingForReply { if m.waitingForReply {
m.stopSignal <- struct{}{} m.stopSignal <- struct{}{}
return true, nil return true, nil
} }
return true, func() tea.Msg { return true, func() tea.Msg {
return msgChangeState(stateConversations) return msgStateChange(stateConversations)
}
case "ctrl+c":
if m.waitingForReply {
m.stopSignal <- struct{}{}
return true, nil
} }
case "ctrl+p": case "ctrl+p":
m.persistence = !m.persistence m.persistence = !m.persistence
@ -227,10 +236,12 @@ func (m *chatModel) handleResize(width, height int) {
func (m chatModel) Update(msg tea.Msg) (chatModel, tea.Cmd) { func (m chatModel) Update(msg tea.Msg) (chatModel, tea.Cmd) {
var cmds []tea.Cmd var cmds []tea.Cmd
switch msg := msg.(type) { switch msg := msg.(type) {
case msgChangeState: case msgStateEnter:
if m.opts.convShortname != "" && m.conversation.ShortName.String != m.opts.convShortname { if m.opts.convShortname != "" && m.conversation.ShortName.String != m.opts.convShortname {
cmds = append(cmds, m.loadConversation(m.opts.convShortname)) cmds = append(cmds, m.loadConversation(m.opts.convShortname))
} }
m.rebuildMessageCache()
m.updateContent()
case tea.WindowSizeMsg: case tea.WindowSizeMsg:
m.handleResize(msg.Width, msg.Height) m.handleResize(msg.Width, msg.Height)
case msgTempfileEditorClosed: case msgTempfileEditorClosed:
@ -254,7 +265,8 @@ func (m chatModel) Update(msg tea.Msg) (chatModel, tea.Cmd) {
cmds = append(cmds, m.loadMessages(m.conversation)) cmds = append(cmds, m.loadMessages(m.conversation))
case msgMessagesLoaded: case msgMessagesLoaded:
m.selectedMessage = len(msg) - 1 m.selectedMessage = len(msg) - 1
m.setMessages(msg) m.messages = msg
m.rebuildMessageCache()
m.updateContent() m.updateContent()
m.content.GotoBottom() m.content.GotoBottom()
case msgResponseChunk: case msgResponseChunk:
@ -358,10 +370,12 @@ func (m chatModel) Update(msg tea.Msg) (chatModel, tea.Cmd) {
fixedHeight := height(m.views.header) + height(m.views.error) + height(m.views.footer) fixedHeight := height(m.views.header) + height(m.views.error) + height(m.views.footer)
// calculate clamped input height to accomodate input text // calculate clamped input height to accomodate input text
// minimum 4 lines, maximum half of content area
newHeight := max(4, min((m.height-fixedHeight-1)/2, m.input.LineCount())) newHeight := max(4, min((m.height-fixedHeight-1)/2, m.input.LineCount()))
m.input.SetHeight(newHeight) m.input.SetHeight(newHeight)
m.views.input = m.input.View() m.views.input = m.input.View()
// remaining height towards content
m.content.Height = m.height - fixedHeight - height(m.views.input) m.content.Height = m.height - fixedHeight - height(m.views.input)
m.views.content = m.content.View() m.views.content = m.content.View()
} }
@ -701,11 +715,6 @@ func (m *chatModel) footerView() string {
return footerStyle.Width(m.width).Render(footer) return footerStyle.Width(m.width).Render(footer)
} }
func (m *chatModel) setMessages(messages []models.Message) {
m.messages = messages
m.rebuildMessageCache()
}
func (m *chatModel) setMessage(i int, msg models.Message) { func (m *chatModel) setMessage(i int, msg models.Message) {
if i >= len(m.messages) { if i >= len(m.messages) {
panic("i out of range") panic("i out of range")

View File

@ -115,7 +115,7 @@ func (m *conversationsModel) handleResize(width, height int) {
func (m conversationsModel) Update(msg tea.Msg) (conversationsModel, tea.Cmd) { func (m conversationsModel) Update(msg tea.Msg) (conversationsModel, tea.Cmd) {
var cmds []tea.Cmd var cmds []tea.Cmd
switch msg := msg.(type) { switch msg := msg.(type) {
case msgChangeState: case msgStateChange:
cmds = append(cmds, m.loadConversations()) cmds = append(cmds, m.loadConversations())
m.content.SetContent(m.renderConversationList()) m.content.SetContent(m.renderConversationList())
case tea.WindowSizeMsg: case tea.WindowSizeMsg:

View File

@ -35,8 +35,10 @@ type views struct {
} }
type ( type (
// send to change the current app state // send to change the current state
msgChangeState state msgStateChange state
// sent to a state when it is entered
msgStateEnter struct{}
// sent when an error occurs // sent when an error occurs
msgError error msgError error
) )
@ -81,7 +83,7 @@ func (m model) Init() tea.Cmd {
m.conversations.Init(), m.conversations.Init(),
m.chat.Init(), m.chat.Init(),
func() tea.Msg { func() tea.Msg {
return msgChangeState(m.state) return msgStateChange(m.state)
}, },
) )
} }
@ -124,18 +126,20 @@ func (m model) Update(msg tea.Msg) (tea.Model, tea.Cmd) {
if handled { if handled {
return m, cmd return m, cmd
} }
case msgChangeState: case msgStateChange:
switch msg { m.state = state(msg)
switch m.state {
case stateChat: case stateChat:
m.chat.handleResize(m.width, m.height) m.chat.handleResize(m.width, m.height)
case stateConversations: case stateConversations:
m.conversations.handleResize(m.width, m.height) m.conversations.handleResize(m.width, m.height)
} }
m.state = state(msg) return m, func() tea.Msg { return msgStateEnter(struct{}{}) }
case msgConversationSelected: case msgConversationSelected:
// passed up through conversation list model
m.opts.convShortname = msg.ShortName.String m.opts.convShortname = msg.ShortName.String
cmds = append(cmds, func() tea.Msg { cmds = append(cmds, func() tea.Msg {
return msgChangeState(stateChat) return msgStateChange(stateChat)
}) })
case tea.WindowSizeMsg: case tea.WindowSizeMsg:
m.width, m.height = msg.Width, msg.Height m.width, m.height = msg.Width, msg.Height