lmcli/pkg/cli/openai.go

package cli

import (
	"context"
	"database/sql"
	"encoding/json"
	"errors"
	"fmt"
	"io"
	"strings"

	openai "github.com/sashabaranov/go-openai"
)

// CreateChatCompletionRequest builds the openai.ChatCompletionRequest for the
// given model, conversation messages and token limit. Each Message is
// converted to an openai.ChatCompletionMessage (including its tool call ID and
// stored tool calls, when present), and every entry of AvailableTools is
// attached to the request.
func CreateChatCompletionRequest(model string, messages []Message, maxTokens int) openai.ChatCompletionRequest {
	// Allocated up front so the slice is non-nil even without any messages.
	converted := make([]openai.ChatCompletionMessage, 0, len(messages))
	for i := range messages {
		src := &messages[i]

		var out openai.ChatCompletionMessage
		out.Role = src.Role
		out.Content = src.OriginalContent
		if src.ToolCallID.Valid {
			out.ToolCallID = src.ToolCallID.String
		}
		if src.ToolCalls.Valid {
			// The stored tool calls are JSON; decode them straight into the
			// outgoing message.
			if err := json.Unmarshal([]byte(src.ToolCalls.String), &out.ToolCalls); err != nil {
				// TODO: handle, this shouldn't really happen since
				// we only save the successfully marshal'd data to database
				fmt.Printf("Error unmarshalling the tool_calls JSON: %v\n", err)
			}
		}

		converted = append(converted, out)
	}

	// TODO: support some way to limit which tools are available per-request
	var tools []openai.Tool
	for _, entry := range AvailableTools {
		tools = append(tools, entry.Tool)
	}

	req := openai.ChatCompletionRequest{
		Model:     model,
		MaxTokens: maxTokens,
		N:         1, // limit responses to 1 "choice". we use choices[0] to reference it
	}
	req.Messages = converted
	req.Tools = tools
	req.ToolChoice = "auto" // TODO: allow limiting/forcing which function is called?
	return req
}

// CreateChatCompletion submits a Chat Completion API request and returns the
// response. CreateChatCompletion will recursively call itself in the case of
// tool calls, until a response is received with the final user-facing output.
//
// An error is returned when the API call fails, when the response contains no
// choices, when the model replies with both content and tool calls, or when
// executing the requested tool calls fails.
func CreateChatCompletion(model string, messages []Message, maxTokens int) (string, error) {
	client := openai.NewClient(*config.OpenAI.APIKey)
	req := CreateChatCompletionRequest(model, messages, maxTokens)
	resp, err := client.CreateChatCompletion(context.Background(), req)
	if err != nil {
		return "", err
	}

	// Guard the Choices[0] access below: an empty choice list would
	// otherwise panic with an index out of range.
	if len(resp.Choices) == 0 {
		return "", errors.New("chat completion response contained no choices")
	}
	choice := resp.Choices[0]

	if len(choice.Message.ToolCalls) == 0 {
		// Return the user-facing message.
		return choice.Message.Content, nil
	}

	if choice.Message.Content != "" {
		return "", fmt.Errorf("Model replied with user-facing content in addition to tool calls. Unsupported.")
	}

	// Append the assistant's reply with its request for tool calls
	toolCallJson, err := json.Marshal(choice.Message.ToolCalls)
	if err != nil {
		return "", fmt.Errorf("marshalling tool calls: %w", err)
	}
	messages = append(messages, Message{
		Role:      "assistant",
		ToolCalls: sql.NullString{String: string(toolCallJson), Valid: true},
	})

	toolReplies, err := ExecuteToolCalls(choice.Message.ToolCalls)
	if err != nil {
		return "", err
	}

	// Recurse into CreateChatCompletion with the tool call replies added
	// to the original messages
	return CreateChatCompletion(model, append(messages, toolReplies...), maxTokens)
}

// CreateChatCompletionStream submits a streaming Chat Completion API request
// and both returns and streams the response to the provided output channel.
// May return a partial response if an error occurs mid-stream.
//
// Streamed tool call fragments are accumulated by index; once the stream ends
// cleanly the tool calls are executed and the function recurses with their
// replies appended to messages. Tool calls are never executed after a
// mid-stream error, since their arguments may be incomplete.
func CreateChatCompletionStream(model string, messages []Message, maxTokens int, output chan<- string) (string, error) {
	client := openai.NewClient(*config.OpenAI.APIKey)
	req := CreateChatCompletionRequest(model, messages, maxTokens)

	stream, err := client.CreateChatCompletionStream(context.Background(), req)
	if err != nil {
		return "", err
	}
	defer stream.Close()

	var content strings.Builder
	var toolCalls []openai.ToolCall

	// Iterate stream segments
	for {
		response, recvErr := stream.Recv()
		if errors.Is(recvErr, io.EOF) {
			break
		}
		if recvErr != nil {
			// Stop here with whatever content was received so far. Falling
			// through to the tool call handling would run tools with
			// truncated arguments and hide this error.
			return content.String(), recvErr
		}

		// Skip chunks that carry no choices instead of panicking on
		// Choices[0].
		if len(response.Choices) == 0 {
			continue
		}

		delta := response.Choices[0].Delta
		if len(delta.ToolCalls) == 0 {
			output <- delta.Content
			content.WriteString(delta.Content)
			continue
		}

		// Construct streamed tool_call arguments
		for _, tc := range delta.ToolCalls {
			if tc.Index == nil {
				return "", fmt.Errorf("Unexpected nil index for streamed tool call.")
			}
			idx := *tc.Index
			switch {
			case idx < 0 || idx > len(toolCalls):
				// A negative or skipped index cannot be assembled correctly
				// and would otherwise panic or split one call into several.
				return "", fmt.Errorf("unexpected index %d for streamed tool call (%d received so far)", idx, len(toolCalls))
			case idx == len(toolCalls):
				// First fragment of a new tool call.
				toolCalls = append(toolCalls, tc)
			default:
				// Continuation of an already known tool call.
				toolCalls[idx].Function.Arguments += tc.Function.Arguments
			}
		}
	}

	if len(toolCalls) == 0 {
		return content.String(), nil
	}

	if content.String() != "" {
		return "", fmt.Errorf("Model replied with user-facing content in addition to tool calls. Unsupported.")
	}

	// Append the assistant's reply with its request for tool calls
	toolCallJson, err := json.Marshal(toolCalls)
	if err != nil {
		return "", fmt.Errorf("marshalling tool calls: %w", err)
	}
	messages = append(messages, Message{
		Role:      "assistant",
		ToolCalls: sql.NullString{String: string(toolCallJson), Valid: true},
	})

	toolReplies, err := ExecuteToolCalls(toolCalls)
	if err != nil {
		return "", err
	}

	// Recurse into CreateChatCompletionStream with the tool call replies
	// added to the original messages
	return CreateChatCompletionStream(model, append(messages, toolReplies...), maxTokens, output)
}
Project restructure Moved source files into cmd/ and pkg/ directories 2023-11-04 12:20:13 -06:00			`package cli`
Initial prototype 2023-10-30 15:23:07 -06:00
			`import (`
			`"context"`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`"database/sql"`
			`"encoding/json"`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`"errors"`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`"fmt"`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`"io"`
Refactor streamed response handling Update CreateChangeCompletionStream to return the entire response upon stream completion. Renamed HandleDelayedResponse to HandleDelayedContent, which no longer returns the content. Removes the need wrapping HandleDelayedContent in an immediately invoked function and the passing of the completed response over a channel. Also allows us to better handle the case of partial a response. 2023-11-23 20:45:43 -07:00			`"strings"`
Run gofmt/goimports on go sources 2023-11-04 16:56:22 -06:00
Initial prototype 2023-10-30 15:23:07 -06:00			`openai "github.com/sashabaranov/go-openai"`
			`)`

Parameterize the openai model used Add `openai.defaultConfig` to set the default, will allow overriding with CLI flag 2023-11-08 23:07:52 -07:00			`func CreateChatCompletionRequest(model string, messages []Message, maxTokens int) openai.ChatCompletionRequest {`
Treat the system message like any other Removed the system parameter on ChatCopmletion functions, and persist it in conversations as well. 2023-11-05 01:54:12 -06:00			`chatCompletionMessages := []openai.ChatCompletionMessage{}`
Run gofmt/goimports on go sources 2023-11-04 16:56:22 -06:00			`for _, m := range messages {`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`message := openai.ChatCompletionMessage{`
Run gofmt/goimports on go sources 2023-11-04 16:56:22 -06:00			`Role: m.Role,`
Initial prototype 2023-10-30 15:23:07 -06:00			`Content: m.OriginalContent,`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`}`
			`if m.ToolCallID.Valid {`
			`message.ToolCallID = m.ToolCallID.String`
			`}`
			`if m.ToolCalls.Valid {`
			`// unmarshal directly into chatMessage.ToolCalls`
			`err := json.Unmarshal([]byte(m.ToolCalls.String), &message.ToolCalls)`
			`if err != nil {`
			`// TODO: handle, this shouldn't really happen since`
			`// we only save the successfully marshal'd data to database`
			`fmt.Printf("Error unmarshalling the tool_calls JSON: %v\n", err)`
			`}`
			`}`
			`chatCompletionMessages = append(chatCompletionMessages, message)`
			`}`

			`var tools []openai.Tool`
			`for _, t := range AvailableTools {`
			`// TODO: support some way to limit which tools are available per-request`
			`tools = append(tools, t.Tool)`
Initial prototype 2023-10-30 15:23:07 -06:00			`}`

Parameterize maxTokens Minor formatting/commet changes 2023-11-05 11:19:30 -07:00			`return openai.ChatCompletionRequest{`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`Model: model,`
			`Messages: chatCompletionMessages,`
			`MaxTokens: maxTokens,`
			`N: 1, // limit responses to 1 "choice". we use choices[0] to reference it`
			`Tools: tools,`
			`ToolChoice: "auto", // TODO: allow limiting/forcing which function is called?`
Increase MaxTokens to 256 on OpenAI requests Slight refactor 2023-10-30 16:23:27 -06:00			`}`
			`}`

Parameterize maxTokens Minor formatting/commet changes 2023-11-05 11:19:30 -07:00			`// CreateChatCompletion submits a Chat Completion API request and returns the`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`// response. CreateChatCompletion will recursively call itself in the case of`
			`// tool calls, until a response is received with the final user-facing output.`
Parameterize the openai model used Add `openai.defaultConfig` to set the default, will allow overriding with CLI flag 2023-11-08 23:07:52 -07:00			`func CreateChatCompletion(model string, messages []Message, maxTokens int) (string, error) {`
Set config defaults using a "default" struct tag Add new SetStructDefaults function to handle the "defaults" struct tag. Only works on struct fields which are pointers (in order to be able to distinguish between not set (nil) and zero values). So, the Config struct has been updated to use pointer fields and we now need to dereference those pointers to use them. 2023-11-18 18:14:00 -07:00			`client := openai.NewClient(*config.OpenAI.APIKey)`
Parameterize the openai model used Add `openai.defaultConfig` to set the default, will allow overriding with CLI flag 2023-11-08 23:07:52 -07:00			`req := CreateChatCompletionRequest(model, messages, maxTokens)`
Parameterize maxTokens Minor formatting/commet changes 2023-11-05 11:19:30 -07:00			`resp, err := client.CreateChatCompletion(context.Background(), req)`
Initial prototype 2023-10-30 15:23:07 -06:00			`if err != nil {`
Include system prompt in OpenAI chat completion requests 2023-11-04 16:07:06 -06:00			`return "", err`
Initial prototype 2023-10-30 15:23:07 -06:00			`}`

Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`choice := resp.Choices[0]`

			`if len(choice.Message.ToolCalls) > 0 {`
			`if choice.Message.Content != "" {`
			`return "", fmt.Errorf("Model replied with user-facing content in addition to tool calls. Unsupported.")`
			`}`

			`// Append the assistant's reply with its request for tool calls`
			`toolCallJson, _ := json.Marshal(choice.Message.ToolCalls)`
			`messages = append(messages, Message{`
			`Role: "assistant",`
			`ToolCalls: sql.NullString{String: string(toolCallJson), Valid: true},`
			`})`

			`toolReplies, err := ExecuteToolCalls(choice.Message.ToolCalls)`
			`if err != nil {`
			`return "", err`
			`}`

			`// Recurse into CreateChatCompletion with the tool call replies added`
			`// to the original messages`
			`return CreateChatCompletion(model, append(messages, toolReplies...), maxTokens)`
			`}`

			`// Return the user-facing message.`
			`return choice.Message.Content, nil`
Initial prototype 2023-10-30 15:23:07 -06:00			`}`
Use the streamed response API 2023-10-30 15:45:21 -06:00
Parameterize maxTokens Minor formatting/commet changes 2023-11-05 11:19:30 -07:00			`// CreateChatCompletionStream submits a streaming Chat Completion API request`
Refactor streamed response handling Update CreateChangeCompletionStream to return the entire response upon stream completion. Renamed HandleDelayedResponse to HandleDelayedContent, which no longer returns the content. Removes the need wrapping HandleDelayedContent in an immediately invoked function and the passing of the completed response over a channel. Also allows us to better handle the case of partial a response. 2023-11-23 20:45:43 -07:00			`// and both returns and streams the response to the provided output channel.`
			`// May return a partial response if an error occurs mid-stream.`
			`func CreateChatCompletionStream(model string, messages []Message, maxTokens int, output chan<- string) (string, error) {`
Set config defaults using a "default" struct tag Add new SetStructDefaults function to handle the "defaults" struct tag. Only works on struct fields which are pointers (in order to be able to distinguish between not set (nil) and zero values). So, the Config struct has been updated to use pointer fields and we now need to dereference those pointers to use them. 2023-11-18 18:14:00 -07:00			`client := openai.NewClient(*config.OpenAI.APIKey)`
Parameterize the openai model used Add `openai.defaultConfig` to set the default, will allow overriding with CLI flag 2023-11-08 23:07:52 -07:00			`req := CreateChatCompletionRequest(model, messages, maxTokens)`
Use the streamed response API 2023-10-30 15:45:21 -06:00
Parameterize maxTokens Minor formatting/commet changes 2023-11-05 11:19:30 -07:00			`stream, err := client.CreateChatCompletionStream(context.Background(), req)`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`if err != nil {`
Refactor streamed response handling Update CreateChangeCompletionStream to return the entire response upon stream completion. Renamed HandleDelayedResponse to HandleDelayedContent, which no longer returns the content. Removes the need wrapping HandleDelayedContent in an immediately invoked function and the passing of the completed response over a channel. Also allows us to better handle the case of partial a response. 2023-11-23 20:45:43 -07:00			`return "", err`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`}`
			`defer stream.Close()`

Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00			`content := strings.Builder{}`
			`toolCalls := []openai.ToolCall{}`

			`// Iterate stream segments`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`for {`
Refactor streamed response handling Update CreateChangeCompletionStream to return the entire response upon stream completion. Renamed HandleDelayedResponse to HandleDelayedContent, which no longer returns the content. Removes the need wrapping HandleDelayedContent in an immediately invoked function and the passing of the completed response over a channel. Also allows us to better handle the case of partial a response. 2023-11-23 20:45:43 -07:00			`response, e := stream.Recv()`
			`if errors.Is(e, io.EOF) {`
			`break`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`}`

Refactor streamed response handling Update CreateChangeCompletionStream to return the entire response upon stream completion. Renamed HandleDelayedResponse to HandleDelayedContent, which no longer returns the content. Removes the need wrapping HandleDelayedContent in an immediately invoked function and the passing of the completed response over a channel. Also allows us to better handle the case of partial a response. 2023-11-23 20:45:43 -07:00			`if e != nil {`
			`err = e`
			`break`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`}`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00
			`delta := response.Choices[0].Delta`
			`if len(delta.ToolCalls) > 0 {`
			`// Construct streamed tool_call arguments`
			`for _, tc := range delta.ToolCalls {`
			`if tc.Index == nil {`
			`return "", fmt.Errorf("Unexpected nil index for streamed tool call.")`
			`}`
			`if len(toolCalls) <= *tc.Index {`
			`toolCalls = append(toolCalls, tc)`
			`} else {`
			`toolCalls[*tc.Index].Function.Arguments += tc.Function.Arguments`
			`}`
			`}`
			`} else {`
			`output <- delta.Content`
			`content.WriteString(delta.Content)`
			`}`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`}`
Add initial support for tool/function calling Adds the following tools: - read_dir - list a directory's contents - read_file - read the content of a file - write_file - write contents to a file - insert_file_lines - insert lines in a file - replace_file_lines - replace or remove lines in a file 2023-11-25 17:55:18 -07:00
			`if len(toolCalls) > 0 {`
			`if content.String() != "" {`
			`return "", fmt.Errorf("Model replied with user-facing content in addition to tool calls. Unsupported.")`
			`}`

			`// Append the assistant's reply with its request for tool calls`
			`toolCallJson, _ := json.Marshal(toolCalls)`
			`messages = append(messages, Message{`
			`Role: "assistant",`
			`ToolCalls: sql.NullString{String: string(toolCallJson), Valid: true},`
			`})`

			`toolReplies, err := ExecuteToolCalls(toolCalls)`
			`if err != nil {`
			`return "", err`
			`}`

			`// Recurse into CreateChatCompletionStream with the tool call replies`
			`// added to the original messages`
			`return CreateChatCompletionStream(model, append(messages, toolReplies...), maxTokens, output)`
			`}`

			`return content.String(), err`
Use the streamed response API 2023-10-30 15:45:21 -06:00			`}`