
Commit ed2b92e ("Updated")
1 parent b84adbc

8 files changed: +140 additions, -36 deletions


README.md
Lines changed: 4 additions & 4 deletions

@@ -202,10 +202,10 @@ The options are as follows:
 | `llm.WithToolKit(llm.ToolKit)` | Cannot be combined with streaming | Yes | Yes | - | The set of tools to use. |
 | `llm.WithStopSequence(string, string, ...)` | Yes | Yes | Yes | - | Stop generation if one of these tokens is detected. |
 | `llm.WithSystemPrompt(string)` | No | Yes | Yes | - | Set the system prompt for the model. |
-| `llm.WithSeed(uint64)` | No | Yes | Yes | - | The seed to use for random sampling. If set, different calls will generate deterministic results. |
-| `llm.WithFormat(string)` | No | Yes | Use `json_format` or `text` | - | The format of the response. For Mistral, you must also instruct the model to produce JSON yourself with a system or a user message. |
-| `mistral.WithPresencePenalty(float64)` | No | No | Yes | - | Determines how much the model penalizes the repetition of words or phrases. A higher presence penalty encourages the model to use a wider variety of words and phrases, making the output more diverse and creative. |
-| `mistral.WithFequencyPenalty(float64)` | No | No | Yes | - | Penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition. |
+| `llm.WithSeed(uint64)` | Yes | Yes | Yes | - | The seed to use for random sampling. If set, different calls will generate deterministic results. |
+| `llm.WithFormat(string)` | Use `json` | Yes | Use `json_format` or `text` | - | The format of the response. For Mistral, you must also instruct the model to produce JSON yourself with a system or a user message. |
+| `llm.WithPresencePenalty(float64)` | Yes | No | Yes | - | Determines how much the model penalizes the repetition of words or phrases. A higher presence penalty encourages the model to use a wider variety of words and phrases, making the output more diverse and creative. |
+| `llm.WithFequencyPenalty(float64)` | Yes | No | Yes | - | Penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition. |
 | `mistral.WithPrediction(string)` | No | No | Yes | - | Enable users to specify expected results, optimizing response times by leveraging known or predictable content. This approach is especially effective for updating text documents or code files with minimal changes, reducing latency while maintaining high-quality results. |
 | `llm.WithSafePrompt()` | No | No | Yes | - | Whether to inject a safety prompt before all conversations. |
 | `llm.WithNumCompletions(uint64)` | No | No | Yes | - | Number of completions to return for each request. |
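A rough usage sketch of the relocated options (hypothetical: client and model are assumed to be set up as in the tests further down; note also that the table's `WithFequencyPenalty` spelling differs from the `WithFrequencyPenalty` function actually added in opt.go below):

	// Sketch only: client/model setup follows the pattern in chat_test.go.
	response, err := client.Chat(context.TODO(), model.UserPrompt("why is the sky blue?"),
		llm.WithSeed(42),              // deterministic sampling across calls
		llm.WithPresencePenalty(0.5),  // push toward more varied wording
		llm.WithFrequencyPenalty(0.5), // damp words already used often
	)
	if err != nil {
		log.Fatal(err)
	}
	log.Println(response)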

opt.go
Lines changed: 20 additions & 0 deletions

@@ -271,6 +271,26 @@ func WithTopK(v uint64) Opt {
 	}
 }
 
+func WithPresencePenalty(v float64) Opt {
+	return func(o *Opts) error {
+		if v < -2 || v > 2 {
+			return ErrBadParameter.With("presence_penalty")
+		}
+		o.Set("presence_penalty", v)
+		return nil
+	}
+}
+
+func WithFrequencyPenalty(v float64) Opt {
+	return func(o *Opts) error {
+		if v < -2 || v > 2 {
+			return ErrBadParameter.With("frequency_penalty")
+		}
+		o.Set("frequency_penalty", v)
+		return nil
+	}
+}
+
 // The maximum number of tokens to generate in the completion.
 func WithMaxTokens(v uint64) Opt {
 	return func(o *Opts) error {
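Both new options follow the package's functional-option shape: an Opt is a closure over *Opts that validates its argument before writing it. A minimal sketch of the failure path (hypothetical: how the *Opts value is obtained is assumed and not part of this diff):

	// Out of the accepted [-2, 2] range, so applying the option
	// should return ErrBadParameter for "presence_penalty".
	opt := llm.WithPresencePenalty(3)
	if err := opt(opts); err != nil { // opts is some *llm.Opts (assumed setup)
		log.Println(err)
	}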

pkg/mistral/opt.go
Lines changed: 0 additions & 20 deletions

@@ -9,26 +9,6 @@ import (
 ///////////////////////////////////////////////////////////////////////////////
 // PUBLIC METHODS
 
-func WithPresencePenalty(v float64) llm.Opt {
-	return func(o *llm.Opts) error {
-		if v < -2 || v > 2 {
-			return llm.ErrBadParameter.With("presence_penalty")
-		}
-		o.Set("presence_penalty", v)
-		return nil
-	}
-}
-
-func WithFrequencyPenalty(v float64) llm.Opt {
-	return func(o *llm.Opts) error {
-		if v < -2 || v > 2 {
-			return llm.ErrBadParameter.With("frequency_penalty")
-		}
-		o.Set("frequency_penalty", v)
-		return nil
-	}
-}
-
 func WithPrediction(v string) llm.Opt {
 	return func(o *llm.Opts) error {
 		o.Set("prediction", v)

pkg/ollama/chat.go
Lines changed: 10 additions & 6 deletions

@@ -68,9 +68,9 @@ func (ollama *Client) Chat(ctx context.Context, context llm.Context, opts ...llm.Opt) (llm.Completion, error) {
 
 	// Append the system prompt at the beginning
 	messages := make([]*Message, 0, len(context.(*session).seq)+1)
-	//if system := opt.SystemPrompt(); system != "" {
-	//	messages = append(messages, systemPrompt(system))
-	//}
+	if system := opt.SystemPrompt(); system != "" {
+		messages = append(messages, systemPrompt(system))
+	}
 
 	// Always append the first message of each completion
 	for _, message := range context.(*session).seq {
@@ -92,7 +92,7 @@ func (ollama *Client) Chat(ctx context.Context, context llm.Context, opts ...llm.Opt) (llm.Completion, error) {
 	}
 
 	// Response
-	var response Response
+	var response, delta Response
 	reqopts := []client.RequestOpt{
 		client.OptPath("chat"),
 	}
@@ -111,12 +111,16 @@ func (ollama *Client) Chat(ctx context.Context, context llm.Context, opts ...llm.Opt) (llm.Completion, error) {
 	}
 
 	// Response
-	if err := ollama.DoWithContext(ctx, req, &response, reqopts...); err != nil {
+	if err := ollama.DoWithContext(ctx, req, &delta, reqopts...); err != nil {
 		return nil, err
 	}
 
 	// Return success
-	return &response, nil
+	if optStream(ollama, opt) {
+		return &response, nil
+	} else {
+		return &delta, nil
+	}
 }
 
 ///////////////////////////////////////////////////////////////////////////////
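Two things change here: the system prompt is re-enabled (the commented-out block becomes live code), and decoding now targets delta so that streaming and non-streaming calls can return different values. When streaming, each chunk is decoded into delta and, in code outside this hunk, presumably folded into the accumulated response that the caller finally receives; without streaming, the single decoded delta is the whole answer. The caller-side contract, mirroring chat_test.go (the callback signature is the one used there):

	response, err := client.Chat(context.TODO(), model.UserPrompt("why is the sky blue?"),
		llm.WithStream(func(chunk llm.Completion) {
			// invoked once per streamed fragment
			log.Println(chunk)
		}))
	// response is the accumulated completion, not the last fragment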

pkg/ollama/chat_test.go
Lines changed: 68 additions & 0 deletions

@@ -0,0 +1,68 @@
+package ollama_test
+
+import (
+	"context"
+	"testing"
+
+	// Packages
+
+	llm "github.com/mutablelogic/go-llm"
+	ollama "github.com/mutablelogic/go-llm/pkg/ollama"
+	assert "github.com/stretchr/testify/assert"
+)
+
+func Test_chat_001(t *testing.T) {
+	// Pull the model
+	model, err := client.PullModel(context.TODO(), "qwen:0.5b", ollama.WithPullStatus(func(status *ollama.PullStatus) {
+		t.Log(status)
+	}))
+	if err != nil {
+		t.FailNow()
+	}
+
+	t.Run("Temperature", func(t *testing.T) {
+		assert := assert.New(t)
+		response, err := client.Chat(context.TODO(), model.UserPrompt("why is the sky blue?"), llm.WithTemperature(0.5))
+		if !assert.NoError(err) {
+			t.FailNow()
+		}
+		t.Log(response)
+	})
+
+	t.Run("TopP", func(t *testing.T) {
+		assert := assert.New(t)
+		response, err := client.Chat(context.TODO(), model.UserPrompt("why is the sky blue?"), llm.WithTopP(0.5))
+		if !assert.NoError(err) {
+			t.FailNow()
+		}
+		t.Log(response)
+	})
+	t.Run("TopK", func(t *testing.T) {
+		assert := assert.New(t)
+		response, err := client.Chat(context.TODO(), model.UserPrompt("why is the sky blue?"), llm.WithTopK(50))
+		if !assert.NoError(err) {
+			t.FailNow()
+		}
+		t.Log(response)
+	})
+
+	t.Run("Stream", func(t *testing.T) {
+		assert := assert.New(t)
+		response, err := client.Chat(context.TODO(), model.UserPrompt("why is the sky blue?"), llm.WithStream(func(stream llm.Completion) {
+			t.Log(stream)
+		}))
+		if !assert.NoError(err) {
+			t.FailNow()
+		}
+		t.Log(response)
+	})
+
+	t.Run("Stop", func(t *testing.T) {
+		assert := assert.New(t)
+		response, err := client.Chat(context.TODO(), model.UserPrompt("why is the sky blue?"), llm.WithStopSequence("sky"))
+		if !assert.NoError(err) {
+			t.FailNow()
+		}
+		t.Log(response)
+	})
+}
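Note that client is not declared in this new file, so it presumably comes from a shared fixture elsewhere in the ollama_test package. A hypothetical sketch of such a fixture, only so the test reads in isolation (the constructor name and endpoint are assumptions, not taken from this commit):

	var client *ollama.Client

	func TestMain(m *testing.M) {
		var err error
		client, err = ollama.New("http://localhost:11434") // assumed constructor and endpoint
		if err != nil {
			os.Exit(1)
		}
		os.Exit(m.Run())
	}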

pkg/ollama/embedding_test.go
Lines changed: 12 additions & 3 deletions

@@ -9,13 +9,22 @@ import (
 	assert "github.com/stretchr/testify/assert"
 )
 
-func Test_embed_001(t *testing.T) {
-	t.Run("Embedding", func(t *testing.T) {
+func Test_embeddings_001(t *testing.T) {
+	t.Run("Embedding1", func(t *testing.T) {
 		assert := assert.New(t)
 		embedding, err := client.GenerateEmbedding(context.TODO(), "qwen:0.5b", []string{"hello, world"})
 		if !assert.NoError(err) {
 			t.FailNow()
 		}
-		t.Log(embedding)
+		assert.Equal(1, len(embedding.Embeddings))
+	})
+
+	t.Run("Embedding2", func(t *testing.T) {
+		assert := assert.New(t)
+		embedding, err := client.GenerateEmbedding(context.TODO(), "qwen:0.5b", []string{"hello, world", "goodbye cruel world"})
+		if !assert.NoError(err) {
+			t.FailNow()
+		}
+		assert.Equal(2, len(embedding.Embeddings))
 	})
 }
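The renamed test now asserts the shape of the result instead of just logging it: one embedding per input string. A hedged sketch of consuming the result (the Embeddings field name comes from the assertions above; treating each entry as a slice of values is an assumption):

	embedding, err := client.GenerateEmbedding(context.TODO(), "qwen:0.5b",
		[]string{"hello, world", "goodbye cruel world"})
	if err == nil {
		for i, vec := range embedding.Embeddings {
			log.Printf("input %d -> %d dimensions", i, len(vec)) // assumes one vector per input
		}
	}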

pkg/ollama/model.go
Lines changed: 2 additions & 0 deletions

@@ -162,6 +162,8 @@ func (ollama *Client) GetModel(ctx context.Context, name string) (llm.Model, error) {
 	var response ModelMeta
 	if err := ollama.DoWithContext(ctx, req, &response, client.OptPath("show")); err != nil {
 		return nil, err
+	} else {
+		response.Name = name
 	}
 
 	// Return success
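The two added lines compensate for the show endpoint apparently not echoing the model name back: GetModel copies it from the request argument, so the returned metadata is no longer nameless. Illustrative effect (the Name accessor on the returned value is an assumption about the llm.Model interface):

	model, err := client.GetModel(ctx, "qwen:0.5b")
	if err == nil {
		log.Println(model.Name()) // now "qwen:0.5b" rather than empty
	}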

pkg/ollama/opt.go
Lines changed: 24 additions & 3 deletions

@@ -91,6 +91,15 @@ func optFormat(opts *llm.Opts) string {
 	return opts.GetString("format")
 }
 
+func optStopSequence(opts *llm.Opts) []string {
+	if opts.Has("stop") {
+		if stop, ok := opts.Get("stop").([]string); ok {
+			return stop
+		}
+	}
+	return nil
+}
+
 func optOptions(opts *llm.Opts) map[string]any {
 	result := make(map[string]any)
 	if o, ok := opts.Get("options").(map[string]any); ok {
@@ -101,13 +110,25 @@ func optOptions(opts *llm.Opts) map[string]any {
 
 	// copy across temperature, top_p and top_k
 	if opts.Has("temperature") {
-		result["temperature"] = opts.Get("temperature")
+		result["temperature"] = opts.Get("temperature").(float64)
 	}
 	if opts.Has("top_p") {
-		result["top_p"] = opts.Get("top_p")
+		result["top_p"] = opts.GetFloat64("top_p")
 	}
 	if opts.Has("top_k") {
-		result["top_k"] = opts.Get("top_k")
+		result["top_k"] = opts.GetUint64("top_k")
+	}
+	if opts.Has("stop") {
+		result["stop"] = opts.Get("stop").([]string)
+	}
+	if opts.Has("seed") {
+		result["seed"] = opts.GetUint64("seed")
+	}
+	if opts.Has("presence_penalty") {
+		result["presence_penalty"] = opts.GetFloat64("presence_penalty")
+	}
+	if opts.Has("frequency_penalty") {
+		result["frequency_penalty"] = opts.GetFloat64("frequency_penalty")
 	}
 
 	// Return result
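With these additions optOptions forwards seed, stop and both penalties into Ollama's per-request options map, and the values are copied with concrete types (float64, uint64, []string) rather than raw any; note that the bare type assertions for temperature and stop will panic rather than return an error if an option was stored with another type, unlike the GetFloat64/GetUint64 accessors used for the other keys, and that optStopSequence is added here without a visible call site in this hunk. A hedged sketch of the net effect (the ApplyOpts helper name is hypothetical; the key/type mapping follows the code above):

	// Hypothetical helper; only the resulting key/value mapping is from the diff.
	opts, _ := llm.ApplyOpts(
		llm.WithTemperature(0.5),
		llm.WithSeed(42),
		llm.WithStopSequence("sky"),
	)
	options := optOptions(opts) // unexported, callable only within pkg/ollama
	// options == map[string]any{"temperature": 0.5, "seed": uint64(42), "stop": []string{"sky"}}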
