
Commit 9f926b2

feat(api)!: fixes to remove deprecated inference resources
1 parent 222bb4e commit 9f926b2

7 files changed: +284 −528 lines changed

.stats.yml

Lines changed: 1 addition & 1 deletion

@@ -1,4 +1,4 @@
 configured_endpoints: 105
 openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/llamastack%2Fllama-stack-client-adcfaad1990d45e42b20e200a9ecc35ee32df5692bd9cd18ae898b0b7728c919.yml
 openapi_spec_hash: 4f532287bafe5da0578a1c1a5e31c952
-config_hash: 7ec5a583f9c26b38993013bdfb0e7d46
+config_hash: 5b643c97c83a497d7d346253f1e175f3

README.md

Lines changed: 7 additions & 52 deletions
@@ -265,7 +265,7 @@ client := llamastackclient.NewClient(
 	option.WithHeader("X-Some-Header", "custom_header_info"),
 )

-client.Inference.ChatCompletion(context.TODO(), ...,
+client.Toolgroups.List(context.TODO(), ...,
 	// Override the header
 	option.WithHeader("X-Some-Header", "some_other_custom_header_info"),
 	// Add an undocumented field to the request body, using sjson syntax
@@ -296,23 +296,14 @@ When the API returns a non-success status code, we return an error with type
 To handle errors, we recommend that you use the `errors.As` pattern:

 ```go
-_, err := client.Inference.ChatCompletion(context.TODO(), llamastackclient.InferenceChatCompletionParams{
-	Messages: []llamastackclient.MessageUnionParam{{
-		OfUser: &llamastackclient.UserMessageParam{
-			Content: llamastackclient.InterleavedContentUnionParam{
-				OfString: llamastackclient.String("string"),
-			},
-		},
-	}},
-	ModelID: "model_id",
-})
+_, err := client.Toolgroups.List(context.TODO())
 if err != nil {
 	var apierr *llamastackclient.Error
 	if errors.As(err, &apierr) {
 		println(string(apierr.DumpRequest(true)))  // Prints the serialized HTTP request
 		println(string(apierr.DumpResponse(true))) // Prints the serialized HTTP response
 	}
-	panic(err.Error()) // GET "/v1/inference/chat-completion": 400 Bad Request { ... }
+	panic(err.Error()) // GET "/v1/toolgroups": 400 Bad Request { ... }
 }
 ```
@@ -330,18 +321,8 @@ To set a per-retry timeout, use `option.WithRequestTimeout()`.
 // This sets the timeout for the request, including all the retries.
 ctx, cancel := context.WithTimeout(context.Background(), 5*time.Minute)
 defer cancel()
-client.Inference.ChatCompletion(
+client.Toolgroups.List(
 	ctx,
-	llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	},
 	// This sets the per-retry timeout
 	option.WithRequestTimeout(20*time.Second),
 )
@@ -393,20 +374,7 @@ client := llamastackclient.NewClient(
 )

 // Override per-request:
-client.Inference.ChatCompletion(
-	context.TODO(),
-	llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	},
-	option.WithMaxRetries(5),
-)
+client.Toolgroups.List(context.TODO(), option.WithMaxRetries(5))
 ```

 ### Accessing raw response data (e.g. response headers)
@@ -417,24 +385,11 @@ you need to examine response headers, status codes, or other details.
 ```go
 // Create a variable to store the HTTP response
 var response *http.Response
-chatCompletionResponse, err := client.Inference.ChatCompletion(
-	context.TODO(),
-	llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	},
-	option.WithResponseInto(&response),
-)
+toolGroups, err := client.Toolgroups.List(context.TODO(), option.WithResponseInto(&response))
 if err != nil {
 	// handle error
 }
-fmt.Printf("%+v\n", chatCompletionResponse)
+fmt.Printf("%+v\n", toolGroups)

 fmt.Printf("Status Code: %d\n", response.StatusCode)
 fmt.Printf("Headers: %+#v\n", response.Header)

api.md

Lines changed: 2 additions & 6 deletions
@@ -12,19 +12,16 @@
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#SamplingParams">SamplingParams</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#SystemMessageParam">SystemMessageParam</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ToolCallParam">ToolCallParam</a>
-- <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ToolParamDefinition">ToolParamDefinition</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ToolResponseMessageParam">ToolResponseMessageParam</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#UserMessageParam">UserMessageParam</a>

 # Shared Response Types

 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#AgentConfig">AgentConfig</a>
-- <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ChatCompletionResponse">ChatCompletionResponse</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#CompletionMessage">CompletionMessage</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ContentDeltaUnion">ContentDeltaUnion</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InterleavedContentUnion">InterleavedContentUnion</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InterleavedContentItemUnion">InterleavedContentItemUnion</a>
-- <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#Metric">Metric</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#QueryResult">QueryResult</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ResponseFormatUnion">ResponseFormatUnion</a>
 - <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#SafetyViolation">SafetyViolation</a>
@@ -236,12 +233,11 @@ Methods:

 Response Types:

-- <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ChatCompletionResponseStreamChunk">ChatCompletionResponseStreamChunk</a>
-- <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#TokenLogProbs">TokenLogProbs</a>
+- <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InferenceRerankResponse">InferenceRerankResponse</a>

 Methods:

-- <code title="post /v1/inference/chat-completion">client.Inference.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InferenceService.ChatCompletion">ChatCompletion</a>(ctx <a href="https://pkg.go.dev/context">context</a>.<a href="https://pkg.go.dev/context#Context">Context</a>, body <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InferenceChatCompletionParams">InferenceChatCompletionParams</a>) (<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#ChatCompletionResponse">ChatCompletionResponse</a>, <a href="https://pkg.go.dev/builtin#error">error</a>)</code>
+- <code title="post /v1alpha/inference/rerank">client.Inference.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InferenceService.Rerank">Rerank</a>(ctx <a href="https://pkg.go.dev/context">context</a>.<a href="https://pkg.go.dev/context#Context">Context</a>, body <a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InferenceRerankParams">InferenceRerankParams</a>) ([]<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go">llamastackclient</a>.<a href="https://pkg.go.dev/github.com/llamastack/llama-stack-client-go#InferenceRerankResponse">InferenceRerankResponse</a>, <a href="https://pkg.go.dev/builtin#error">error</a>)</code>

 # Embeddings
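The api.md hunk above gives the full signature of the replacement endpoint: `Rerank` takes an `InferenceRerankParams` body and returns `[]InferenceRerankResponse`. A minimal sketch of a call under that signature; the fields of `InferenceRerankParams` are not shown in this diff, so the params are left at their zero value, and the `main` scaffolding and zero-argument `NewClient()` are illustrative assumptions:

```go
package main

import (
	"context"
	"fmt"

	llamastackclient "github.com/llamastack/llama-stack-client-go"
)

func main() {
	client := llamastackclient.NewClient()

	// InferenceRerankParams is left at its zero value here because its fields
	// are not shown in this diff; fill them in from the SDK documentation.
	results, err := client.Inference.Rerank(context.TODO(), llamastackclient.InferenceRerankParams{})
	if err != nil {
		panic(err)
	}
	// Per the signature above, Rerank returns a slice of InferenceRerankResponse.
	for _, r := range results {
		fmt.Printf("%+v\n", r)
	}
}
```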

client_test.go

Lines changed: 19 additions & 99 deletions
@@ -38,16 +38,7 @@ func TestUserAgentHeader(t *testing.T) {
 			},
 		}),
 	)
-	client.Inference.ChatCompletion(context.Background(), llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	client.Toolgroups.List(context.Background())
 	if userAgent != fmt.Sprintf("LlamaStackClient/Go %s", internal.PackageVersion) {
 		t.Errorf("Expected User-Agent to be correct, but got: %#v", userAgent)
 	}
@@ -70,16 +61,7 @@ func TestRetryAfter(t *testing.T) {
 			},
 		}),
 	)
-	_, err := client.Inference.ChatCompletion(context.Background(), llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	_, err := client.Toolgroups.List(context.Background())
 	if err == nil {
 		t.Error("Expected there to be a cancel error")
 	}
@@ -113,16 +95,7 @@ func TestDeleteRetryCountHeader(t *testing.T) {
 		}),
 		option.WithHeaderDel("X-Stainless-Retry-Count"),
 	)
-	_, err := client.Inference.ChatCompletion(context.Background(), llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	_, err := client.Toolgroups.List(context.Background())
 	if err == nil {
 		t.Error("Expected there to be a cancel error")
 	}
@@ -151,16 +124,7 @@ func TestOverwriteRetryCountHeader(t *testing.T) {
 		}),
 		option.WithHeader("X-Stainless-Retry-Count", "42"),
 	)
-	_, err := client.Inference.ChatCompletion(context.Background(), llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	_, err := client.Toolgroups.List(context.Background())
 	if err == nil {
 		t.Error("Expected there to be a cancel error")
 	}
@@ -188,16 +152,7 @@ func TestRetryAfterMs(t *testing.T) {
 			},
 		}),
 	)
-	_, err := client.Inference.ChatCompletion(context.Background(), llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	_, err := client.Toolgroups.List(context.Background())
 	if err == nil {
 		t.Error("Expected there to be a cancel error")
 	}
@@ -219,16 +174,7 @@ func TestContextCancel(t *testing.T) {
 	)
 	cancelCtx, cancel := context.WithCancel(context.Background())
 	cancel()
-	_, err := client.Inference.ChatCompletion(cancelCtx, llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	_, err := client.Toolgroups.List(cancelCtx)
 	if err == nil {
 		t.Error("Expected there to be a cancel error")
 	}
@@ -247,16 +193,7 @@ func TestContextCancelDelay(t *testing.T) {
 	)
 	cancelCtx, cancel := context.WithTimeout(context.Background(), 2*time.Millisecond)
 	defer cancel()
-	_, err := client.Inference.ChatCompletion(cancelCtx, llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	_, err := client.Toolgroups.List(cancelCtx)
 	if err == nil {
 		t.Error("expected there to be a cancel error")
 	}
@@ -281,16 +218,7 @@ func TestContextDeadline(t *testing.T) {
 			},
 		}),
 	)
-	_, err := client.Inference.ChatCompletion(deadlineCtx, llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
-	})
+	_, err := client.Toolgroups.List(deadlineCtx)
 	if err == nil {
 		t.Error("expected there to be a deadline error")
 	}
@@ -334,15 +262,11 @@ func TestContextDeadlineStreaming(t *testing.T) {
 			},
 		}),
 	)
-	stream := client.Inference.ChatCompletionStreaming(deadlineCtx, llamastackclient.InferenceChatCompletionParams{
-		Messages: []llamastackclient.MessageUnionParam{{
-			OfUser: &llamastackclient.UserMessageParam{
-				Content: llamastackclient.InterleavedContentUnionParam{
-					OfString: llamastackclient.String("string"),
-				},
-			},
-		}},
-		ModelID: "model_id",
+	stream := client.Responses.NewStreaming(deadlineCtx, llamastackclient.ResponseNewParams{
+		Input: llamastackclient.ResponseNewParamsInputUnion{
+			OfString: llamastackclient.String("string"),
+		},
+		Model: "model",
 	})
 	for stream.Next() {
 		_ = stream.Current()
@@ -387,17 +311,13 @@ func TestContextDeadlineStreamingWithRequestTimeout(t *testing.T) {
 			},
 		}),
 	)
-	stream := client.Inference.ChatCompletionStreaming(
+	stream := client.Responses.NewStreaming(
 		context.Background(),
-		llamastackclient.InferenceChatCompletionParams{
-			Messages: []llamastackclient.MessageUnionParam{{
-				OfUser: &llamastackclient.UserMessageParam{
-					Content: llamastackclient.InterleavedContentUnionParam{
-						OfString: llamastackclient.String("string"),
-					},
-				},
-			}},
-			ModelID: "model_id",
+		llamastackclient.ResponseNewParams{
+			Input: llamastackclient.ResponseNewParamsInputUnion{
+				OfString: llamastackclient.String("string"),
+			},
+			Model: "model",
 		},
 		option.WithRequestTimeout((100 * time.Millisecond)),
 	)
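For reference, here is the streaming pattern the tests now exercise, assembled into one runnable sketch from the fragments above. The `stream.Err()` check after the loop is an assumption based on the usual Go streaming-iterator convention; the diff itself shows only `Next()` and `Current()`, and the zero-argument `NewClient()` is likewise illustrative:

```go
package main

import (
	"context"
	"fmt"

	llamastackclient "github.com/llamastack/llama-stack-client-go"
)

func main() {
	client := llamastackclient.NewClient()

	// Streaming now goes through Responses.NewStreaming rather than the
	// removed Inference.ChatCompletionStreaming; params mirror the test fixture.
	stream := client.Responses.NewStreaming(context.Background(), llamastackclient.ResponseNewParams{
		Input: llamastackclient.ResponseNewParamsInputUnion{
			OfString: llamastackclient.String("string"),
		},
		Model: "model",
	})
	for stream.Next() {
		fmt.Printf("%+v\n", stream.Current()) // one chunk per streamed event
	}
	// Assumed error check after iteration; not shown in this diff.
	if err := stream.Err(); err != nil {
		panic(err)
	}
}
```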
