@@ -65,6 +65,9 @@ def benchmarks(self) -> BenchmarksResource:
6565
6666 @cached_property
def eval(self) -> EvalResource:
    """
    Entry point to the Llama Stack Evaluation API, which runs evaluations
    against model and agent candidates.

    The returned resource is constructed from this object's ``_client``.
    """
    client = self._client
    return EvalResource(client)
6972
7073 @cached_property
@@ -73,6 +76,14 @@ def admin(self) -> AdminResource:
7376
7477 @cached_property
def inference(self) -> InferenceResource:
    """
    Entry point to the Llama Stack Inference API: completions, chat completions,
    and embeddings.

    This is the raw interface to the underlying models. Three kinds of models
    are supported:
    - LLM models: produce "raw" and "chat" (conversational) completions.
    - Embedding models: produce embeddings used for semantic search.
    - Rerank models: reorder documents by their relevance to a query.

    The returned resource is constructed from this object's ``_client``.
    """
    client = self._client
    return InferenceResource(client)
7788
7889 @cached_property
@@ -106,6 +117,9 @@ def benchmarks(self) -> AsyncBenchmarksResource:
106117
107118 @cached_property
def eval(self) -> AsyncEvalResource:
    """
    Async entry point to the Llama Stack Evaluation API, which runs evaluations
    against model and agent candidates.

    The returned resource is constructed from this object's ``_client``.
    """
    client = self._client
    return AsyncEvalResource(client)
110124
111125 @cached_property
@@ -114,6 +128,14 @@ def admin(self) -> AsyncAdminResource:
114128
115129 @cached_property
def inference(self) -> AsyncInferenceResource:
    """
    Async entry point to the Llama Stack Inference API: completions, chat
    completions, and embeddings.

    This is the raw interface to the underlying models. Three kinds of models
    are supported:
    - LLM models: produce "raw" and "chat" (conversational) completions.
    - Embedding models: produce embeddings used for semantic search.
    - Rerank models: reorder documents by their relevance to a query.

    The returned resource is constructed from this object's ``_client``.
    """
    client = self._client
    return AsyncInferenceResource(client)
118140
119141 @cached_property
@@ -150,6 +172,9 @@ def benchmarks(self) -> BenchmarksResourceWithRawResponse:
150172
151173 @cached_property
def eval(self) -> EvalResourceWithRawResponse:
    """
    Raw-response wrapper for the Llama Stack Evaluation API, which runs
    evaluations against model and agent candidates.

    Wraps the ``eval`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.eval
    return EvalResourceWithRawResponse(wrapped)
154179
155180 @cached_property
@@ -158,6 +183,14 @@ def admin(self) -> AdminResourceWithRawResponse:
158183
159184 @cached_property
def inference(self) -> InferenceResourceWithRawResponse:
    """
    Raw-response wrapper for the Llama Stack Inference API: completions, chat
    completions, and embeddings.

    This is the raw interface to the underlying models. Three kinds of models
    are supported:
    - LLM models: produce "raw" and "chat" (conversational) completions.
    - Embedding models: produce embeddings used for semantic search.
    - Rerank models: reorder documents by their relevance to a query.

    Wraps the ``inference`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.inference
    return InferenceResourceWithRawResponse(wrapped)
162195
163196
@@ -175,6 +208,9 @@ def benchmarks(self) -> AsyncBenchmarksResourceWithRawResponse:
175208
176209 @cached_property
def eval(self) -> AsyncEvalResourceWithRawResponse:
    """
    Async raw-response wrapper for the Llama Stack Evaluation API, which runs
    evaluations against model and agent candidates.

    Wraps the ``eval`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.eval
    return AsyncEvalResourceWithRawResponse(wrapped)
179215
180216 @cached_property
@@ -183,6 +219,14 @@ def admin(self) -> AsyncAdminResourceWithRawResponse:
183219
184220 @cached_property
def inference(self) -> AsyncInferenceResourceWithRawResponse:
    """
    Async raw-response wrapper for the Llama Stack Inference API: completions,
    chat completions, and embeddings.

    This is the raw interface to the underlying models. Three kinds of models
    are supported:
    - LLM models: produce "raw" and "chat" (conversational) completions.
    - Embedding models: produce embeddings used for semantic search.
    - Rerank models: reorder documents by their relevance to a query.

    Wraps the ``inference`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.inference
    return AsyncInferenceResourceWithRawResponse(wrapped)
187231
188232
@@ -200,6 +244,9 @@ def benchmarks(self) -> BenchmarksResourceWithStreamingResponse:
200244
201245 @cached_property
def eval(self) -> EvalResourceWithStreamingResponse:
    """
    Streaming-response wrapper for the Llama Stack Evaluation API, which runs
    evaluations against model and agent candidates.

    Wraps the ``eval`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.eval
    return EvalResourceWithStreamingResponse(wrapped)
204251
205252 @cached_property
@@ -208,6 +255,14 @@ def admin(self) -> AdminResourceWithStreamingResponse:
208255
209256 @cached_property
def inference(self) -> InferenceResourceWithStreamingResponse:
    """
    Streaming-response wrapper for the Llama Stack Inference API: completions,
    chat completions, and embeddings.

    This is the raw interface to the underlying models. Three kinds of models
    are supported:
    - LLM models: produce "raw" and "chat" (conversational) completions.
    - Embedding models: produce embeddings used for semantic search.
    - Rerank models: reorder documents by their relevance to a query.

    Wraps the ``inference`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.inference
    return InferenceResourceWithStreamingResponse(wrapped)
212267
213268
@@ -225,6 +280,9 @@ def benchmarks(self) -> AsyncBenchmarksResourceWithStreamingResponse:
225280
226281 @cached_property
def eval(self) -> AsyncEvalResourceWithStreamingResponse:
    """
    Async streaming-response wrapper for the Llama Stack Evaluation API, which
    runs evaluations against model and agent candidates.

    Wraps the ``eval`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.eval
    return AsyncEvalResourceWithStreamingResponse(wrapped)
229287
230288 @cached_property
@@ -233,4 +291,12 @@ def admin(self) -> AsyncAdminResourceWithStreamingResponse:
233291
234292 @cached_property
def inference(self) -> AsyncInferenceResourceWithStreamingResponse:
    """
    Async streaming-response wrapper for the Llama Stack Inference API:
    completions, chat completions, and embeddings.

    This is the raw interface to the underlying models. Three kinds of models
    are supported:
    - LLM models: produce "raw" and "chat" (conversational) completions.
    - Embedding models: produce embeddings used for semantic search.
    - Rerank models: reorder documents by their relevance to a query.

    Wraps the ``inference`` resource taken from this object's ``_alpha`` attribute.
    """
    wrapped = self._alpha.inference
    return AsyncInferenceResourceWithStreamingResponse(wrapped)
0 commit comments