from llama_stack_client.types import (
AgentConfig,
BatchCompletion,
ChatCompletionResponse,
CompletionMessage,
ContentDelta,
Document,
InterleavedContent,
InterleavedContentItem,
Message,
Metric,
ParamType,
QueryConfig,
QueryGeneratorConfig,
QueryResult,
ResponseFormat,
SafetyViolation,
SamplingParams,
ScoringResult,
SystemMessage,
ToolCall,
ToolParamDefinition,
ToolResponseMessage,
UserMessage,
)
Types:
from llama_stack_client.types import ListToolGroupsResponse, ToolGroup, ToolgroupListResponse
Methods:
client.toolgroups.list() -> ToolgroupListResponse
client.toolgroups.get(toolgroup_id) -> ToolGroup
client.toolgroups.register(**params) -> None
client.toolgroups.unregister(toolgroup_id) -> None
Types:
from llama_stack_client.types import ListToolsResponse, Tool, ToolListResponse
Methods:
client.tools.list(**params) -> ToolListResponse
client.tools.get(tool_name) -> Tool
Types:
from llama_stack_client.types import ToolDef, ToolInvocationResult, ToolRuntimeListToolsResponse
Methods:
client.tool_runtime.invoke_tool(**params) -> ToolInvocationResult
client.tool_runtime.list_tools(**params) -> ToolRuntimeListToolsResponse
Methods:
client.tool_runtime.rag_tool.insert(**params) -> None
client.tool_runtime.rag_tool.query(**params) -> QueryResult
Types:
from llama_stack_client.types import ResponseObject, ResponseObjectStream, ResponseListResponse
Methods:
client.responses.create(**params) -> ResponseObject
client.responses.retrieve(response_id) -> ResponseObject
client.responses.list(**params) -> SyncOpenAICursorPage[ResponseListResponse]
Types:
from llama_stack_client.types.responses import InputItemListResponse
Methods:
client.responses.input_items.list(response_id, **params) -> InputItemListResponse
Types:
from llama_stack_client.types import (
InferenceStep,
MemoryRetrievalStep,
ShieldCallStep,
ToolExecutionStep,
ToolResponse,
AgentCreateResponse,
AgentRetrieveResponse,
AgentListResponse,
)
Methods:
client.agents.create(**params) -> AgentCreateResponse
client.agents.retrieve(agent_id) -> AgentRetrieveResponse
client.agents.list(**params) -> AgentListResponse
client.agents.delete(agent_id) -> None
Types:
from llama_stack_client.types.agents import Session, SessionCreateResponse, SessionListResponse
Methods:
client.agents.session.create(agent_id, **params) -> SessionCreateResponse
client.agents.session.retrieve(session_id, *, agent_id, **params) -> Session
client.agents.session.list(agent_id, **params) -> SessionListResponse
client.agents.session.delete(session_id, *, agent_id) -> None
Types:
from llama_stack_client.types.agents import StepRetrieveResponse
Methods:
client.agents.steps.retrieve(step_id, *, agent_id, session_id, turn_id) -> StepRetrieveResponse
Types:
from llama_stack_client.types.agents import (
AgentTurnResponseStreamChunk,
Turn,
TurnResponseEvent,
TurnResponseEventPayload,
)
Methods:
client.agents.turn.create(session_id, *, agent_id, **params) -> Turn
client.agents.turn.retrieve(turn_id, *, agent_id, session_id) -> Turn
client.agents.turn.resume(turn_id, *, agent_id, session_id, **params) -> Turn
Types:
from llama_stack_client.types import (
ListDatasetsResponse,
DatasetRetrieveResponse,
DatasetListResponse,
DatasetIterrowsResponse,
DatasetRegisterResponse,
)
Methods:
client.datasets.retrieve(dataset_id) -> DatasetRetrieveResponse
client.datasets.list() -> DatasetListResponse
client.datasets.appendrows(dataset_id, **params) -> None
client.datasets.iterrows(dataset_id, **params) -> DatasetIterrowsResponse
client.datasets.register(**params) -> DatasetRegisterResponse
client.datasets.unregister(dataset_id) -> None
Types:
from llama_stack_client.types import BenchmarkConfig, EvalCandidate, EvaluateResponse, Job
Methods:
client.eval.evaluate_rows(benchmark_id, **params) -> EvaluateResponse
client.eval.evaluate_rows_alpha(benchmark_id, **params) -> EvaluateResponse
client.eval.run_eval(benchmark_id, **params) -> Job
client.eval.run_eval_alpha(benchmark_id, **params) -> Job
Methods:
client.eval.jobs.retrieve(job_id, *, benchmark_id) -> EvaluateResponse
client.eval.jobs.cancel(job_id, *, benchmark_id) -> None
client.eval.jobs.status(job_id, *, benchmark_id) -> Job
Types:
from llama_stack_client.types import HealthInfo, ProviderInfo, RouteInfo, VersionInfo
Methods:
client.inspect.health() -> HealthInfo
client.inspect.version() -> VersionInfo
Types:
from llama_stack_client.types import (
ChatCompletionResponseStreamChunk,
CompletionResponse,
EmbeddingsResponse,
TokenLogProbs,
InferenceBatchChatCompletionResponse,
)
Methods:
client.inference.batch_chat_completion(**params) -> InferenceBatchChatCompletionResponse
client.inference.batch_completion(**params) -> BatchCompletion
client.inference.chat_completion(**params) -> ChatCompletionResponse
client.inference.completion(**params) -> CompletionResponse
client.inference.embeddings(**params) -> EmbeddingsResponse
Types:
from llama_stack_client.types import CreateEmbeddingsResponse
Methods:
client.embeddings.create(**params) -> CreateEmbeddingsResponse
Types:
from llama_stack_client.types import ChatCompletionChunk
Types:
from llama_stack_client.types.chat import (
CompletionCreateResponse,
CompletionRetrieveResponse,
CompletionListResponse,
)
Methods:
client.chat.completions.create(**params) -> CompletionCreateResponse
client.chat.completions.retrieve(completion_id) -> CompletionRetrieveResponse
client.chat.completions.list(**params) -> SyncOpenAICursorPage[CompletionListResponse]
Types:
from llama_stack_client.types import CompletionCreateResponse
Methods:
client.completions.create(**params) -> CompletionCreateResponse
Types:
from llama_stack_client.types import QueryChunksResponse
Methods:
client.vector_io.insert(**params) -> None
client.vector_io.query(**params) -> QueryChunksResponse
Types:
from llama_stack_client.types import (
ListVectorDBsResponse,
VectorDBRetrieveResponse,
VectorDBListResponse,
VectorDBRegisterResponse,
)
Methods:
client.vector_dbs.retrieve(vector_db_id) -> VectorDBRetrieveResponse
client.vector_dbs.list() -> VectorDBListResponse
client.vector_dbs.register(**params) -> VectorDBRegisterResponse
client.vector_dbs.unregister(vector_db_id) -> None
Types:
from llama_stack_client.types import (
ListVectorStoresResponse,
VectorStore,
VectorStoreDeleteResponse,
VectorStoreSearchResponse,
)
Methods:
client.vector_stores.create(**params) -> VectorStore
client.vector_stores.retrieve(vector_store_id) -> VectorStore
client.vector_stores.update(vector_store_id, **params) -> VectorStore
client.vector_stores.list(**params) -> SyncOpenAICursorPage[VectorStore]
client.vector_stores.delete(vector_store_id) -> VectorStoreDeleteResponse
client.vector_stores.search(vector_store_id, **params) -> VectorStoreSearchResponse
Types:
from llama_stack_client.types.vector_stores import (
VectorStoreFile,
FileDeleteResponse,
FileContentResponse,
)
Methods:
client.vector_stores.files.create(vector_store_id, **params) -> VectorStoreFile
client.vector_stores.files.retrieve(file_id, *, vector_store_id) -> VectorStoreFile
client.vector_stores.files.update(file_id, *, vector_store_id, **params) -> VectorStoreFile
client.vector_stores.files.list(vector_store_id, **params) -> SyncOpenAICursorPage[VectorStoreFile]
client.vector_stores.files.delete(file_id, *, vector_store_id) -> FileDeleteResponse
client.vector_stores.files.content(file_id, *, vector_store_id) -> FileContentResponse
Types:
from llama_stack_client.types import ListModelsResponse, Model, ModelListResponse
Methods:
client.models.retrieve(model_id) -> Model
client.models.list() -> ModelListResponse
client.models.register(**params) -> Model
client.models.unregister(model_id) -> None
Types:
from llama_stack_client.types import AlgorithmConfig, ListPostTrainingJobsResponse, PostTrainingJob
Methods:
client.post_training.preference_optimize(**params) -> PostTrainingJob
client.post_training.supervised_fine_tune(**params) -> PostTrainingJob
Types:
from llama_stack_client.types.post_training import (
JobListResponse,
JobArtifactsResponse,
JobStatusResponse,
)
Methods:
client.post_training.job.list() -> List[Data]
client.post_training.job.artifacts(**params) -> JobArtifactsResponse
client.post_training.job.cancel(**params) -> None
client.post_training.job.status(**params) -> JobStatusResponse
Types:
from llama_stack_client.types import ListProvidersResponse, ProviderListResponse
Methods:
client.providers.retrieve(provider_id) -> ProviderInfo
client.providers.list() -> ProviderListResponse
Types:
from llama_stack_client.types import ListRoutesResponse, RouteListResponse
Methods:
client.routes.list() -> RouteListResponse
Types:
from llama_stack_client.types import CreateResponse
Methods:
client.moderations.create(**params) -> CreateResponse
Types:
from llama_stack_client.types import RunShieldResponse
Methods:
client.safety.run_shield(**params) -> RunShieldResponse
Types:
from llama_stack_client.types import ListShieldsResponse, Shield, ShieldListResponse
Methods:
client.shields.retrieve(identifier) -> Shield
client.shields.list() -> ShieldListResponse
client.shields.register(**params) -> Shield
Types:
from llama_stack_client.types import SyntheticDataGenerationResponse
Methods:
client.synthetic_data_generation.generate(**params) -> SyntheticDataGenerationResponse
Types:
from llama_stack_client.types import (
Event,
QueryCondition,
QuerySpansResponse,
SpanWithStatus,
Trace,
TelemetryGetSpanResponse,
TelemetryGetSpanTreeResponse,
TelemetryQueryMetricsResponse,
TelemetryQuerySpansResponse,
TelemetryQueryTracesResponse,
)
Methods:
client.telemetry.get_span(span_id, *, trace_id) -> TelemetryGetSpanResponse
client.telemetry.get_span_tree(span_id, **params) -> TelemetryGetSpanTreeResponse
client.telemetry.get_trace(trace_id) -> Trace
client.telemetry.log_event(**params) -> None
client.telemetry.query_metrics(metric_name, **params) -> TelemetryQueryMetricsResponse
client.telemetry.query_spans(**params) -> TelemetryQuerySpansResponse
client.telemetry.query_traces(**params) -> TelemetryQueryTracesResponse
client.telemetry.save_spans_to_dataset(**params) -> None
Types:
from llama_stack_client.types import ScoringScoreResponse, ScoringScoreBatchResponse
Methods:
client.scoring.score(**params) -> ScoringScoreResponse
client.scoring.score_batch(**params) -> ScoringScoreBatchResponse
Types:
from llama_stack_client.types import (
ListScoringFunctionsResponse,
ScoringFn,
ScoringFnParams,
ScoringFunctionListResponse,
)
Methods:
client.scoring_functions.retrieve(scoring_fn_id) -> ScoringFn
client.scoring_functions.list() -> ScoringFunctionListResponse
client.scoring_functions.register(**params) -> None
Types:
from llama_stack_client.types import Benchmark, ListBenchmarksResponse, BenchmarkListResponse
Methods:
client.benchmarks.retrieve(benchmark_id) -> Benchmark
client.benchmarks.list() -> BenchmarkListResponse
client.benchmarks.register(**params) -> None
Types:
from llama_stack_client.types import DeleteFileResponse, File, ListFilesResponse
Methods: