diff --git a/docs/openapi_generator/generate.py b/docs/openapi_generator/generate.py
index 3aa7ea6dc..a82b3db76 100644
--- a/docs/openapi_generator/generate.py
+++ b/docs/openapi_generator/generate.py
@@ -52,13 +52,11 @@ def main(output_dir: str):
Options(
server=Server(url="http://any-hosted-llama-stack.com"),
info=Info(
- title="[DRAFT] Llama Stack Specification",
+ title="Llama Stack Specification",
version=LLAMA_STACK_API_VERSION,
- description="""This is the specification of the llama stack that provides
+ description="""This is the specification of the Llama Stack that provides
a set of endpoints and their corresponding interfaces that are tailored to
- best leverage Llama Models. The specification is still in draft and subject to change.
- Generated at """
- + now,
+ best leverage Llama Models.""",
),
),
)
diff --git a/docs/openapi_generator/pyopenapi/generator.py b/docs/openapi_generator/pyopenapi/generator.py
index 2e1fbb856..66424ab15 100644
--- a/docs/openapi_generator/pyopenapi/generator.py
+++ b/docs/openapi_generator/pyopenapi/generator.py
@@ -438,6 +438,14 @@ def _build_extra_tag_groups(
return extra_tags
def _build_operation(self, op: EndpointOperation) -> Operation:
+ if op.defining_class.__name__ in [
+ "SyntheticDataGeneration",
+ "PostTraining",
+ "BatchInference",
+ ]:
+ op.defining_class.__name__ = f"{op.defining_class.__name__} (Coming Soon)"
+ print(op.defining_class.__name__)
+
doc_string = parse_type(op.func_ref)
doc_params = dict(
(param.name, param.description) for param in doc_string.params.values()
diff --git a/docs/requirements.txt b/docs/requirements.txt
index 464dde187..c182f41c4 100644
--- a/docs/requirements.txt
+++ b/docs/requirements.txt
@@ -7,3 +7,5 @@ sphinx-pdj-theme
sphinx-copybutton
sphinx-tabs
sphinx-design
+sphinxcontrib-openapi
+sphinxcontrib-redoc
diff --git a/docs/resources/llama-stack-spec.html b/docs/resources/llama-stack-spec.html
index cf4bf5125..090253804 100644
--- a/docs/resources/llama-stack-spec.html
+++ b/docs/resources/llama-stack-spec.html
@@ -19,9 +19,9 @@
spec = {
"openapi": "3.1.0",
"info": {
- "title": "[DRAFT] Llama Stack Specification",
+ "title": "Llama Stack Specification",
"version": "alpha",
- "description": "This is the specification of the llama stack that provides\n a set of endpoints and their corresponding interfaces that are tailored to\n best leverage Llama Models. The specification is still in draft and subject to change.\n Generated at 2024-11-19 09:14:01.145131"
+ "description": "This is the specification of the Llama Stack that provides\n a set of endpoints and their corresponding interfaces that are tailored to\n best leverage Llama Models. Generated at 2024-11-22 17:23:55.034164"
},
"servers": [
{
@@ -44,7 +44,7 @@
}
},
"tags": [
- "BatchInference"
+ "BatchInference (Coming Soon)"
],
"parameters": [
{
@@ -84,7 +84,7 @@
}
},
"tags": [
- "BatchInference"
+ "BatchInference (Coming Soon)"
],
"parameters": [
{
@@ -117,7 +117,7 @@
}
},
"tags": [
- "PostTraining"
+ "PostTraining (Coming Soon)"
],
"parameters": [
{
@@ -1079,7 +1079,7 @@
}
},
"tags": [
- "PostTraining"
+ "PostTraining (Coming Soon)"
],
"parameters": [
{
@@ -1117,7 +1117,7 @@
}
},
"tags": [
- "PostTraining"
+ "PostTraining (Coming Soon)"
],
"parameters": [
{
@@ -1155,7 +1155,7 @@
}
},
"tags": [
- "PostTraining"
+ "PostTraining (Coming Soon)"
],
"parameters": [
{
@@ -1193,7 +1193,7 @@
}
},
"tags": [
- "PostTraining"
+ "PostTraining (Coming Soon)"
],
"parameters": [
{
@@ -1713,7 +1713,7 @@
}
},
"tags": [
- "PostTraining"
+ "PostTraining (Coming Soon)"
],
"parameters": [
{
@@ -2161,7 +2161,7 @@
}
},
"tags": [
- "PostTraining"
+ "PostTraining (Coming Soon)"
],
"parameters": [
{
@@ -2201,7 +2201,7 @@
}
},
"tags": [
- "SyntheticDataGeneration"
+ "SyntheticDataGeneration (Coming Soon)"
],
"parameters": [
{
@@ -3861,7 +3861,8 @@
"type": "string",
"enum": [
"bing",
- "brave"
+ "brave",
+ "tavily"
],
"default": "brave"
},
@@ -8002,7 +8003,7 @@
"description": ""
},
{
- "name": "BatchInference"
+ "name": "BatchInference (Coming Soon)"
},
{
"name": "BenchmarkEvalTaskConfig",
@@ -8256,7 +8257,7 @@
"description": ""
},
{
- "name": "PostTraining"
+ "name": "PostTraining (Coming Soon)"
},
{
"name": "PostTrainingJob",
@@ -8447,7 +8448,7 @@
"description": ""
},
{
- "name": "SyntheticDataGeneration"
+ "name": "SyntheticDataGeneration (Coming Soon)"
},
{
"name": "SyntheticDataGenerationResponse",
@@ -8558,7 +8559,7 @@
"name": "Operations",
"tags": [
"Agents",
- "BatchInference",
+ "BatchInference (Coming Soon)",
"DatasetIO",
"Datasets",
"Eval",
@@ -8568,12 +8569,12 @@
"Memory",
"MemoryBanks",
"Models",
- "PostTraining",
+ "PostTraining (Coming Soon)",
"Safety",
"Scoring",
"ScoringFunctions",
"Shields",
- "SyntheticDataGeneration",
+ "SyntheticDataGeneration (Coming Soon)",
"Telemetry"
]
},
diff --git a/docs/resources/llama-stack-spec.yaml b/docs/resources/llama-stack-spec.yaml
index e84f11bdd..8ffd9fdef 100644
--- a/docs/resources/llama-stack-spec.yaml
+++ b/docs/resources/llama-stack-spec.yaml
@@ -2629,6 +2629,7 @@ components:
enum:
- bing
- brave
+ - tavily
type: string
input_shields:
items:
@@ -3397,11 +3398,10 @@ components:
- api_key
type: object
info:
- description: "This is the specification of the llama stack that provides\n \
+ description: "This is the specification of the Llama Stack that provides\n \
\ a set of endpoints and their corresponding interfaces that are tailored\
- \ to\n best leverage Llama Models. The specification is still in\
- \ draft and subject to change.\n Generated at 2024-11-19 09:14:01.145131"
- title: '[DRAFT] Llama Stack Specification'
+ \ to\n best leverage Llama Models. Generated at 2024-11-22 17:23:55.034164"
+ title: Llama Stack Specification
version: alpha
jsonSchemaDialect: https://json-schema.org/draft/2020-12/schema
openapi: 3.1.0
@@ -3658,7 +3658,7 @@ paths:
$ref: '#/components/schemas/BatchChatCompletionResponse'
description: OK
tags:
- - BatchInference
+ - BatchInference (Coming Soon)
/alpha/batch-inference/completion:
post:
parameters:
@@ -3683,7 +3683,7 @@ paths:
$ref: '#/components/schemas/BatchCompletionResponse'
description: OK
tags:
- - BatchInference
+ - BatchInference (Coming Soon)
/alpha/datasetio/get-rows-paginated:
get:
parameters:
@@ -4337,7 +4337,7 @@ paths:
$ref: '#/components/schemas/PostTrainingJobArtifactsResponse'
description: OK
tags:
- - PostTraining
+ - PostTraining (Coming Soon)
/alpha/post-training/job/cancel:
post:
parameters:
@@ -4358,7 +4358,7 @@ paths:
'200':
description: OK
tags:
- - PostTraining
+ - PostTraining (Coming Soon)
/alpha/post-training/job/logs:
get:
parameters:
@@ -4382,7 +4382,7 @@ paths:
$ref: '#/components/schemas/PostTrainingJobLogStream'
description: OK
tags:
- - PostTraining
+ - PostTraining (Coming Soon)
/alpha/post-training/job/status:
get:
parameters:
@@ -4406,7 +4406,7 @@ paths:
$ref: '#/components/schemas/PostTrainingJobStatusResponse'
description: OK
tags:
- - PostTraining
+ - PostTraining (Coming Soon)
/alpha/post-training/jobs:
get:
parameters:
@@ -4425,7 +4425,7 @@ paths:
$ref: '#/components/schemas/PostTrainingJob'
description: OK
tags:
- - PostTraining
+ - PostTraining (Coming Soon)
/alpha/post-training/preference-optimize:
post:
parameters:
@@ -4450,7 +4450,7 @@ paths:
$ref: '#/components/schemas/PostTrainingJob'
description: OK
tags:
- - PostTraining
+ - PostTraining (Coming Soon)
/alpha/post-training/supervised-fine-tune:
post:
parameters:
@@ -4475,7 +4475,7 @@ paths:
$ref: '#/components/schemas/PostTrainingJob'
description: OK
tags:
- - PostTraining
+ - PostTraining (Coming Soon)
/alpha/providers/list:
get:
parameters:
@@ -4755,7 +4755,7 @@ paths:
$ref: '#/components/schemas/SyntheticDataGenerationResponse'
description: OK
tags:
- - SyntheticDataGeneration
+ - SyntheticDataGeneration (Coming Soon)
/alpha/telemetry/get-trace:
get:
parameters:
@@ -4863,7 +4863,7 @@ tags:
- description:
name: BatchCompletionResponse
-- name: BatchInference
+- name: BatchInference (Coming Soon)
- description:
name: BenchmarkEvalTaskConfig
@@ -5044,7 +5044,7 @@ tags:
- description:
name: PhotogenToolDefinition
-- name: PostTraining
+- name: PostTraining (Coming Soon)
- description:
name: PostTrainingJob
@@ -5179,7 +5179,7 @@ tags:
- description:
name: SyntheticDataGenerateRequest
-- name: SyntheticDataGeneration
+- name: SyntheticDataGeneration (Coming Soon)
- description: 'Response from the synthetic data generation. Batch of (prompt, response,
score) tuples that pass the threshold.
@@ -5262,7 +5262,7 @@ x-tagGroups:
- name: Operations
tags:
- Agents
- - BatchInference
+ - BatchInference (Coming Soon)
- DatasetIO
- Datasets
- Eval
@@ -5272,12 +5272,12 @@ x-tagGroups:
- Memory
- MemoryBanks
- Models
- - PostTraining
+ - PostTraining (Coming Soon)
- Safety
- Scoring
- ScoringFunctions
- Shields
- - SyntheticDataGeneration
+ - SyntheticDataGeneration (Coming Soon)
- Telemetry
- name: Types
tags:
diff --git a/docs/source/conf.py b/docs/source/conf.py
index 152c94563..5d88ae3d6 100644
--- a/docs/source/conf.py
+++ b/docs/source/conf.py
@@ -25,6 +25,7 @@
"sphinx_copybutton",
"sphinx_tabs.tabs",
"sphinx_design",
+ "sphinxcontrib.redoc",
]
myst_enable_extensions = ["colon_fence"]
@@ -82,3 +83,18 @@
html_static_path = ["../_static"]
# html_logo = "../_static/llama-stack-logo.png"
html_style = "../_static/css/my_theme.css"
+
+redoc = [
+ {
+ "name": "Llama Stack API",
+ "page": "references/api_reference/index",
+ "spec": "../resources/llama-stack-spec.yaml",
+ "opts": {
+ "suppress-warnings": True,
+ # "expand-responses": ["200", "201"],
+ },
+ "embed": True,
+ },
+]
+
+redoc_uri = "https://cdn.redoc.ly/redoc/latest/bundles/redoc.standalone.js"
diff --git a/docs/source/references/api_reference/index.md b/docs/source/references/api_reference/index.md
new file mode 100644
index 000000000..679bc8e5e
--- /dev/null
+++ b/docs/source/references/api_reference/index.md
@@ -0,0 +1,7 @@
+# API Reference
+
+```{eval-rst}
+.. sphinxcontrib-redoc:: ../resources/llama-stack-spec.yaml
+ :page-title: API Reference
+ :expand-responses: all
+```
diff --git a/docs/source/references/index.md b/docs/source/references/index.md
index 94c3a35a2..85b1ad75a 100644
--- a/docs/source/references/index.md
+++ b/docs/source/references/index.md
@@ -1,11 +1,15 @@
# References
+- [API Reference](api_reference/index) for the Llama Stack API specification
- [Llama CLI](llama_cli_reference/index) for building and running your Llama Stack server
- [Llama Stack Client CLI](llama_stack_client_cli_reference/index) for interacting with your Llama Stack server
+
```{toctree}
:maxdepth: 2
:hidden:
+api_reference/index
llama_cli_reference/index
llama_stack_client_cli_reference/index
llama_cli_reference/download_models
+```