Commit 1485f3b

Expand file types tested with file_search

This expands the file types tested with file_search to include Word documents (.docx), Markdown (.md), text (.txt), PDF (.pdf), and PowerPoint (.pptx) files. Python's mimetypes library doesn't actually recognize Markdown docs as text, so we have to handle that case specifically instead of relying on mimetypes to get it right.

Signed-off-by: Ben Browning <[email protected]>

1 parent 0f7d487 · commit 1485f3b

File tree

7 files changed: +90 −5 lines changed


llama_stack/providers/inline/tool_runtime/synthetic-data-kit/synthetic_data_kit.py

Lines changed: 10 additions & 4 deletions
```diff
@@ -13,7 +13,7 @@
 from typing import Any

 from llama_stack.apis.common.content_types import URL
-from llama_stack.apis.files.files import Files
+from llama_stack.apis.files import Files
 from llama_stack.apis.tools import (
     ListToolDefsResponse,
     ToolDef,
@@ -76,7 +76,7 @@ async def invoke_tool(self, tool_name: str, kwargs: dict[str, Any]) -> ToolInvoc

         file_id = kwargs["file_id"]
         file_response = await self.files_api.openai_retrieve_file(file_id)
-        mime_type, _ = mimetypes.guess_type(file_response.filename)
+        mime_type = self._guess_mime_type(file_response.filename)
         content_response = await self.files_api.openai_retrieve_file_content(file_id)

         mime_category = mime_type.split("/")[0] if mime_type else None
@@ -89,10 +89,16 @@ async def invoke_tool(self, tool_name: str, kwargs: dict[str, Any]) -> ToolInvoc
             )
         else:
             return await asyncio.to_thread(
-                self.synthetic_data_kit_convert, content_response.body, file_response.filename
+                self._synthetic_data_kit_convert, content_response.body, file_response.filename
             )

-    def synthetic_data_kit_convert(self, content_body: bytes, filename: str) -> ToolInvocationResult:
+    def _guess_mime_type(self, filename: str) -> str | None:
+        mime_type, _ = mimetypes.guess_type(filename)
+        if mime_type is None and filename.endswith(".md"):
+            mime_type = "text/markdown"
+        return mime_type
+
+    def _synthetic_data_kit_convert(self, content_body: bytes, filename: str) -> ToolInvocationResult:
         from synthetic_data_kit.core.ingest import process_file

         try:
```
Binary file not shown.
Lines changed: 27 additions & 0 deletions
```markdown
# Llama Stack

## Llama Stack Overview

Llama Stack standardizes the core building blocks that simplify AI application development. It codifies best practices across the Llama ecosystem. More specifically, it provides

* Unified API layer for Inference, RAG, Agents, Tools, Safety, Evals, and Telemetry.
* Plugin architecture to support the rich ecosystem of different API implementations in various environments, including local development, on-premises, cloud, and mobile.
* Prepackaged verified distributions which offer a one-stop solution for developers to get started quickly and reliably in any environment.
* Multiple developer interfaces like CLI and SDKs for Python, Typescript, iOS, and Android.
* Standalone applications as examples for how to build production-grade AI applications with Llama Stack.

## Llama Stack Benefits

* Flexible Options: Developers can choose their preferred infrastructure without changing APIs and enjoy flexible deployment choices.
* Consistent Experience: With its unified APIs, Llama Stack makes it easier to build, test, and deploy AI applications with consistent application behavior.
* Robust Ecosystem: Llama Stack is already integrated with distribution partners (cloud providers, hardware vendors, and AI-focused companies) that offer tailored infrastructure, software, and services for deploying Llama models.

# Llama 4 Maverick

Llama 4 Maverick is a Mixture-of-Experts (MoE) model with 17 billion active parameters and 128 experts.
```
Binary file not shown.
Lines changed: 24 additions & 0 deletions
```text
Llama Stack


Llama Stack Overview

Llama Stack standardizes the core building blocks that simplify AI application development. It codifies best practices across the Llama ecosystem. More specifically, it provides

* Unified API layer for Inference, RAG, Agents, Tools, Safety, Evals, and Telemetry.
* Plugin architecture to support the rich ecosystem of different API implementations in various environments, including local development, on-premises, cloud, and mobile.
* Prepackaged verified distributions which offer a one-stop solution for developers to get started quickly and reliably in any environment.
* Multiple developer interfaces like CLI and SDKs for Python, Typescript, iOS, and Android.
* Standalone applications as examples for how to build production-grade AI applications with Llama Stack.


Llama Stack Benefits

* Flexible Options: Developers can choose their preferred infrastructure without changing APIs and enjoy flexible deployment choices.
* Consistent Experience: With its unified APIs, Llama Stack makes it easier to build, test, and deploy AI applications with consistent application behavior.
* Robust Ecosystem: Llama Stack is already integrated with distribution partners (cloud providers, hardware vendors, and AI-focused companies) that offer tailored infrastructure, software, and services for deploying Llama models.


Llama 4 Maverick

Llama 4 Maverick is a Mixture-of-Experts (MoE) model with 17 billion active parameters and 128 experts.
```

tests/verifications/openai_api/fixtures/test_cases/responses.yaml

Lines changed: 29 additions & 1 deletion
```diff
@@ -42,12 +42,40 @@ test_response_file_search:
         # vector_store_ids param for file_search tool gets added by the test runner
         file_content: "Llama 4 Maverick has 128 experts"
         output: "128"
+      - case_id: "llama_experts_docx"
+        input: "How many experts does the Llama 4 Maverick model have?"
+        tools:
+          - type: file_search
+        # vector_store_ids param for file_search tool gets added by the test runner
+        file_path: "docs/llama_stack_and_models.docx"
+        output: "128"
+      - case_id: "llama_experts_md"
+        input: "How many experts does the Llama 4 Maverick model have?"
+        tools:
+          - type: file_search
+        # vector_store_ids param for file_search tool gets added by the test runner
+        file_path: "docs/llama_stack_and_models.md"
+        output: "128"
       - case_id: "llama_experts_pdf"
         input: "How many experts does the Llama 4 Maverick model have?"
         tools:
           - type: file_search
         # vector_store_ids param for file_search tool gets added by the test runner
-        file_path: "pdfs/llama_stack_and_models.pdf"
+        file_path: "docs/llama_stack_and_models.pdf"
+        output: "128"
+      - case_id: "llama_experts_pptx"
+        input: "How many experts does the Llama 4 Maverick model have?"
+        tools:
+          - type: file_search
+        # vector_store_ids param for file_search tool gets added by the test runner
+        file_path: "docs/llama_stack_and_models.pptx"
+        output: "128"
+      - case_id: "llama_experts_txt"
+        input: "How many experts does the Llama 4 Maverick model have?"
+        tools:
+          - type: file_search
+        # vector_store_ids param for file_search tool gets added by the test runner
+        file_path: "docs/llama_stack_and_models.txt"
         output: "128"

 test_response_mcp_tool:
```
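Each of the new cases follows the same schema: a `case_id`, a prompt, a `file_search` tool entry, the fixture file to index, and the expected answer substring. A minimal sketch of reading such a fixture, assuming PyYAML is installed; the real test runner does considerably more (uploading the file and injecting the `vector_store_ids` param, as the comments note):

```python
import yaml  # PyYAML, assumed available

# Inline copy of one test case in the fixture's schema (illustrative).
FIXTURE = """
test_response_file_search:
  - case_id: "llama_experts_md"
    input: "How many experts does the Llama 4 Maverick model have?"
    tools:
      - type: file_search
    file_path: "docs/llama_stack_and_models.md"
    output: "128"
"""

cases = yaml.safe_load(FIXTURE)["test_response_file_search"]
for case in cases:
    # Each case pairs a prompt with a fixture file for file_search to index
    # and the substring expected in the model's answer.
    print(case["case_id"], case["file_path"], "->", case["output"])
```

Keeping one case per file type, all asking the same question with the same expected answer, isolates the variable under test: the document converter's handling of each MIME type.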
