microsoft
diff --git a/‎python/semantic_kernel/agents/open_ai/responses_agent_thread_actions.py
Lines changed: 195 additions & 58 deletions b/‎python/semantic_kernel/agents/open_ai/responses_agent_thread_actions.py
Lines changed: 195 additions & 58 deletions
diff --git a/‎python/semantic_kernel/contents/__init__.py
Lines changed: 20 additions & 6 deletions b/‎python/semantic_kernel/contents/__init__.py
Lines changed: 20 additions & 6 deletions
diff --git a/‎python/semantic_kernel/contents/chat_message_content.py
Lines changed: 54 additions & 12 deletions b/‎python/semantic_kernel/contents/chat_message_content.py
Lines changed: 54 additions & 12 deletions
diff --git a/‎python/semantic_kernel/contents/const.py
Lines changed: 2 additions & 0 deletions b/‎python/semantic_kernel/contents/const.py
Lines changed: 2 additions & 0 deletions
diff --git a/‎python/semantic_kernel/contents/file_content.py
Lines changed: 105 additions & 0 deletions b/‎python/semantic_kernel/contents/file_content.py
Lines changed: 105 additions & 0 deletions
diff --git a/‎python/tests/assets/sample_file.pdf
617 Bytes b/‎python/tests/assets/sample_file.pdf
617 Bytes
@@ -4,12 +4,19 @@
 from semantic_kernel.contents.audio_content import AudioContent
 from semantic_kernel.contents.chat_history import ChatHistory
 from semantic_kernel.contents.chat_message_content import ChatMessageContent
+from semantic_kernel.contents.file_content import FileContent
 from semantic_kernel.contents.file_reference_content import FileReferenceContent
 from semantic_kernel.contents.function_call_content import FunctionCallContent
 from semantic_kernel.contents.function_result_content import FunctionResultContent
-from semantic_kernel.contents.history_reducer.chat_history_reducer import ChatHistoryReducer
-from semantic_kernel.contents.history_reducer.chat_history_summarization_reducer import ChatHistorySummarizationReducer
-from semantic_kernel.contents.history_reducer.chat_history_truncation_reducer import ChatHistoryTruncationReducer
+from semantic_kernel.contents.history_reducer.chat_history_reducer import (
+    ChatHistoryReducer,
+)
+from semantic_kernel.contents.history_reducer.chat_history_summarization_reducer import (
+    ChatHistorySummarizationReducer,
+)
+from semantic_kernel.contents.history_reducer.chat_history_truncation_reducer import (
+    ChatHistoryTruncationReducer,
+)
 from semantic_kernel.contents.image_content import ImageContent
 from semantic_kernel.contents.realtime_events import (
     RealtimeAudioEvent,
@@ -20,9 +27,15 @@
     RealtimeImageEvent,
     RealtimeTextEvent,
 )
-from semantic_kernel.contents.streaming_annotation_content import StreamingAnnotationContent
-from semantic_kernel.contents.streaming_chat_message_content import StreamingChatMessageContent
-from semantic_kernel.contents.streaming_file_reference_content import StreamingFileReferenceContent
+from semantic_kernel.contents.streaming_annotation_content import (
+    StreamingAnnotationContent,
+)
+from semantic_kernel.contents.streaming_chat_message_content import (
+    StreamingChatMessageContent,
+)
+from semantic_kernel.contents.streaming_file_reference_content import (
+    StreamingFileReferenceContent,
+)
 from semantic_kernel.contents.streaming_text_content import StreamingTextContent
 from semantic_kernel.contents.text_content import TextContent
 from semantic_kernel.contents.utils.author_role import AuthorRole
@@ -37,6 +50,7 @@
     "ChatHistorySummarizationReducer",
     "ChatHistoryTruncationReducer",
     "ChatMessageContent",
+    "FileContent",
     "FileReferenceContent",
     "FinishReason",
     "FunctionCallContent",
 
@@ -16,6 +16,7 @@
     ANNOTATION_CONTENT_TAG,
     CHAT_MESSAGE_CONTENT_TAG,
     DISCRIMINATOR_FIELD,
+    FILE_CONTENT_TAG,
     FILE_REFERENCE_CONTENT_TAG,
     FUNCTION_CALL_CONTENT_TAG,
     FUNCTION_RESULT_CONTENT_TAG,
@@ -26,12 +27,17 @@
     ContentTypes,
 )
 from semantic_kernel.contents.file_reference_content import FileReferenceContent
+from semantic_kernel.contents.file_content import FileContent
 from semantic_kernel.contents.function_call_content import FunctionCallContent
 from semantic_kernel.contents.function_result_content import FunctionResultContent
 from semantic_kernel.contents.image_content import ImageContent
 from semantic_kernel.contents.kernel_content import KernelContent
-from semantic_kernel.contents.streaming_annotation_content import StreamingAnnotationContent
-from semantic_kernel.contents.streaming_file_reference_content import StreamingFileReferenceContent
+from semantic_kernel.contents.streaming_annotation_content import (
+    StreamingAnnotationContent,
+)
+from semantic_kernel.contents.streaming_file_reference_content import (
+    StreamingFileReferenceContent,
+)
 from semantic_kernel.contents.text_content import TextContent
 from semantic_kernel.contents.utils.author_role import AuthorRole
 from semantic_kernel.contents.utils.finish_reason import FinishReason
@@ -48,6 +54,7 @@
     IMAGE_CONTENT_TAG: ImageContent,
     STREAMING_FILE_REFERENCE_CONTENT_TAG: StreamingFileReferenceContent,
     STREAMING_ANNOTATION_CONTENT_TAG: StreamingAnnotationContent,
+    FILE_CONTENT_TAG: FileContent,
 }
 
 CMC_ITEM_TYPES = Annotated[
@@ -58,6 +65,7 @@
     | FunctionResultContent
     | FunctionCallContent
     | FileReferenceContent
+    | FileContent
     | StreamingAnnotationContent
     | StreamingFileReferenceContent
     | AudioContent,
@@ -239,7 +247,13 @@ def to_element(self) -> "Element":
         """
         root = Element(self.tag)
         for field in self.model_fields_set:
-            if field not in ["role", "name", "encoding", "finish_reason", "ai_model_id"]:
+            if field not in [
+                "role",
+                "name",
+                "encoding",
+                "finish_reason",
+                "ai_model_id",
+            ]:
                 continue
             value = getattr(self, field)
             if isinstance(value, Enum):
@@ -260,15 +274,22 @@ def from_element(cls, element: Element) -> "ChatMessageContent":
             ChatMessageContent - The new instance of ChatMessageContent or a subclass.
         """
         if element.tag != cls.tag:
-            raise ContentInitializationError(f"Element tag is not {cls.tag}")  # pragma: no cover
+            raise ContentInitializationError(
+                f"Element tag is not {cls.tag}"
+            )  # pragma: no cover
         kwargs: dict[str, Any] = {key: value for key, value in element.items()}
         items: list[KernelContent] = []
         if element.text:
             items.append(TextContent(text=unescape(element.text)))
         for child in element:
             if child.tag not in TAG_CONTENT_MAP:
-                logger.warning('Unknown tag "%s" in ChatMessageContent, treating as text', child.tag)
-                text = ElementTree.tostring(child, encoding="unicode", short_empty_elements=False)
+                logger.warning(
+                    'Unknown tag "%s" in ChatMessageContent, treating as text',
+                    child.tag,
+                )
+                text = ElementTree.tostring(
+                    child, encoding="unicode", short_empty_elements=False
+                )
                 items.append(TextContent(text=unescape(text) or ""))
             else:
                 items.append(TAG_CONTENT_MAP[child.tag].from_element(child))  # type: ignore
@@ -294,9 +315,13 @@ def to_prompt(self) -> str:
             str - The prompt from the ChatMessageContent.
         """
         root = self.to_element()
-        return ElementTree.tostring(root, encoding=self.encoding or "unicode", short_empty_elements=False)
+        return ElementTree.tostring(
+            root, encoding=self.encoding or "unicode", short_empty_elements=False
+        )
 
-    def to_dict(self, role_key: str = "role", content_key: str = "content") -> dict[str, Any]:
+    def to_dict(
+        self, role_key: str = "role", content_key: str = "content"
+    ) -> dict[str, Any]:
         """Serialize the ChatMessageContent to a dictionary.
 
         Returns:
@@ -305,8 +330,14 @@ def to_dict(self, role_key: str = "role", content_key: str = "content") -> dict[
         ret: dict[str, Any] = {
             role_key: self.role.value,
         }
-        if self.role == AuthorRole.ASSISTANT and any(isinstance(item, FunctionCallContent) for item in self.items):
-            ret["tool_calls"] = [item.to_dict() for item in self.items if isinstance(item, FunctionCallContent)]
+        if self.role == AuthorRole.ASSISTANT and any(
+            isinstance(item, FunctionCallContent) for item in self.items
+        ):
+            ret["tool_calls"] = [
+                item.to_dict()
+                for item in self.items
+                if isinstance(item, FunctionCallContent)
+            ]
         else:
             ret[content_key] = self._parse_items()
         if self.role == AuthorRole.TOOL:
@@ -330,5 +361,16 @@ def _parse_items(self) -> str | list[dict[str, Any]]:
 
     def __hash__(self) -> int:
         """Return the hash of the chat message content."""
-        hashable_items = [make_hashable(item) for item in self.items] if self.items else []
-        return hash((self.tag, self.role, self.content, self.encoding, self.finish_reason, *hashable_items))
+        hashable_items = (
+            [make_hashable(item) for item in self.items] if self.items else []
+        )
+        return hash(
+            (
+                self.tag,
+                self.role,
+                self.content,
+                self.encoding,
+                self.finish_reason,
+                *hashable_items,
+            )
+        )
@@ -9,6 +9,7 @@
 IMAGE_CONTENT_TAG: Final[str] = "image"
 ANNOTATION_CONTENT_TAG: Final[str] = "annotation"
 STREAMING_ANNOTATION_CONTENT_TAG: Final[str] = "streaming_annotation"
+FILE_CONTENT_TAG: Final[str] = "file"
 BINARY_CONTENT_TAG: Final[str] = "binary"
 FILE_REFERENCE_CONTENT_TAG: Final[str] = "file_reference"
 STREAMING_FILE_REFERENCE_CONTENT_TAG: Final[str] = "streaming_file_reference"
@@ -25,6 +26,7 @@ class ContentTypes(str, Enum):
     BINARY_CONTENT = BINARY_CONTENT_TAG
     CHAT_MESSAGE_CONTENT = CHAT_MESSAGE_CONTENT_TAG
     IMAGE_CONTENT = IMAGE_CONTENT_TAG
+    FILE_CONTENT = FILE_CONTENT_TAG
     FILE_REFERENCE_CONTENT = FILE_REFERENCE_CONTENT_TAG
     FUNCTION_CALL_CONTENT = FUNCTION_CALL_CONTENT_TAG
     FUNCTION_RESULT_CONTENT = FUNCTION_RESULT_CONTENT_TAG
 
@@ -0,0 +1,157 @@
+# Copyright (c) Microsoft. All rights reserved.
+
+import base64
+import logging
+import mimetypes
+import os
+import re
+from typing import Any, ClassVar, Literal, TypeVar
+
+from numpy import ndarray
+from pydantic import Field
+
+from semantic_kernel.contents.binary_content import BinaryContent
+from semantic_kernel.contents.const import FILE_CONTENT_TAG, ContentTypes
+from semantic_kernel.utils.feature_stage_decorator import experimental
+
+logger = logging.getLogger(__name__)
+
+_T = TypeVar("_T", bound="FileContent")
+
+# Base64 data URI, e.g. ``data:application/pdf;base64,....``; compiled once for from_element.
+_DATA_URI_PATTERN = re.compile(r"data:([^;]+);base64,(.*)")
+
+
+@experimental
+class FileContent(BinaryContent):
+    """File content that carries a filename alongside binary data or a URI.
+
+    Instances can be created from raw data, from a URI, or from a file on disk
+    via ``from_file``. ``to_dict`` and ``to_element`` both serialize the content
+    as an ``input_file`` payload whose ``file_data`` is ``str(self)``.
+    """
+
+    content_type: Literal[ContentTypes.FILE_CONTENT] = Field(FILE_CONTENT_TAG, init=False)  # type: ignore
+    tag: ClassVar[str] = FILE_CONTENT_TAG
+    filename: str | None = None
+
+    def __init__(
+        self,
+        filename: str | None = None,
+        uri: str | None = None,
+        data_uri: str | None = None,
+        data: str | bytes | ndarray | None = None,
+        data_format: str | None = None,
+        mime_type: str | None = None,
+        **kwargs: Any,
+    ):
+        """Create a FileContent.
+
+        Args:
+            filename: Name of the file. When omitted and ``uri`` is given, the
+                base name of ``uri`` is used instead.
+            uri: Location of the file; forwarded to ``BinaryContent``.
+            data_uri: Data URI; forwarded to ``BinaryContent``.
+            data: File payload; forwarded to ``BinaryContent``.
+            data_format: Format of ``data``. Defaults to ``"base64"`` when
+                ``data`` is supplied without an explicit format.
+            mime_type: MIME type; forwarded to ``BinaryContent``.
+            **kwargs: Extra keyword arguments forwarded to ``BinaryContent``.
+        """
+        # Always use base64 for file data for consistency with serialization
+        if data is not None and data_format is None:
+            data_format = "base64"
+        super().__init__(
+            uri=uri,
+            data_uri=data_uri,
+            data=data,
+            data_format=data_format,
+            mime_type=mime_type,
+            **kwargs,
+        )
+        if filename is None and uri is not None:
+            filename = os.path.basename(uri)
+        self.filename = filename
+
+    @classmethod
+    def from_file(cls: type[_T], file_path: str, **kwargs: Any) -> _T:
+        """Create a FileContent from a file on disk.
+
+        Args:
+            file_path: Path of the file to read.
+            **kwargs: Extra keyword arguments forwarded to the constructor. An
+                explicit ``mime_type`` takes precedence over the guessed one.
+
+        Returns:
+            An instance holding the file's bytes, the base name of ``file_path``
+            as ``filename`` and the MIME type guessed from the file name.
+        """
+        guessed_type, _ = mimetypes.guess_type(file_path)
+        # guess_type yields None for unknown extensions, so let callers pass mime_type
+        mime_type = kwargs.pop("mime_type", None) or guessed_type
+        with open(file_path, "rb") as f:
+            data = f.read()
+        # Always use base64 for file data for consistency with serialization
+        return cls(
+            filename=os.path.basename(file_path),
+            data=data,
+            mime_type=mime_type,
+            data_format="base64",
+            **kwargs,
+        )
+
+    def __str__(self) -> str:
+        """Return a base64 data URI when data is set, else the URI, else an empty string."""
+        # NOTE(review): the URI branch is only reachable if ``self.data`` is None for
+        # URI-only content - confirm against BinaryContent.
+        if self.data is not None and self.mime_type is not None:
+            encoded = base64.b64encode(self.data).decode("ascii")
+            return f"data:{self.mime_type};base64,{encoded}"
+        if self.uri is not None:
+            return str(self.uri)
+        return ""
+
+    def to_element(self) -> Any:
+        """Return the same ``input_file`` payload as ``to_dict``."""
+        # NOTE(review): this is a dict, not an XML element - confirm callers that
+        # build XML from content items can handle it.
+        return self.to_dict()
+
+    @classmethod
+    def from_element(cls: type[_T], element: Any) -> _T:
+        """Create a FileContent from a serialized ``input_file`` payload.
+
+        Args:
+            element: Object exposing ``get`` for the optional ``file_data`` and
+                ``filename`` entries, such as the dict produced by ``to_dict``.
+
+        Returns:
+            An instance built from ``file_data``: a base64 data URI is decoded
+            into data and MIME type, any other non-empty value is kept as the URI.
+        """
+        file_data = element.get("file_data")
+        filename = element.get("filename")
+        uri = None
+        data = None
+        mime_type = None
+        data_format = None
+        if file_data and file_data.startswith("data:"):
+            match = _DATA_URI_PATTERN.match(file_data)
+            if match:
+                mime_type = match.group(1)
+                data = base64.b64decode(match.group(2))
+                data_format = "base64"
+        elif file_data:
+            # __str__ emits the plain URI when there is no data; keep it on the way back
+            uri = file_data
+        return cls(
+            filename=filename,
+            uri=uri,
+            data=data,
+            mime_type=mime_type,
+            data_format=data_format,
+        )
+
+    def to_dict(self) -> dict[str, Any]:
+        """Serialize to an ``input_file`` payload with ``filename`` and ``file_data``."""
+        return {"type": "input_file", "filename": self.filename, "file_data": str(self)}