[DO NOT MERGE] add mime type to attachment info #1341

Draft · wants to merge 2 commits into base: main
2 changes: 2 additions & 0 deletions python/langsmith/client.py
@@ -1,4 +1,4 @@
"""Client for interacting with the LangSmith API.

Check notice on line 1 in python/langsmith/client.py (GitHub Actions / benchmark): Benchmark results

create_5_000_run_trees: Mean +- std dev: 699 ms +- 102 ms (warning: result may be unstable; the standard deviation (102 ms) is 15% of the mean)
create_10_000_run_trees: Mean +- std dev: 1.35 sec +- 0.16 sec (warning: result may be unstable; the standard deviation (157 ms) is 12% of the mean)
create_20_000_run_trees: Mean +- std dev: 1.39 sec +- 0.18 sec (warning: result may be unstable; the standard deviation (175 ms) is 13% of the mean)
dumps_class_nested_py_branch_and_leaf_200x400: Mean +- std dev: 692 us +- 10 us
dumps_class_nested_py_leaf_50x100: Mean +- std dev: 24.8 ms +- 0.2 ms
dumps_class_nested_py_leaf_100x200: Mean +- std dev: 102 ms +- 2 ms
dumps_dataclass_nested_50x100: Mean +- std dev: 25.0 ms +- 0.2 ms
dumps_pydantic_nested_50x100: Mean +- std dev: 68.6 ms +- 15.0 ms (warning: result may be unstable; the standard deviation (15.0 ms) is 22% of the mean)
dumps_pydanticv1_nested_50x100: Mean +- std dev: 194 ms +- 2 ms

For the unstable results, pyperf suggests rerunning the benchmark with more runs, values and/or loops, running 'python -m pyperf system tune' to reduce system jitter, and using pyperf stats, pyperf dump and pyperf hist to analyze results (the --quiet option hides these warnings).

Check notice on line 1 in python/langsmith/client.py (GitHub Actions / benchmark): Comparison against main

+------------------------------------------------+----------+------------------------+
| Benchmark                                      | main     | changes                |
+================================================+==========+========================+
| dumps_pydanticv1_nested_50x100                 | 218 ms   | 194 ms: 1.13x faster   |
+------------------------------------------------+----------+------------------------+
| create_5_000_run_trees                         | 724 ms   | 699 ms: 1.04x faster   |
+------------------------------------------------+----------+------------------------+
| create_10_000_run_trees                        | 1.39 sec | 1.35 sec: 1.03x faster |
+------------------------------------------------+----------+------------------------+
| dumps_class_nested_py_leaf_100x200             | 103 ms   | 102 ms: 1.01x faster   |
+------------------------------------------------+----------+------------------------+
| dumps_class_nested_py_leaf_50x100              | 24.9 ms  | 24.8 ms: 1.00x faster  |
+------------------------------------------------+----------+------------------------+
| dumps_class_nested_py_branch_and_leaf_200x400  | 695 us   | 692 us: 1.00x faster   |
+------------------------------------------------+----------+------------------------+
| dumps_dataclass_nested_50x100                  | 25.1 ms  | 25.0 ms: 1.00x faster  |
+------------------------------------------------+----------+------------------------+
| create_20_000_run_trees                        | 1.39 sec | 1.39 sec: 1.00x faster |
+------------------------------------------------+----------+------------------------+
| dumps_pydantic_nested_50x100                   | 64.6 ms  | 68.6 ms: 1.06x slower  |
+------------------------------------------------+----------+------------------------+
| Geometric mean                                 | (ref)    | 1.02x faster           |
+------------------------------------------------+----------+------------------------+

Use the client to customize API keys / workspace connections, SSL certs,
etc. for tracing.
@@ -3903,6 +3903,7 @@
attachments[key.removeprefix("attachment.")] = {
    "presigned_url": value["presigned_url"],
    "reader": reader,
    "mime_type": value["mime_type"],
}

return ls_schemas.Example(
@@ -3989,6 +3990,7 @@
attachments[key.removeprefix("attachment.")] = {
    "presigned_url": value["presigned_url"],
    "reader": reader,
    "mime_type": value["mime_type"],
}

yield ls_schemas.Example(
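A minimal sketch of how a caller might consume the new field after this change; the dataset name below is a placeholder, and it assumes the dataset's examples were uploaded with attachments:

from langsmith import Client

client = Client()

# Hypothetical dataset name; any dataset whose examples carry attachments works.
example = next(client.list_examples(dataset_name="my-attachments-dataset"))

for name, info in example.attachments.items():
    # Each attachment entry now exposes its MIME type alongside the
    # presigned URL and the binary reader (see the diff above).
    data = info["reader"].read()
    print(f"{name}: {info['mime_type']}, {len(data)} bytes")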
2 changes: 1 addition & 1 deletion python/langsmith/schemas.py
@@ -131,7 +131,7 @@ class AttachmentInfo(TypedDict):

    presigned_url: str
    reader: BinaryIOLike
    # TODO: add mime type
    mime_type: str


class Example(ExampleBase):
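With mime_type declared on AttachmentInfo, downstream code can rely on the key being present and typed. A small illustrative sketch; the helper below is hypothetical and not part of the SDK:

from langsmith.schemas import AttachmentInfo


def describe_attachment(name: str, info: AttachmentInfo) -> str:
    # mime_type is a first-class key on AttachmentInfo after this change, so a
    # type checker can validate this lookup instead of treating the attachment
    # info as an arbitrary dict.
    return f"{name} ({info['mime_type']}): {info['presigned_url']}"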
108 changes: 108 additions & 0 deletions python/tests/integration_tests/test_client.py
@@ -1253,6 +1253,114 @@ def test_list_examples_attachments_keys(langchain_client: Client) -> None:

    langchain_client.delete_dataset(dataset_id=dataset.id)

@pytest.mark.skip(reason="Need to land https://github.com/langchain-ai/langchainplus/pull/7415 first")
def test_mime_type_is_propagated(langchain_client: Client) -> None:
    """Test that the mime type is propagated correctly."""
    dataset_name = "__test_mime_type_is_propagated" + uuid4().hex[:4]
    dataset = langchain_client.create_dataset(dataset_name=dataset_name)

    langchain_client.upload_examples_multipart(
        dataset_id=dataset.id,
        uploads=[
            ExampleUploadWithAttachments(
                inputs={"text": "hello world"},
                outputs={"response": "hi there"},
                attachments={
                    "test_file": ("text/plain", b"test content"),
                },
            )
        ],
    )

    example = next(langchain_client.list_examples(dataset_id=dataset.id))
    assert example.attachments["test_file"]["mime_type"] == "text/plain"

    example = langchain_client.read_example(example_id=example.id)
    assert example.attachments["test_file"]["mime_type"] == "text/plain"

    langchain_client.delete_dataset(dataset_id=dataset.id)

@pytest.mark.skip(reason="Need to land https://github.com/langchain-ai/langchainplus/pull/7415 first")
def test_evaluate_mime_type_is_propagated(langchain_client: Client) -> None:
    """Test that the mime type is propagated correctly when evaluating."""
    dataset_name = "__test_evaluate_mime_type_is_propagated" + uuid4().hex[:4]
    dataset = langchain_client.create_dataset(dataset_name=dataset_name)

    langchain_client.upload_examples_multipart(
        dataset_id=dataset.id,
        uploads=[
            ExampleUploadWithAttachments(
                inputs={"text": "hello world"},
                outputs={"response": "hi there"},
                attachments={
                    "test_file": ("text/plain", b"test content"),
                },
            )
        ],
    )

    def target(inputs: Dict[str, Any], attachments: Dict[str, Any]) -> Dict[str, Any]:
        # Verify we receive the attachment data
        assert attachments["test_file"]["mime_type"] == "text/plain"
        return {"answer": "hi there"}

    def evaluator(outputs: dict, reference_outputs: dict, attachments: dict) -> Dict[str, Any]:
        # Verify we receive the attachment data
        assert attachments["test_file"]["mime_type"] == "text/plain"
        return {
            "score": float(
                reference_outputs.get("response") == outputs.get("answer")  # type: ignore
            )
        }

    langchain_client.evaluate(
        target,
        data=dataset_name,
        evaluators=[evaluator],
    )

    langchain_client.delete_dataset(dataset_name=dataset_name)

@pytest.mark.skip(reason="Need to land https://github.com/langchain-ai/langchainplus/pull/7415 first")
async def test_aevaluate_mime_type_is_propagated(langchain_client: Client) -> None:
    """Test that the mime type is propagated correctly when evaluating (async)."""
    dataset_name = "__test_aevaluate_mime_type_is_propagated" + uuid4().hex[:4]
    dataset = langchain_client.create_dataset(dataset_name=dataset_name)

    langchain_client.upload_examples_multipart(
        dataset_id=dataset.id,
        uploads=[
            ExampleUploadWithAttachments(
                inputs={"text": "hello world"},
                outputs={"response": "hi there"},
                attachments={
                    "test_file": ("text/plain", b"test content"),
                },
            )
        ],
    )

    async def target(inputs: Dict[str, Any], attachments: Dict[str, Any]) -> Dict[str, Any]:
        # Verify we receive the attachment data
        assert attachments["test_file"]["mime_type"] == "text/plain"
        return {"answer": "hi there"}

    async def evaluator(outputs: dict, reference_outputs: dict, attachments: dict) -> Dict[str, Any]:
        # Verify we receive the attachment data
        assert attachments["test_file"]["mime_type"] == "text/plain"
        return {
            "score": float(
                reference_outputs.get("response") == outputs.get("answer")  # type: ignore
            )
        }

    await langchain_client.aevaluate(
        target,
        data=dataset_name,
        evaluators=[evaluator],
    )

    langchain_client.delete_dataset(dataset_name=dataset_name)

def test_evaluate_with_attachments_multiple_evaluators(
    langchain_client: Client,
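Beyond asserting the value, a target or evaluator could branch on the MIME type to decode each attachment appropriately. A minimal sketch under that assumption; the decoding logic below is illustrative and not part of this PR:

import json
from typing import Any, Dict


def target(inputs: Dict[str, Any], attachments: Dict[str, Any]) -> Dict[str, Any]:
    decoded = {}
    for name, info in attachments.items():
        raw = info["reader"].read()
        if info["mime_type"] == "application/json":
            decoded[name] = json.loads(raw)
        elif info["mime_type"].startswith("text/"):
            decoded[name] = raw.decode("utf-8")
        else:
            # Leave binary payloads (images, audio, etc.) untouched.
            decoded[name] = raw
    return {"answer": f"processed {len(decoded)} attachment(s)"}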