langchain-ai · baskaryan · Nov 8, 2024
diff --git a/python/langsmith/evaluation/_runner.py b/python/langsmith/evaluation/_runner.py
@@ -1,4 +1,4 @@
 """V2 Evaluation Interface."""

 from __future__ import annotations

@@ -7,12 +7,14 @@
 import concurrent.futures as cf
 import datetime
 import functools
+import importlib
 import inspect
 import itertools
 import logging
 import pathlib
 import queue
 import random
+import sys
 import textwrap
 import threading
 import uuid
@@ -94,6 +96,9 @@
     ],
 ]
 
+_IS_INTERACTIVE_ENV = hasattr(sys, "ps2")  # ps2 exists only in interactive mode
+_IPYTHON_INSTALLED = importlib.import_module("importlib.util").find_spec("IPython")
+
 
 def evaluate(
     target: TARGET_T,
@@ -1113,15 +1118,25 @@
                 f"{base_url}/datasets/{dataset_id}/compare?"
                 f"selectedSessions={project.id}"
             )
-            print(  # noqa: T201
-                f"View the evaluation results for experiment: '{self.experiment_name}'"
-                f" at:\n{comparison_url}\n\n"
-            )
         else:
-            # HACKHACK
+            comparison_url = None
+
+        if _IS_INTERACTIVE_ENV and _IPYTHON_INSTALLED and comparison_url:
+            from IPython.display import HTML, display  # type: ignore[import-not-found]
+
+            display(
+                HTML(
+                    f"RUNNING EXPERIMENT: <a href='{comparison_url}'>"
+                    f"{self.experiment_name}</a>"
+                )
+            )
+        elif comparison_url:
             print(  # noqa: T201
-                "Starting evaluation of experiment: %s", self.experiment_name
+                f"RUNNING EXPERIMENT: {self.experiment_name}\nEXPERIMENT URL: "
+                f"{comparison_url}"
             )
+        else:
+            print(f"RUNNING EXPERIMENT: {self.experiment_name}")  # noqa: T201
 
 
 class _ExperimentManager(_ExperimentManagerMixin):