From f66be6f92e7ecfaac50012da64d44f717d385263 Mon Sep 17 00:00:00 2001 From: William FH <13333726+hinthornw@users.noreply.github.com> Date: Tue, 20 Aug 2024 10:41:13 -0700 Subject: [PATCH] [Python] (Beta) Async Client (#925) Co-authored-by: Jake Rachleff --- python/langsmith/__init__.py | 6 + python/langsmith/_internal/_beta_decorator.py | 9 +- python/langsmith/async_client.py | 708 ++++++++++++++++++ python/langsmith/client.py | 36 +- python/langsmith/utils.py | 30 +- python/poetry.lock | 8 +- python/pyproject.toml | 3 +- .../integration_tests/test_async_client.py | 243 ++++++ python/tests/unit_tests/test_client.py | 36 - python/tests/unit_tests/test_utils.py | 34 + 10 files changed, 1034 insertions(+), 79 deletions(-) create mode 100644 python/langsmith/async_client.py create mode 100644 python/tests/integration_tests/test_async_client.py diff --git a/python/langsmith/__init__.py b/python/langsmith/__init__.py index b865c4754..a20f5b2f9 100644 --- a/python/langsmith/__init__.py +++ b/python/langsmith/__init__.py @@ -5,6 +5,7 @@ if TYPE_CHECKING: from langsmith._expect import expect from langsmith._testing import test, unit + from langsmith.async_client import AsyncClient from langsmith.client import Client from langsmith.evaluation import aevaluate, evaluate from langsmith.evaluation.evaluator import EvaluationResult, RunEvaluator @@ -33,6 +34,10 @@ def __getattr__(name: str) -> Any: from langsmith.client import Client return Client + elif name == "AsyncClient": + from langsmith.async_client import AsyncClient + + return AsyncClient elif name == "RunTree": from langsmith.run_trees import RunTree @@ -118,4 +123,5 @@ def __getattr__(name: str) -> Any: "get_tracing_context", "get_current_run_tree", "ContextThreadPoolExecutor", + "AsyncClient", ] diff --git a/python/langsmith/_internal/_beta_decorator.py b/python/langsmith/_internal/_beta_decorator.py index 433ade058..12350d533 100644 --- a/python/langsmith/_internal/_beta_decorator.py +++ b/python/langsmith/_internal/_beta_decorator.py @@ -7,12 +7,15 @@ class LangSmithBetaWarning(UserWarning): """This is a warning specific to the LangSmithBeta module.""" +@functools.lru_cache(maxsize=100) +def _warn_once(message: str) -> None: + warnings.warn(message, LangSmithBetaWarning, stacklevel=2) + + def warn_beta(func: Callable) -> Callable: @functools.wraps(func) def wrapper(*args, **kwargs): - warnings.warn( - f"Function {func.__name__} is in beta.", LangSmithBetaWarning, stacklevel=2 - ) + _warn_once(f"Function {func.__name__} is in beta.") return func(*args, **kwargs) return wrapper diff --git a/python/langsmith/async_client.py b/python/langsmith/async_client.py new file mode 100644 index 000000000..1dc6f7119 --- /dev/null +++ b/python/langsmith/async_client.py @@ -0,0 +1,708 @@ +"""The Async LangSmith Client.""" + +from __future__ import annotations + +import asyncio +import datetime +import uuid +from typing import ( + Any, + AsyncIterator, + Dict, + List, + Mapping, + Optional, + Sequence, + Tuple, + Union, + cast, +) + +import httpx + +from langsmith import client as ls_client +from langsmith import schemas as ls_schemas +from langsmith import utils as ls_utils +from langsmith._internal import _beta_decorator as ls_beta + + +class AsyncClient: + """Async Client for interacting with the LangSmith API.""" + + __slots__ = ( + "_retry_config", + "_client", + ) + + def __init__( + self, + api_url: Optional[str] = None, + api_key: Optional[str] = None, + timeout_ms: Optional[ + Union[ + int, Tuple[Optional[int], Optional[int], Optional[int], 
Optional[int]]
+            ]
+        ] = None,
+        retry_config: Optional[Mapping[str, Any]] = None,
+    ):
+        """Initialize the async client."""
+        ls_beta._warn_once("Class AsyncClient is in beta.")
+        self._retry_config = retry_config or {"max_retries": 3}
+        _headers = {
+            "Content-Type": "application/json",
+        }
+        api_key = ls_utils.get_api_key(api_key)
+        if api_key:
+            _headers[ls_client.X_API_KEY] = api_key
+
+        if isinstance(timeout_ms, int):
+            timeout_: Union[Tuple, float] = (timeout_ms / 1000, None, None, None)
+        elif isinstance(timeout_ms, tuple):
+            timeout_ = tuple([t / 1000 if t is not None else None for t in timeout_ms])
+        else:
+            timeout_ = 10
+        self._client = httpx.AsyncClient(
+            base_url=ls_utils.get_api_url(api_url), headers=_headers, timeout=timeout_
+        )
+
+    async def __aenter__(self) -> "AsyncClient":
+        """Enter the async client."""
+        return self
+
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        """Exit the async client."""
+        await self.aclose()
+
+    async def aclose(self):
+        """Close the async client."""
+        await self._client.aclose()
+
+    async def _arequest_with_retries(
+        self,
+        method: str,
+        endpoint: str,
+        **kwargs: Any,
+    ) -> httpx.Response:
+        """Make an async HTTP request with retries."""
+        max_retries = cast(int, self._retry_config.get("max_retries", 3))
+        for attempt in range(max_retries):
+            try:
+                response = await self._client.request(method, endpoint, **kwargs)
+                ls_utils.raise_for_status_with_text(response)
+                return response
+            except httpx.HTTPStatusError as e:
+                if attempt == max_retries - 1:
+                    raise ls_utils.LangSmithAPIError(f"HTTP error: {repr(e)}")
+                await asyncio.sleep(2**attempt)
+            except httpx.RequestError as e:
+                if attempt == max_retries - 1:
+                    raise ls_utils.LangSmithConnectionError(f"Request error: {repr(e)}")
+                await asyncio.sleep(2**attempt)
+        raise ls_utils.LangSmithAPIError(
+            "Unexpected error connecting to the LangSmith API"
+        )
+
+    async def _aget_paginated_list(
+        self,
+        path: str,
+        params: Optional[Dict[str, Any]] = None,
+    ) -> AsyncIterator[Dict[str, Any]]:
+        """Get a paginated list of items."""
+        params = params or {}
+        offset = params.get("offset", 0)
+        params["limit"] = params.get("limit", 100)
+        while True:
+            params["offset"] = offset
+            response = await self._arequest_with_retries("GET", path, params=params)
+            items = response.json()
+            if not items:
+                break
+            for item in items:
+                yield item
+            if len(items) < params["limit"]:
+                break
+            offset += len(items)
+
+    async def _aget_cursor_paginated_list(
+        self,
+        path: str,
+        *,
+        body: Optional[dict] = None,
+        request_method: str = "POST",
+        data_key: str = "runs",
+    ) -> AsyncIterator[dict]:
+        """Get a cursor paginated list of items."""
+        params_ = body.copy() if body else {}
+        while True:
+            response = await self._arequest_with_retries(
+                request_method,
+                path,
+                content=ls_client._dumps_json(params_),
+            )
+            response_body = response.json()
+            if not response_body:
+                break
+            if not response_body.get(data_key):
+                break
+            for run in response_body[data_key]:
+                yield run
+            cursors = response_body.get("cursors")
+            if not cursors:
+                break
+            if not cursors.get("next"):
+                break
+            params_["cursor"] = cursors["next"]
+
+    async def create_run(
+        self,
+        name: str,
+        inputs: Dict[str, Any],
+        run_type: str,
+        *,
+        project_name: Optional[str] = None,
+        revision_id: Optional[ls_client.ID_TYPE] = None,
+        **kwargs: Any,
+    ) -> None:
+        """Create a run."""
+        run_create = {
+            "name": name,
+            "id":
kwargs.get("id") or uuid.uuid4(), + "inputs": inputs, + "run_type": run_type, + "session_name": project_name or ls_utils.get_tracer_project(), + "revision_id": revision_id, + **kwargs, + } + await self._arequest_with_retries( + "POST", "/runs", content=ls_client._dumps_json(run_create) + ) + + async def update_run( + self, + run_id: ls_client.ID_TYPE, + **kwargs: Any, + ) -> None: + """Update a run.""" + data = {**kwargs, "id": ls_client._as_uuid(run_id)} + await self._arequest_with_retries( + "PATCH", + f"/runs/{ls_client._as_uuid(run_id)}", + content=ls_client._dumps_json(data), + ) + + async def read_run(self, run_id: ls_client.ID_TYPE) -> ls_schemas.Run: + """Read a run.""" + response = await self._arequest_with_retries( + "GET", + f"/runs/{ls_client._as_uuid(run_id)}", + ) + return ls_schemas.Run(**response.json()) + + async def list_runs( + self, + *, + project_id: Optional[ + Union[ls_client.ID_TYPE, Sequence[ls_client.ID_TYPE]] + ] = None, + project_name: Optional[Union[str, Sequence[str]]] = None, + run_type: Optional[str] = None, + trace_id: Optional[ls_client.ID_TYPE] = None, + reference_example_id: Optional[ls_client.ID_TYPE] = None, + query: Optional[str] = None, + filter: Optional[str] = None, + trace_filter: Optional[str] = None, + tree_filter: Optional[str] = None, + is_root: Optional[bool] = None, + parent_run_id: Optional[ls_client.ID_TYPE] = None, + start_time: Optional[datetime.datetime] = None, + error: Optional[bool] = None, + run_ids: Optional[Sequence[ls_client.ID_TYPE]] = None, + select: Optional[Sequence[str]] = None, + limit: Optional[int] = None, + **kwargs: Any, + ) -> AsyncIterator[ls_schemas.Run]: + """List runs from the LangSmith API. + + Parameters + ---------- + project_id : UUID or None, default=None + The ID(s) of the project to filter by. + project_name : str or None, default=None + The name(s) of the project to filter by. + run_type : str or None, default=None + The type of the runs to filter by. + trace_id : UUID or None, default=None + The ID of the trace to filter by. + reference_example_id : UUID or None, default=None + The ID of the reference example to filter by. + query : str or None, default=None + The query string to filter by. + filter : str or None, default=None + The filter string to filter by. + trace_filter : str or None, default=None + Filter to apply to the ROOT run in the trace tree. This is meant to + be used in conjunction with the regular `filter` parameter to let you + filter runs by attributes of the root run within a trace. + tree_filter : str or None, default=None + Filter to apply to OTHER runs in the trace tree, including + sibling and child runs. This is meant to be used in conjunction with + the regular `filter` parameter to let you filter runs by attributes + of any run within a trace. + is_root : bool or None, default=None + Whether to filter by root runs. + parent_run_id : UUID or None, default=None + The ID of the parent run to filter by. + start_time : datetime or None, default=None + The start time to filter by. + error : bool or None, default=None + Whether to filter by error status. + run_ids : List[str or UUID] or None, default=None + The IDs of the runs to filter by. + limit : int or None, default=None + The maximum number of runs to return. + **kwargs : Any + Additional keyword arguments. + + Yields: + ------ + Run + The runs. + + Examples: + -------- + .. 
code-block:: python + + # List all runs in a project + project_runs = client.list_runs(project_name="") + + # List LLM and Chat runs in the last 24 hours + todays_llm_runs = client.list_runs( + project_name="", + start_time=datetime.now() - timedelta(days=1), + run_type="llm", + ) + + # List root traces in a project + root_runs = client.list_runs(project_name="", is_root=1) + + # List runs without errors + correct_runs = client.list_runs(project_name="", error=False) + + # List runs and only return their inputs/outputs (to speed up the query) + input_output_runs = client.list_runs( + project_name="", select=["inputs", "outputs"] + ) + + # List runs by run ID + run_ids = [ + "a36092d2-4ad5-4fb4-9c0d-0dba9a2ed836", + "9398e6be-964f-4aa4-8ae9-ad78cd4b7074", + ] + selected_runs = client.list_runs(id=run_ids) + + # List all "chain" type runs that took more than 10 seconds and had + # `total_tokens` greater than 5000 + chain_runs = client.list_runs( + project_name="", + filter='and(eq(run_type, "chain"), gt(latency, 10), gt(total_tokens, 5000))', + ) + + # List all runs called "extractor" whose root of the trace was assigned feedback "user_score" score of 1 + good_extractor_runs = client.list_runs( + project_name="", + filter='eq(name, "extractor")', + trace_filter='and(eq(feedback_key, "user_score"), eq(feedback_score, 1))', + ) + + # List all runs that started after a specific timestamp and either have "error" not equal to null or a "Correctness" feedback score equal to 0 + complex_runs = client.list_runs( + project_name="", + filter='and(gt(start_time, "2023-07-15T12:34:56Z"), or(neq(error, null), and(eq(feedback_key, "Correctness"), eq(feedback_score, 0.0))))', + ) + + # List all runs where `tags` include "experimental" or "beta" and `latency` is greater than 2 seconds + tagged_runs = client.list_runs( + project_name="", + filter='and(or(has(tags, "experimental"), has(tags, "beta")), gt(latency, 2))', + ) + """ # noqa: E501 + project_ids = [] + if isinstance(project_id, (uuid.UUID, str)): + project_ids.append(project_id) + elif isinstance(project_id, list): + project_ids.extend(project_id) + if project_name is not None: + if isinstance(project_name, str): + project_name = [project_name] + projects = await asyncio.gather( + *[self.read_project(project_name=name) for name in project_name] + ) + project_ids.extend([project.id for project in projects]) + + body_query: Dict[str, Any] = { + "session": project_ids if project_ids else None, + "run_type": run_type, + "reference_example": ( + [reference_example_id] if reference_example_id else None + ), + "query": query, + "filter": filter, + "trace_filter": trace_filter, + "tree_filter": tree_filter, + "is_root": is_root, + "parent_run": parent_run_id, + "start_time": start_time.isoformat() if start_time else None, + "error": error, + "id": run_ids, + "trace": trace_id, + "select": select, + **kwargs, + } + if project_ids: + body_query["session"] = [ + str(ls_client._as_uuid(id_)) for id_ in project_ids + ] + body = {k: v for k, v in body_query.items() if v is not None} + ix = 0 + async for run in self._aget_cursor_paginated_list("/runs/query", body=body): + yield ls_schemas.Run(**run) + ix += 1 + if limit is not None and ix >= limit: + break + + async def create_project( + self, + project_name: str, + **kwargs: Any, + ) -> ls_schemas.TracerSession: + """Create a project.""" + data = {"name": project_name, **kwargs} + response = await self._arequest_with_retries( + "POST", "/sessions", content=ls_client._dumps_json(data) + ) + return 
ls_schemas.TracerSession(**response.json()) + + async def read_project( + self, + project_name: Optional[str] = None, + project_id: Optional[ls_client.ID_TYPE] = None, + ) -> ls_schemas.TracerSession: + """Read a project.""" + if project_id: + response = await self._arequest_with_retries( + "GET", f"/sessions/{ls_client._as_uuid(project_id)}" + ) + elif project_name: + response = await self._arequest_with_retries( + "GET", "/sessions", params={"name": project_name} + ) + else: + raise ValueError("Either project_name or project_id must be provided") + + data = response.json() + if isinstance(data, list): + if not data: + raise ls_utils.LangSmithNotFoundError( + f"Project {project_name} not found" + ) + return ls_schemas.TracerSession(**data[0]) + return ls_schemas.TracerSession(**data) + + async def delete_project( + self, *, project_name: Optional[str] = None, project_id: Optional[str] = None + ) -> None: + """Delete a project from LangSmith. + + Parameters + ---------- + project_name : str or None, default=None + The name of the project to delete. + project_id : str or None, default=None + The ID of the project to delete. + """ + if project_id is None and project_name is None: + raise ValueError("Either project_name or project_id must be provided") + if project_id is None: + project = await self.read_project(project_name=project_name) + project_id = str(project.id) + if not project_id: + raise ValueError("Project not found") + await self._arequest_with_retries( + "DELETE", + f"/sessions/{ls_client._as_uuid(project_id)}", + ) + + async def create_dataset( + self, + dataset_name: str, + **kwargs: Any, + ) -> ls_schemas.Dataset: + """Create a dataset.""" + data = {"name": dataset_name, **kwargs} + response = await self._arequest_with_retries( + "POST", "/datasets", content=ls_client._dumps_json(data) + ) + return ls_schemas.Dataset(**response.json()) + + async def read_dataset( + self, + dataset_name: Optional[str] = None, + dataset_id: Optional[ls_client.ID_TYPE] = None, + ) -> ls_schemas.Dataset: + """Read a dataset.""" + if dataset_id: + response = await self._arequest_with_retries( + "GET", f"/datasets/{ls_client._as_uuid(dataset_id)}" + ) + elif dataset_name: + response = await self._arequest_with_retries( + "GET", "/datasets", params={"name": dataset_name} + ) + else: + raise ValueError("Either dataset_name or dataset_id must be provided") + + data = response.json() + if isinstance(data, list): + if not data: + raise ls_utils.LangSmithNotFoundError( + f"Dataset {dataset_name} not found" + ) + return ls_schemas.Dataset(**data[0]) + return ls_schemas.Dataset(**data) + + async def delete_dataset(self, dataset_id: ls_client.ID_TYPE) -> None: + """Delete a dataset.""" + await self._arequest_with_retries( + "DELETE", + f"/datasets/{ls_client._as_uuid(dataset_id)}", + ) + + async def list_datasets( + self, + **kwargs: Any, + ) -> AsyncIterator[ls_schemas.Dataset]: + """List datasets.""" + async for dataset in self._aget_paginated_list("/datasets", params=kwargs): + yield ls_schemas.Dataset(**dataset) + + async def create_example( + self, + inputs: Dict[str, Any], + outputs: Optional[Dict[str, Any]] = None, + dataset_id: Optional[ls_client.ID_TYPE] = None, + dataset_name: Optional[str] = None, + **kwargs: Any, + ) -> ls_schemas.Example: + """Create an example.""" + if dataset_id is None and dataset_name is None: + raise ValueError("Either dataset_id or dataset_name must be provided") + if dataset_id is None: + dataset = await self.read_dataset(dataset_name=dataset_name) + dataset_id = 
dataset.id + + data = { + "inputs": inputs, + "outputs": outputs, + "dataset_id": str(dataset_id), + **kwargs, + } + response = await self._arequest_with_retries( + "POST", "/examples", content=ls_client._dumps_json(data) + ) + return ls_schemas.Example(**response.json()) + + async def read_example(self, example_id: ls_client.ID_TYPE) -> ls_schemas.Example: + """Read an example.""" + response = await self._arequest_with_retries( + "GET", f"/examples/{ls_client._as_uuid(example_id)}" + ) + return ls_schemas.Example(**response.json()) + + async def list_examples( + self, + *, + dataset_id: Optional[ls_client.ID_TYPE] = None, + dataset_name: Optional[str] = None, + **kwargs: Any, + ) -> AsyncIterator[ls_schemas.Example]: + """List examples.""" + params = kwargs.copy() + if dataset_id: + params["dataset"] = ls_client._as_uuid(dataset_id) + elif dataset_name: + dataset = await self.read_dataset(dataset_name=dataset_name) + params["dataset"] = dataset.id + + async for example in self._aget_paginated_list("/examples", params=params): + yield ls_schemas.Example(**example) + + async def create_feedback( + self, + run_id: Optional[ls_client.ID_TYPE], + key: str, + score: Optional[float] = None, + value: Optional[Any] = None, + comment: Optional[str] = None, + **kwargs: Any, + ) -> ls_schemas.Feedback: + """Create feedback.""" + data = { + "run_id": ls_client._ensure_uuid(run_id, accept_null=True), + "key": key, + "score": score, + "value": value, + "comment": comment, + **kwargs, + } + response = await self._arequest_with_retries( + "POST", "/feedback", content=ls_client._dumps_json(data) + ) + return ls_schemas.Feedback(**response.json()) + + async def read_feedback( + self, feedback_id: ls_client.ID_TYPE + ) -> ls_schemas.Feedback: + """Read feedback.""" + response = await self._arequest_with_retries( + "GET", f"/feedback/{ls_client._as_uuid(feedback_id)}" + ) + return ls_schemas.Feedback(**response.json()) + + async def list_feedback( + self, + *, + run_ids: Optional[Sequence[ls_client.ID_TYPE]] = None, + feedback_key: Optional[Sequence[str]] = None, + feedback_source_type: Optional[Sequence[ls_schemas.FeedbackSourceType]] = None, + limit: Optional[int] = None, + **kwargs: Any, + ) -> AsyncIterator[ls_schemas.Feedback]: + """List feedback.""" + params = { + "run": ( + [str(ls_client._as_uuid(id_)) for id_ in run_ids] if run_ids else None + ), + "limit": min(limit, 100) if limit is not None else 100, + **kwargs, + } + if feedback_key is not None: + params["key"] = feedback_key + if feedback_source_type is not None: + params["source"] = feedback_source_type + ix = 0 + async for feedback in self._aget_paginated_list("/feedback", params=params): + yield ls_schemas.Feedback(**feedback) + ix += 1 + if limit is not None and ix >= limit: + break + + @ls_beta.warn_beta + async def index_dataset( + self, + *, + dataset_id: ls_client.ID_TYPE, + tag: str = "latest", + **kwargs: Any, + ) -> None: + """Enable dataset indexing. Examples are indexed by their inputs. + + This enables searching for similar examples by inputs with + ``client.similar_examples()``. + + Args: + dataset_id (UUID): The ID of the dataset to index. + tag (str, optional): The version of the dataset to index. If 'latest' + then any updates to the dataset (additions, updates, deletions of + examples) will be reflected in the index. 
+ + Returns: + None + + Raises: + requests.HTTPError + """ # noqa: E501 + dataset_id = ls_client._as_uuid(dataset_id, "dataset_id") + resp = await self._arequest_with_retries( + "POST", + f"/datasets/{dataset_id}/index", + content=ls_client._dumps_json({"tag": tag, **kwargs}), + ) + ls_utils.raise_for_status_with_text(resp) + + @ls_beta.warn_beta + async def similar_examples( + self, + inputs: dict, + /, + *, + limit: int, + dataset_id: ls_client.ID_TYPE, + **kwargs: Any, + ) -> List[ls_schemas.ExampleSearch]: + r"""Retrieve the dataset examples whose inputs best match the current inputs. + + **Note**: Must have few-shot indexing enabled for the dataset. See + ``client.index_dataset()``. + + Args: + inputs (dict): The inputs to use as a search query. Must match the dataset + input schema. Must be JSON serializable. + limit (int): The maximum number of examples to return. + dataset_id (str or UUID): The ID of the dataset to search over. + kwargs (Any): Additional keyword args to pass as part of request body. + + Returns: + List of ExampleSearch objects. + + Example: + .. code-block:: python + + from langsmith import Client + + client = Client() + await client.similar_examples( + {"question": "When would i use the runnable generator"}, + limit=3, + dataset_id="...", + ) + + .. code-block:: pycon + + [ + ExampleSearch( + inputs={'question': 'How do I cache a Chat model? What caches can I use?'}, + outputs={'answer': 'You can use LangChain\'s caching layer for Chat Models. This can save you money by reducing the number of API calls you make to the LLM provider, if you\'re often requesting the same completion multiple times, and speed up your application.\n\n```python\n\nfrom langchain.cache import InMemoryCache\nlangchain.llm_cache = InMemoryCache()\n\n# The first time, it is not yet in cache, so it should take longer\nllm.predict(\'Tell me a joke\')\n\n```\n\nYou can also use SQLite Cache which uses a SQLite database:\n\n```python\n rm .langchain.db\n\nfrom langchain.cache import SQLiteCache\nlangchain.llm_cache = SQLiteCache(database_path=".langchain.db")\n\n# The first time, it is not yet in cache, so it should take longer\nllm.predict(\'Tell me a joke\') \n```\n'}, + metadata=None, + id=UUID('b2ddd1c4-dff6-49ae-8544-f48e39053398'), + dataset_id=UUID('01b6ce0f-bfb6-4f48-bbb8-f19272135d40') + ), + ExampleSearch( + inputs={'question': "What's a runnable lambda?"}, + outputs={'answer': "A runnable lambda is an object that implements LangChain's `Runnable` interface and runs a callbale (i.e., a function). Note the function must accept a single argument."}, + metadata=None, + id=UUID('f94104a7-2434-4ba7-8293-6a283f4860b4'), + dataset_id=UUID('01b6ce0f-bfb6-4f48-bbb8-f19272135d40') + ), + ExampleSearch( + inputs={'question': 'Show me how to use RecursiveURLLoader'}, + outputs={'answer': 'The RecursiveURLLoader comes from the langchain.document_loaders.recursive_url_loader module. Here\'s an example of how to use it:\n\n```python\nfrom langchain.document_loaders.recursive_url_loader import RecursiveUrlLoader\n\n# Create an instance of RecursiveUrlLoader with the URL you want to load\nloader = RecursiveUrlLoader(url="https://example.com")\n\n# Load all child links from the URL page\nchild_links = loader.load()\n\n# Print the child links\nfor link in child_links:\n print(link)\n```\n\nMake sure to replace "https://example.com" with the actual URL you want to load. The load() method returns a list of child links found on the URL page. 
You can iterate over this list to access each child link.'}, + metadata=None, + id=UUID('0308ea70-a803-4181-a37d-39e95f138f8c'), + dataset_id=UUID('01b6ce0f-bfb6-4f48-bbb8-f19272135d40') + ), + ] + + """ # noqa: E501 + dataset_id = ls_client._as_uuid(dataset_id, "dataset_id") + resp = await self._arequest_with_retries( + "POST", + f"/datasets/{dataset_id}/search", + content=ls_client._dumps_json({"inputs": inputs, "limit": limit, **kwargs}), + ) + ls_utils.raise_for_status_with_text(resp) + examples = [] + for ex in resp.json()["examples"]: + examples.append(ls_schemas.ExampleSearch(**ex, dataset_id=dataset_id)) + return examples diff --git a/python/langsmith/client.py b/python/langsmith/client.py index 740bd1581..4c0d378b7 100644 --- a/python/langsmith/client.py +++ b/python/langsmith/client.py @@ -355,38 +355,6 @@ def _get_tracing_sampling_rate() -> float | None: return sampling_rate -def _get_env(var_names: Sequence[str], default: Optional[str] = None) -> Optional[str]: - for var_name in var_names: - var = os.getenv(var_name) - if var is not None: - return var - return default - - -def _get_api_key(api_key: Optional[str]) -> Optional[str]: - api_key_ = ( - api_key - if api_key is not None - else _get_env(("LANGSMITH_API_KEY", "LANGCHAIN_API_KEY")) - ) - if api_key_ is None or not api_key_.strip(): - return None - return api_key_.strip().strip('"').strip("'") - - -def _get_api_url(api_url: Optional[str]) -> str: - _api_url = api_url or cast( - str, - _get_env( - ("LANGSMITH_ENDPOINT", "LANGCHAIN_ENDPOINT"), - "https://api.smith.langchain.com", - ), - ) - if not _api_url.strip(): - raise ls_utils.LangSmithUserError("LangSmith API URL cannot be empty") - return _api_url.strip().strip('"').strip("'").rstrip("/") - - def _get_write_api_urls(_write_api_urls: Optional[Dict[str, str]]) -> Dict[str, str]: _write_api_urls = _write_api_urls or json.loads( os.getenv("LANGSMITH_RUNS_ENDPOINTS", "{}") @@ -563,8 +531,8 @@ def __init__( self.api_url = next(iter(self._write_api_urls)) self.api_key: Optional[str] = self._write_api_urls[self.api_url] else: - self.api_url = _get_api_url(api_url) - self.api_key = _get_api_key(api_key) + self.api_url = ls_utils.get_api_url(api_url) + self.api_key = ls_utils.get_api_key(api_key) _validate_api_key_if_hosted(self.api_url, self.api_key) self._write_api_urls = {self.api_url: self.api_key} self.retry_config = retry_config or _default_retry_config() diff --git a/python/langsmith/utils.py b/python/langsmith/utils.py index 0d3552dcc..c28b23c38 100644 --- a/python/langsmith/utils.py +++ b/python/langsmith/utils.py @@ -32,6 +32,7 @@ cast, ) +import httpx import requests from typing_extensions import ParamSpec from urllib3.util import Retry @@ -123,13 +124,18 @@ def wrapper(*args: Any, **kwargs: Any) -> Any: return decorator -def raise_for_status_with_text(response: requests.Response) -> None: +def raise_for_status_with_text( + response: Union[requests.Response, httpx.Response], +) -> None: """Raise an error with the response text.""" try: response.raise_for_status() except requests.HTTPError as e: raise requests.HTTPError(str(e), response.text) from e # type: ignore[call-arg] + except httpx.HTTPError as e: + raise httpx.HTTPError(str(e), response.text) from e # type: ignore[call-arg] + def get_enum_value(enu: Union[enum.Enum, str]) -> str: """Get the value of a string enum.""" @@ -687,3 +693,25 @@ def _wrapped_fn(*args: Any) -> T: timeout=timeout, chunksize=chunksize, ) + + +def get_api_url(api_url: Optional[str]) -> str: + """Get the LangSmith API URL from the 
environment or the given value.""" + _api_url = api_url or cast( + str, + get_env_var( + "ENDPOINT", + default="https://api.smith.langchain.com", + ), + ) + if not _api_url.strip(): + raise LangSmithUserError("LangSmith API URL cannot be empty") + return _api_url.strip().strip('"').strip("'").rstrip("/") + + +def get_api_key(api_key: Optional[str]) -> Optional[str]: + """Get the API key from the environment or the given value.""" + api_key_ = api_key if api_key is not None else get_env_var("API_KEY", default=None) + if api_key_ is None or not api_key_.strip(): + return None + return api_key_.strip().strip('"').strip("'") diff --git a/python/poetry.lock b/python/poetry.lock index 3d4d1374c..6e1a324ec 100644 --- a/python/poetry.lock +++ b/python/poetry.lock @@ -790,13 +790,13 @@ files = [ [[package]] name = "openai" -version = "1.40.3" +version = "1.41.1" description = "The official Python library for the openai API" optional = false python-versions = ">=3.7.1" files = [ - {file = "openai-1.40.3-py3-none-any.whl", hash = "sha256:09396cb6e2e15c921a5d872bf92841a60a9425da10dcd962b45fe7c4f48f8395"}, - {file = "openai-1.40.3.tar.gz", hash = "sha256:f2ffe907618240938c59d7ccc67dd01dc8c50be203c0077240db6758d2f02480"}, + {file = "openai-1.41.1-py3-none-any.whl", hash = "sha256:56fb04105263f79559aff3ceea2e1dd16f8c5385e8238cb66cf0e6888fa8bfcf"}, + {file = "openai-1.41.1.tar.gz", hash = "sha256:e38e376efd91e0d4db071e2a6517b6b4cac1c2a6fd63efdc5ec6be10c5967c1b"}, ] [package.dependencies] @@ -1843,4 +1843,4 @@ vcr = [] [metadata] lock-version = "2.0" python-versions = ">=3.8.1,<4.0" -content-hash = "e062da3051244f0d59796d6659149eee4e2f46d9332714d57edd459c80b7d8cd" +content-hash = "546941bdd68403dda7ee3a67954b3741133c4f80a1a9a810ff450959278021d0" diff --git a/python/pyproject.toml b/python/pyproject.toml index 1242fb6d7..1e3462dc8 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "langsmith" -version = "0.1.99" +version = "0.1.100" description = "Client library to connect to the LangSmith LLM Tracing and Evaluation Platform." 
authors = ["LangChain "] license = "MIT" @@ -32,6 +32,7 @@ pydantic = [ ] requests = "^2" orjson = "^3.9.14" +httpx = ">=0.23.0,<1" [tool.poetry.group.dev.dependencies] pytest = "^7.3.1" diff --git a/python/tests/integration_tests/test_async_client.py b/python/tests/integration_tests/test_async_client.py new file mode 100644 index 000000000..5d914a5da --- /dev/null +++ b/python/tests/integration_tests/test_async_client.py @@ -0,0 +1,243 @@ +import asyncio +import datetime +import uuid + +import pytest +from pydantic import BaseModel + +from langsmith import utils as ls_utils +from langsmith.async_client import AsyncClient +from langsmith.schemas import DataType, Run + + +@pytest.mark.asyncio +async def test_indexed_datasets(): + class InputsSchema(BaseModel): + name: str # type: ignore[annotation-unchecked] + age: int # type: ignore[annotation-unchecked] + + async with AsyncClient() as client: + # Create a new dataset + try: + dataset = await client.create_dataset( + "test_dataset_for_integration_tests_" + uuid.uuid4().hex, + inputs_schema_definition=InputsSchema.model_json_schema(), + ) + + example = await client.create_example( + inputs={"name": "Alice", "age": 30}, + outputs={"hi": "hello"}, + dataset_id=dataset.id, + ) + + await client.index_dataset(dataset_id=dataset.id) + + async def check_similar_examples(): + examples = await client.similar_examples( + {"name": "Alice", "age": 30}, dataset_id=dataset.id, limit=1 + ) + return len(examples) == 1 + + await wait_for(check_similar_examples, timeout=20) + examples = await client.similar_examples( + {"name": "Alice", "age": 30}, dataset_id=dataset.id, limit=1 + ) + assert examples[0].id == example.id + finally: + await client.delete_dataset(dataset_id=dataset.id) + + +# Helper function to wait for a condition +async def wait_for(condition, timeout=10): + start_time = asyncio.get_event_loop().time() + while True: + try: + if await condition(): + return + except Exception: + if asyncio.get_event_loop().time() - start_time > timeout: + raise TimeoutError("Condition not met within the timeout period") + await asyncio.sleep(0.1) + + +@pytest.fixture +async def async_client(): + client = AsyncClient() + yield client + await client.aclose() + + +@pytest.mark.asyncio +async def test_create_run(async_client: AsyncClient): + project_name = "__test_create_run" + uuid.uuid4().hex[:8] + run_id = uuid.uuid4() + + await async_client.create_run( + name="test_run", + inputs={"input": "hello"}, + run_type="llm", + project_name=project_name, + id=run_id, + start_time=datetime.datetime.now(datetime.timezone.utc), + ) + + async def check_run(): + try: + run = await async_client.read_run(run_id) + return run.name == "test_run" + except ls_utils.LangSmithError: + return False + + await wait_for(check_run) + run = await async_client.read_run(run_id) + assert run.name == "test_run" + assert run.inputs == {"input": "hello"} + + +@pytest.mark.asyncio +async def test_list_runs(async_client: AsyncClient): + project_name = "__test_list_runs" + run_ids = [uuid.uuid4() for _ in range(3)] + meta_uid = str(uuid.uuid4()) + + for i, run_id in enumerate(run_ids): + await async_client.create_run( + name=f"test_run_{i}", + inputs={"input": f"hello_{i}"}, + run_type="llm", + project_name=project_name, + id=run_id, + start_time=datetime.datetime.now(datetime.timezone.utc), + end_time=datetime.datetime.now(datetime.timezone.utc), + extra={"metadata": {"uid": meta_uid}}, + ) + + filter_ = f'and(eq(metadata_key, "uid"), eq(metadata_value, "{meta_uid}"))' + + async def check_runs(): 
+ runs = [ + run + async for run in async_client.list_runs( + project_name=project_name, filter=filter_ + ) + ] + return len(runs) == 3 + + await wait_for(check_runs) + + runs = [ + run + async for run in async_client.list_runs( + project_name=project_name, filter=filter_ + ) + ] + assert len(runs) == 3 + assert all(isinstance(run, Run) for run in runs) + + +@pytest.mark.asyncio +async def test_create_dataset(async_client: AsyncClient): + dataset_name = "__test_create_dataset" + uuid.uuid4().hex[:8] + + dataset = await async_client.create_dataset(dataset_name, data_type=DataType.kv) + + assert dataset.name == dataset_name + assert dataset.data_type == DataType.kv + + await async_client.delete_dataset(dataset_id=dataset.id) + + +@pytest.mark.asyncio +async def test_create_example(async_client: AsyncClient): + dataset_name = "__test_create_example" + uuid.uuid4().hex[:8] + dataset = await async_client.create_dataset(dataset_name) + + example = await async_client.create_example( + inputs={"input": "hello"}, outputs={"output": "world"}, dataset_id=dataset.id + ) + + assert example.inputs == {"input": "hello"} + assert example.outputs == {"output": "world"} + + await async_client.delete_dataset(dataset_id=dataset.id) + + +@pytest.mark.asyncio +async def test_list_examples(async_client: AsyncClient): + dataset_name = "__test_list_examples" + uuid.uuid4().hex[:8] + dataset = await async_client.create_dataset(dataset_name) + + for i in range(3): + await async_client.create_example( + inputs={"input": f"hello_{i}"}, + outputs={"output": f"world_{i}"}, + dataset_id=dataset.id, + ) + + examples = [ + example async for example in async_client.list_examples(dataset_id=dataset.id) + ] + assert len(examples) == 3 + + await async_client.delete_dataset(dataset_id=dataset.id) + + +@pytest.mark.asyncio +async def test_create_feedback(async_client: AsyncClient): + project_name = "__test_create_feedback" + uuid.uuid4().hex[:8] + run_id = uuid.uuid4() + + await async_client.create_run( + name="test_run", + inputs={"input": "hello"}, + run_type="llm", + project_name=project_name, + id=run_id, + start_time=datetime.datetime.now(datetime.timezone.utc), + ) + + feedback = await async_client.create_feedback( + run_id=run_id, + key="test_key", + score=0.9, + value="test_value", + comment="test_comment", + ) + + assert feedback.run_id == run_id + assert feedback.key == "test_key" + assert feedback.score == 0.9 + assert feedback.value == "test_value" + assert feedback.comment == "test_comment" + + +@pytest.mark.asyncio +async def test_list_feedback(async_client: AsyncClient): + project_name = "__test_list_feedback" + run_id = uuid.uuid4() + + await async_client.create_run( + name="test_run", + inputs={"input": "hello"}, + run_type="llm", + project_name=project_name, + id=run_id, + start_time=datetime.datetime.now(datetime.timezone.utc), + ) + + for i in range(3): + await async_client.create_feedback( + run_id=run_id, + key=f"test_key_{i}", + score=0.9, + value=f"test_value_{i}", + comment=f"test_comment_{i}", + ) + + async def check_feedbacks(): + feedbacks = [ + feedback async for feedback in async_client.list_feedback(run_ids=[run_id]) + ] + return len(feedbacks) == 3 + + await wait_for(check_feedbacks, timeout=10) diff --git a/python/tests/unit_tests/test_client.py b/python/tests/unit_tests/test_client.py index c60afa702..ed8159804 100644 --- a/python/tests/unit_tests/test_client.py +++ b/python/tests/unit_tests/test_client.py @@ -33,8 +33,6 @@ from langsmith.client import ( Client, _dumps_json, - _get_api_key, - 
_get_api_url, _is_langchain_hosted, _is_localhost, _serialize_json, @@ -260,40 +258,6 @@ def test_async_methods() -> None: ) -def test_get_api_key() -> None: - assert _get_api_key("provided_api_key") == "provided_api_key" - assert _get_api_key("'provided_api_key'") == "provided_api_key" - assert _get_api_key('"_provided_api_key"') == "_provided_api_key" - - with patch.dict("os.environ", {"LANGCHAIN_API_KEY": "env_api_key"}, clear=True): - assert _get_api_key(None) == "env_api_key" - - with patch.dict("os.environ", {}, clear=True): - assert _get_api_key(None) is None - - assert _get_api_key("") is None - assert _get_api_key(" ") is None - - -def test_get_api_url() -> None: - assert _get_api_url("http://provided.url") == "http://provided.url" - - with patch.dict("os.environ", {"LANGCHAIN_ENDPOINT": "http://env.url"}): - assert _get_api_url(None) == "http://env.url" - - with patch.dict("os.environ", {}, clear=True): - assert _get_api_url(None) == "https://api.smith.langchain.com" - - with patch.dict("os.environ", {}, clear=True): - assert _get_api_url(None) == "https://api.smith.langchain.com" - - with patch.dict("os.environ", {"LANGCHAIN_ENDPOINT": "http://env.url"}): - assert _get_api_url(None) == "http://env.url" - - with pytest.raises(ls_utils.LangSmithUserError): - _get_api_url(" ") - - def test_create_run_unicode() -> None: inputs = { "foo": "これは私の友達です", diff --git a/python/tests/unit_tests/test_utils.py b/python/tests/unit_tests/test_utils.py index 8fd493478..9db646aae 100644 --- a/python/tests/unit_tests/test_utils.py +++ b/python/tests/unit_tests/test_utils.py @@ -311,3 +311,37 @@ def test_parse_prompt_identifier(): assert False, f"Expected ValueError for identifier: {invalid_id}" except ValueError: pass # This is the expected behavior + + +def test_get_api_key() -> None: + assert ls_utils.get_api_key("provided_api_key") == "provided_api_key" + assert ls_utils.get_api_key("'provided_api_key'") == "provided_api_key" + assert ls_utils.get_api_key('"_provided_api_key"') == "_provided_api_key" + + with patch.dict("os.environ", {"LANGCHAIN_API_KEY": "env_api_key"}, clear=True): + assert ls_utils.get_api_key(None) == "env_api_key" + + with patch.dict("os.environ", {}, clear=True): + assert ls_utils.get_api_key(None) is None + + assert ls_utils.get_api_key("") is None + assert ls_utils.get_api_key(" ") is None + + +def test_get_api_url() -> None: + assert ls_utils.get_api_url("http://provided.url") == "http://provided.url" + + with patch.dict("os.environ", {"LANGCHAIN_ENDPOINT": "http://env.url"}): + assert ls_utils.get_api_url(None) == "http://env.url" + + with patch.dict("os.environ", {}, clear=True): + assert ls_utils.get_api_url(None) == "https://api.smith.langchain.com" + + with patch.dict("os.environ", {}, clear=True): + assert ls_utils.get_api_url(None) == "https://api.smith.langchain.com" + + with patch.dict("os.environ", {"LANGCHAIN_ENDPOINT": "http://env.url"}): + assert ls_utils.get_api_url(None) == "http://env.url" + + with pytest.raises(ls_utils.LangSmithUserError): + ls_utils.get_api_url(" ")
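
Usage sketch for the AsyncClient introduced in this patch — a non-authoritative example that assumes LANGSMITH_API_KEY (or LANGCHAIN_API_KEY) is set in the environment; the project name is a placeholder. Note that list_runs is an async generator, so it is consumed with `async for`, and `id`/`start_time` are forwarded through **kwargs just as in the integration tests above.

import asyncio
import datetime
import uuid

from langsmith import AsyncClient


async def main() -> None:
    # The client reads the API key and endpoint from the environment
    # when api_key / api_url are not passed explicitly.
    async with AsyncClient() as client:
        run_id = uuid.uuid4()
        await client.create_run(
            name="example_run",
            inputs={"prompt": "hello"},
            run_type="llm",
            project_name="async-client-demo",  # placeholder project name
            id=run_id,
            start_time=datetime.datetime.now(datetime.timezone.utc),
        )
        await client.update_run(
            run_id,
            outputs={"completion": "hi there"},
            end_time=datetime.datetime.now(datetime.timezone.utc),
        )
        await client.create_feedback(run_id, "user_score", score=1.0)

        # list_runs is an async generator, so iterate with `async for`.
        async for run in client.list_runs(
            project_name="async-client-demo", run_type="llm", limit=5
        ):
            print(run.id, run.name)


asyncio.run(main())

A second sketch covers the beta few-shot flow (index_dataset + similar_examples), modeled on test_indexed_datasets above; the dataset name and inputs schema are placeholders, pydantic v2 is assumed for model_json_schema(), and a fixed sleep stands in for the test's wait_for() helper since indexing is not immediate.

import asyncio
import uuid

from pydantic import BaseModel

from langsmith import AsyncClient


class InputsSchema(BaseModel):
    question: str


async def search_demo() -> None:
    async with AsyncClient() as client:
        dataset = await client.create_dataset(
            "fewshot_demo_" + uuid.uuid4().hex,  # placeholder dataset name
            inputs_schema_definition=InputsSchema.model_json_schema(),
        )
        try:
            await client.create_example(
                inputs={"question": "What is LangSmith?"},
                outputs={"answer": "An LLM tracing and evaluation platform."},
                dataset_id=dataset.id,
            )
            # Both calls below are beta and emit a LangSmithBetaWarning.
            await client.index_dataset(dataset_id=dataset.id)
            await asyncio.sleep(15)  # crude stand-in for the test's polling
            examples = await client.similar_examples(
                {"question": "What is LangSmith used for?"},
                dataset_id=dataset.id,
                limit=1,
            )
            print([e.inputs for e in examples])
        finally:
            await client.delete_dataset(dataset_id=dataset.id)


asyncio.run(search_demo())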