diff --git a/docusaurus.config.js b/docusaurus.config.js index d496858db..2aa88501f 100644 --- a/docusaurus.config.js +++ b/docusaurus.config.js @@ -46,12 +46,6 @@ const config = { label: "stable", badge: false, }, - old: { - label: "old", - banner: "unmaintained", - badge: false, - path: "old", - }, }, sidebarPath: require.resolve("./sidebars.js"), remarkPlugins: [ diff --git a/vercel.json b/vercel.json index e105ac49a..3e57e5c27 100644 --- a/vercel.json +++ b/vercel.json @@ -2,89 +2,37 @@ "cleanUrls": true, "trailingSlash": false, "redirects": [ - { - "source": "/evaluation/custom-evaluators", - "destination": "/evaluation/faq/custom-evaluators" - }, { "source": "/category/tracing", - "destination": "/tracing" - }, - { - "source": "category/testing--evaluation", - "destination": "/evaluation" - }, - { - "source": "/category/langsmith-cookbook", - "destination": "/cookbook" - }, - { - "source": "/tracing/tracing-faq", - "destination": "/tracing/faq" - }, - { - "source": "/category/organizations", - "destination": "/" - }, - { - "source": "/organizations", - "destination": "/" + "destination": "/observability" }, { "source": "/category/organizations/:path*", "destination": ":path*" }, - { - "source": "/cookbook/testing-examples/prod-candidate-testing", - "destination": "/cookbook/testing-examples/backtesting" - }, { "source": "/evaluation/faq/datasets-client", - "destination": "/evaluation/faq/manage-datasets#how-to-manage-datasets-programmatically" + "destination": "/evaluation/how_to_guides/manage_datasets_programmatically" }, { "source": "/evaluation/faq/datasets-webapp", - "destination": "/evaluation/faq/manage-datasets" - }, - { - "source": "/overview", - "destination": "/" - }, - { - "source": "/docs/:path*", - "destination": "/:path*" + "destination": "/evaluation/how_to_guides/manage_datasets_in_application#manage-a-dataset" }, { "source": "/monitoring/:path*", - "destination": "/old/monitoring/:path*" - }, - { - "source": "/proxy/:path*", - "destination": "/old/proxy/:path*" + "destination": "/observability/how_to_guides#monitoring" }, { "source": "/tracing/:path*", - "destination": "/old/tracing/:path*" - }, - { - "source": "/cookbook/:path*", - "destination": "/old/cookbook/:path*" + "destination": "/observability" }, { "source": "/hub/:path*", - "destination": "/old/hub/:path*" - }, - { - "source": "/user_guide", - "destination": "/old/user_guide" + "destination": "/prompt_engineering/how_to_guides#prompt-hub" }, { "source": "/category/prompt-hub/:path*", - "destination": "/old/category/prompt-hub/:path*" - }, - { - "source": "/category/proxy/:path*", - "destination": "/old/category/proxy/:path*" + "destination": "/prompt_engineering/how_to_guides#prompt-hub" }, { "source": "/category/release-notes", @@ -92,47 +40,35 @@ }, { "source": "/how_to_guides/evaluation/:path*", - "destination": "/evaluation/how_to_guides/evaluation/:path*" + "destination": "/evaluation/how_to_guides/evaluation" }, { "source": "/how_to_guides/human_feedback/:path*", - "destination": "/evaluation/how_to_guides/human_feedback/:path*" + "destination": "/evaluation/how_to_guides#annotation-queues-and-human-feedback" }, { "source": "/how_to_guides/datasets/:path*", - "destination": "/evaluation/how_to_guides/datasets/:path*" + "destination": "/evaluation/how_to_guides#dataset-management" }, { "source": "/how_to_guides/monitoring/:path*", - "destination": "/observability/how_to_guides/monitoring/:path*" + "destination": "/observability/how_to_guides" }, { "source": "/how_to_guides/tracing/:path*", - 
"destination": "/observability/how_to_guides/tracing/:path*" + "destination": "/observability/how_to_guides" }, { "source": "/how_to_guides/prompts/:path*", - "destination": "/prompt_engineering/how_to_guides/prompts/:path*" + "destination": "/prompt_engineering/how_to_guides#prompt-hub" }, { "source": "/how_to_guides/playground/:path*", - "destination": "/prompt_engineering/how_to_guides/playground/:path*" + "destination": "/prompt_engineering/how_to_guides#playground" }, { "source": "/how_to_guides/setup/:path*", - "destination": "/administration/how_to_guides/organization_management/:path*" - }, - { - "source": "/how_to_guides", - "destination": "/" - }, - { - "source": "/concepts", - "destination": "/" - }, - { - "source": "/tutorials", - "destination": "/" + "destination": "/administration/how_to_guides/organization_management" }, { "source": "/concepts/admin:path*", @@ -156,7 +92,7 @@ }, { "source": "/pricing:path*", - "destination": "/pricing" + "destination": "https://www.langchain.com/pricing-langsmith" }, { "source": "/tutorials/Developers/observability", @@ -220,7 +156,7 @@ }, { "source": "/evaluation/how_to_guides/unit_testing(/?)", - "destination": "/evauation/how_to_guides/pytest" + "destination": "/evaluation/how_to_guides/pytest" }, { "source": "/observability/how_to_guides/tracing/:path*", diff --git a/versioned_docs/version-old/evaluation/_check.py b/versioned_docs/version-old/evaluation/_check.py deleted file mode 100644 index ea9e8fcba..000000000 --- a/versioned_docs/version-old/evaluation/_check.py +++ /dev/null @@ -1,23 +0,0 @@ -import re - -with open('quickstart.mdx', 'r') as file: - all_mdx_content = file.read() - -code_block_pattern = re.compile(r'content: `([^`]*)`', re.DOTALL) - -by_code_tabs = all_mdx_content.split(" dict: - reference = example.outputs["answer"] - prediction = run.outputs["output"] - score = prediction.lower() == reference.lower() - return {"key": "exact_match", "score": score} -``` - -Let's break this down: - -- The evaluator function accepts a `Run` and `Example` and returns a dictionary with the evaluation key and score. The run contains the full trace of your pipeline, and the example contains the inputs and outputs for this data point. If your dataset contains labels, they are found in the `example.outputs` dictionary, which is kept separate to keep your model from cheating. -- In our dataset, the outputs have an "answer" key that contains the reference answer. Your pipeline generates predictions as a dictionary with an "output" key. -- It compares the prediction and reference (case-insensitive) and returns a dictionary with the evaluation key and score. - -You can use this evaluator directly in the `evaluate` function: - -```python -from langsmith.evaluation import evaluate - -evaluate( - , - data="", - evaluators=[exact_match], -) -``` - -#### Example 2: Parametrizing your evaluator - -You may want to parametrize your evaluator as a class. This is useful when you need to pass additional parameters to the evaluator. 
- -```python -from langsmith.evaluation import evaluate -from langsmith.schemas import Example, Run - -class BlocklistEvaluator: - def __init__(self, blocklist: list[str]): - self.blocklist = blocklist - def __call__( - self, run: Run, example: Example | None = None - ) -> dict: - model_outputs = run.outputs["output"] - score = not any([word in model_outputs for word in self.blocklist]) - return {"key": "blocklist", "score": score} - - -evaluate( - , - data="", - evaluators=[BlocklistEvaluator(blocklist=["bad", "words"])], -) -``` - -#### Example 3: Evaluating nested traces - -While most evaluations are applied to the inputs and outputs of your system, you can also evaluate all of the subcomponents that are traced within your pipeline. - -This is possible by stepping through the `run` object and collecting the outputs of each component. - -As a simple example, let's assume you want to evaluate the expected tools that are invoked in a pipeline. - -```python -from langsmith.evaluation import evaluate -from langsmith.schemas import Example, Run - -def evaluate_trajectory(run: Run, example: Example) -> dict: - # collect the tools on level 1 of the trace tree - steps = [child.name for child in run.child_runs if child.run_type == "tool"] - expected_steps = example.outputs["expected_tools"] - score = len(set(steps) & set(expected_steps)) / len(set(steps) | set(expected_steps)) - return {"key": "tools", "score": score} -``` - -This lets you grade the performance of intermediate steps in your pipeline. - -Note: the example above assumes tools are properly typed in the trace tree. - -#### Example 3: Structured Output - -With function calling, it has become easier than ever to generate feedback metrics using LLMs as a judge simply by specifying a Pydantic schema for the output. - -Below is an example (in this case using OpenAI's tool calling functionality) to evaluate RAG app faithfulness. 
- -````python -import json -from typing import List - -import openai -from langsmith.schemas import Example, Run -from pydantic import BaseModel, Field - -openai_client = openai.Client() - - -class Propositions(BaseModel): - propositions: List[str] = Field( - description="The factual propositions generated by the model" - ) - - -class FaithfulnessScore(BaseModel): - reasoning: str = Field(description="The reasoning for the faithfulness score") - score: bool - - -def faithfulness(run: Run, example: Example) -> dict: - # Assumes your RAG app includes the prediction in the "output" key in its response - response: str = run.outputs["output"] - # Assumes your RAG app includes the retrieved docs as a "context" key in the outputs - # If not, you can fetch from the child_runs of the run object - retrieved_docs: list = run.outputs["context"] - formatted_docs = "\n".join([str(doc) for doc in retrieved_docs]) - extracted = openai_client.chat.completions.create( - model="gpt-4-turbo-preview", - messages=[ - { - "role": "user", - "content": "Extract all factual propositions from the following text:\n\n" - f"```\n{response}\n```", - }, - ], - tools=[ - { - "type": "function", - "function": { - "name": "Propositions", - "description": "Use to record each factual assertion.", - "parameters": Propositions.model_json_schema(), - }, - } - ], - tool_choice={"type": "function", "function": {"name": "Propositions"}}, - ) - propositions = [ - prop - for tc in extracted.choices[0].message.tool_calls - for prop in json.loads(tc.function.arguments)["propositions"] - ] - scores, reasoning = [], [] - tools = [ - { - "type": "function", - "function": { - "name": "FaithfulnessScore", - "description": "Use to score how faithful the propositions are to the docs.", - "parameters": FaithfulnessScore.model_json_schema(), - }, - } - ] - for proposition in propositions: - faithfulness_completion = openai_client.chat.completions.create( - model="gpt-4-turbo-preview", - messages=[ - { - "role": "user", - "content": "Grade whether the proposition can be logically concluded" - f" from the docs:\n\nProposition: {proposition}\nDocs:\n" - f"```\n{formatted_docs}\n```", - }, - ], - # highlight-next-line - tools=tools, - tool_choice={"type": "function", "function": {"name": "FaithfulnessScore"}}, - ) - faithfulness_args = json.loads( - faithfulness_completion.choices[0].message.tool_calls[0].function.arguments - ) - scores.append(faithfulness_args["score"]) - reasoning.append(faithfulness_args["reasoning"]) - average_score = sum(scores) / len(scores) if scores else None - comment = "\n".join(reasoning) - return {"key": "faithfulness", "score": average_score, "comment": comment} - -```` - -#### Example 4: Returning Multiple Scores - -A single evaluator can return multiple scores. An example of when this might be useful is if you are using tool calling for an LLM-as-judge to extract multiple metrics in a single API call. 
- -```python -import json - -import openai -from langsmith.schemas import Example, Run -from pydantic import BaseModel, Field - -# Initialize the OpenAI client -openai_client = openai.Client() - -class Scores(BaseModel): - correctness_reasoning: str = Field(description="The reasoning for the correctness score") - correctness: float = Field(description="The score for the correctness of the prediction") - conciseness_reasoning: str = Field(description="The reasoning for the conciseness score") - conciseness: float = Field(description="The score for the conciseness of the prediction") - -def multiple_scores(run: Run, example: Example) -> dict: - reference = example.outputs["answer"] - prediction = run.outputs["output"] - - messages = [ - { - "role": "user", - "content": f"Reference: {reference}\nPrediction: {prediction}" - }, - ] - - tools = [ - { - "type": "function", - "function": { - "name": "Scores", - "description": "Use to evaluate the correctness and conciseness of the prediction.", - "parameters": Scores.model_json_schema(), - }, - } - ] - - # Generating the chat completion with structured output - completion = openai_client.chat.completions.create( - model="gpt-4-turbo-preview", - messages=messages, - tools=tools, - tool_choice={"type": "function", "function": {"name": "Scores"}}, - ) - - # Extracting structured scores from the completion - scores_args = json.loads(completion.choices[0].message.tool_calls[0].function.arguments) - - return { - # highlight-next-line - "results": [ - # Provide the key, score and other relevant information for each metric - # highlight-next-line - {"key": "correctness", "score": scores_args["correctness"], "comment": scores_args["correctness_reasoning"]}, - {"key": "conciseness", "score": scores_args["conciseness"], "comment": scores_args["conciseness_reasoning"]} - ] - } -``` - -#### Example 5: Perplexity Evaluator - -The flexibility of the functional interface means you can easly apply evaluators from any other libraries. For instance, you may want to use statistical measures such as [`perplexity`](https://huggingface.co/spaces/evaluate-metric/perplexity) to grade your run output. Below is an example using the [evaluate](https://huggingface.co/docs/evaluate/index) package by HuggingFace, which contains numerous commonly used metrics. Start by installing the `evaluate` package by running `pip install evaluate`. - -```python -from evaluate import load -from langsmith.schemas import Example, Run -from langsmith.evaluation import RunEvaluator - -class PerplexityEvaluator(RunEvaluator): - def __init__(self, prediction_key: Optional[str] = None, model_id: str = "gpt-2"): - self.prediction_key = prediction_key - self.model_id = model_id - self.metric_fn = load("perplexity", module_type="metric") - def evaluate_run( - self, run: Run, example: Example - ) -> dict: - if run.outputs is None: - raise ValueError("Run outputs cannot be None") - prediction = run.outputs[self.prediction_key] - results = self.metric_fn.compute( - predictions=[prediction], model_id=self.model_id - ) - ppl = results["perplexities"][0] - return {"key": "Perplexity", "score": ppl} -``` - -Let's break down what the `PerplexityEvaluator` is doing: - -- **Initialize**: In the constructor, we're setting up a few properties that will be needed later on. - - `prediction_key`: The key to find the model's prediction in the outputs of a run. - - `model_id`: The ID of the language model you want to use to compute the metric. In our example, we are using 'gpt-2'. 
- - `metric_fn`: The evaluation metric function, loaded from the HuggingFace `evaluate` package. -- **Evaluate**: This method takes a run (and optionally an example) and returns an evaluation dictionary. - - If the run outputs are `None`, the evaluator raises an error. - - Otherwise, the outputs are passed to the `metric_fn` to compute the perplexity. The perplexity score is then returned as part of the evaluation dictionary. - Once you've defined your evaluators, you can use them to evaluate your model: - -```python -from langsmith.evaluation import evaluate -evaluate( - , - data="", - evaluators=[BlocklistEvaluator(blocklist=["bad", "words"]), PerplexityEvaluator(), is_empty], -) -``` - -## Summary Evaluators - -Some metrics can only be defined on the entire experiment level as opposed to the individual runs of the experiment. For example, you may want to compute the f1 score of a classifier across all runs in an experiment kicked off from a dataset. These are called `summary_evaluators`. Instead of taking in a single `Run` and `Example`, these evaluators take a list of each. - -```python -from typing import List -from langsmith.schemas import Example, Run -from langsmith.evaluation import evaluate - -def f1_score_summary_evaluator(runs: List[Run], examples: List[Example]) -> dict: - true_positives = 0 - false_positives = 0 - false_negatives = 0 - for run, example in zip(runs, examples): - # Matches the output format of your dataset - reference = example.outputs["answer"] - # Matches the output dict in `predict` function below - prediction = run.outputs["prediction"] - if reference and prediction == reference: - true_positives += 1 - elif prediction and not reference: - false_positives += 1 - elif not prediction and reference: - false_negatives += 1 - if true_positives == 0: - return {"key": "f1_score", "score": 0.0} - - precision = true_positives / (true_positives + false_positives) - recall = true_positives / (true_positives + false_negatives) - f1_score = 2 * (precision * recall) / (precision + recall) - return {"key": "f1_score", "score": f1_score} - -def predict(inputs: dict): - return {"prediction": True} - -evaluate( - predict, # Your classifier - data="", - summary_evaluators=[f1_score_summary_evaluator], -) -``` - -### Recap - -Congratulations! You created a custom evaluation chain you can apply to _any_ traced run so you can surface more relevant information in your application. -LangChain's evaluation chains speed up the development process for application-specific, semantically robust evaluations. -You can also extend existing components from the library so you can focus on building your product. All your evals come with: - -- Automatic tracing integrations to help you debug, compare, and improve your code -- Easy sharing and mixing of components and results -- Out-of-the-box support for sync and async evaluations for faster runs diff --git a/versioned_docs/version-old/evaluation/faq/evaluator-implementations.mdx b/versioned_docs/version-old/evaluation/faq/evaluator-implementations.mdx deleted file mode 100644 index 80d3476d9..000000000 --- a/versioned_docs/version-old/evaluation/faq/evaluator-implementations.mdx +++ /dev/null @@ -1,338 +0,0 @@ ---- -sidebar_label: Use Off-the-Shelf Evaluators -sidebar_position: 2 ---- - -import { - CodeTabs, - PythonBlock, - TypeScriptBlock, -} from "@site/src/components/InstructionsWithCode"; - -# How to Use Off-the-Shelf Evaluators - -LangChain's evaluation module provides evaluators you can use as-is for common evaluation scenarios. 
- -It's easy to use these by passing them to the `evaluators` argument of the `evaluate()` function. - -Copy the code snippets below to get started. You can also configure them for your applications using the arguments mentioned in the "Parameters" sections. -If you don't see an implementation that suits your needs, you can learn how to create your own [Custom Run Evaluators](custom-evaluators) in the linked guide, or contribute an string evaluator to the [LangChain repository](https://github.com/langchain-ai/langchain/blob/master/libs/langchain/langchain/evaluation/). - -:::note -Most of these evaluators are useful but imperfect! We recommend against blind trust of any single automated metric and to always incorporate them as a part of a holistic testing and evaluation strategy. -Many of the LLM-based evaluators return a binary score for a given data point, so measuring differences in prompt or model performance are most reliable in aggregate over a larger dataset. -::: - -## Overview - -The following table enumerates the off-the-shelf evaluators available in LangSmith, along with their output keys and a simple code sample. - -| Evaluator name | Output Key | Simple Code Example | -| -------------------- | --------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | -| QA | `correctness` | `LangChainStringEvaluator("qa")` | -| Contextual Q&A | `contextual accuracy` | `LangChainStringEvaluator("context_qa")` | -| Chain of Thought Q&A | `cot contextual accuracy` | `LangChainStringEvaluator("cot_qa")` | -| Criteria | Depends on criteria key | `LangChainStringEvaluator("criteria", config={ "criteria": })`

`criterion` may be one of the default implemented criteria: `conciseness`, `relevance`, `correctness`, `coherence`, `harmfulness`, `maliciousness`, `helpfulness`, `controversiality`, `misogyny`, and `criminality`.

Or, you may define your own criteria in a custom dict as follows:
`{ "criterion_key": "criterion description" }` | -| Labeled Criteria | Depends on criteria key | `LangChainStringEvaluator("labeled_criteria", config={ "criteria": })`

`criterion` may be one of the default implemented criteria: `conciseness`, `relevance`, `correctness`, `coherence`, `harmfulness`, `maliciousness`, `helpfulness`, `controversiality`, `misogyny`, and `criminality`.

Or, you may define your own criteria in a custom dict as follows:
`{ "criterion_key": "criterion description" }` | -| Score | Depends on criteria key | `LangChainStringEvaluator("score_string", config={ "criteria": , "normalize_by": 10 })`

`criterion` may be one of the default implemented criteria: `conciseness`, `relevance`, `correctness`, `coherence`, `harmfulness`, `maliciousness`, `helpfulness`, `controversiality`, `misogyny`, and `criminality`.

Or, you may define your own criteria in a custom dict as follows:
`{ "criterion_key": "criterion description" }`. Scores are out of 10, so normalize_by will cast this to a score from 0 to 1. | -| Labeled Score | Depends on criteria key | `LangChainStringEvaluator("labeled_score_string", config={ "criteria": , "normalize_by": 10 })`

`criterion` may be one of the default implemented criteria: `conciseness`, `relevance`, `correctness`, `coherence`, `harmfulness`, `maliciousness`, `helpfulness`, `controversiality`, `misogyny`, and `criminality`.

Or, you may define your own criteria in a custom dict as follows:
`{ "criterion_key": "criterion description" }`. Scores are out of 10, so normalize_by will cast this to a score from 0 to 1. | -| Embedding distance | `embedding_cosine_distance` | `LangChainStringEvaluator("embedding_distance")` | -| String Distance | `string_distance` | `LangChainStringEvaluator("string_distance", config={"distance": "damerau_levenshtein" })`

`distance` defines the string difference metric to be applied, such as `levenshtein` or `jaro_winkler`. | -| Exact Match | `exact_match` | `LangChainStringEvaluator("exact_match")` | -| Regex Match | `regex_match` | `LangChainStringEvaluator("regex_match")` | -| Json Validity | `json_validity` | `LangChainStringEvaluator("json_validity")` | -| Json Equality | `json_equality` | `LangChainStringEvaluator("json_equality")` | -| Json Edit Distance | `json_edit_distance` | `LangChainStringEvaluator("json_edit_distance")` | -| Json Schema | `json_schema` | `LangChainStringEvaluator("json_schema")` | - -## Correctness: QA evaluation - -QA evalutors help to measure the correctness of a response to a user query or question. If you have a dataset with reference labels or reference context docs, these are the evaluators for you! -Three QA evaluators you can load are: `"qa"`, `"context_qa"`, `"cot_qa"`. Based on our meta-evals, we recommend using `"cot_qa"` or a similar prompt for best results. - -- The `"qa"` evaluator ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.qa.eval_chain.QAEvalChain.html#langchain-evaluation-qa-eval-chain-qaevalchain)) instructs an llm to directly grade a response as "correct" or "incorrect" based on the reference answer. -- The `"context_qa"` evaluator ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.qa.eval_chain.ContextQAEvalChain.html#langchain.evaluation.qa.eval_chain.ContextQAEvalChain)) instructs the LLM chain to use reference "context" (provided throught the example outputs) in determining correctness. This is useful if you have a larger corpus of grounding docs but don't have ground truth answers to a query. -- The `"cot_qa"` evaluator ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.qa.eval_chain.CotQAEvalChain.html#langchain.evaluation.qa.eval_chain.CotQAEvalChain)) is similar to the "context_qa" evaluator, except it instructs the LLMChain to use chain of thought "reasoning" before determining a final verdict. This tends to lead to responses that better correlate with human labels, for a slightly higher token and runtime cost. - -, - data="", - evaluators=[qa_evaluator, context_qa_evaluator, cot_qa_evaluator], - metadata={"revision_id": "the version of your pipeline you are testing"}, -)`), - ]} - groupId="client-language" -/> -You can customize the evaluator by specifying the LLM used to power its LLM chain -or even by customizing the prompt itself. Below is an example using an Anthropic -model to run the evaluator, and a custom prompt for the base QA evaluator. Check -out the reference docs for more information on the expected prompt format. -, - data="", - evaluators=[qa_evaluator, context_qa_evaluator, cot_qa_evaluator], -) -`), - ]} - groupId="client-language" -/> - -## Criteria Evaluators (No Labels) - -If you don't have ground truth reference labels, you can evaluate your run against a custom set of criteria using the `"criteria"` or `"score"` evaluators. These are helpful when there are high level semantic aspects of your model's output you'd like to monitor that aren't captured by other explicit checks or rules. 
- -- The `"criteria"` evaluator ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.criteria.eval_chain.CriteriaEvalChain.html#langchain.evaluation.criteria.eval_chain.CriteriaEvalChain)) instructs an LLM to assess if a prediction satisfies the given criteria, outputting a binary score -- The `"score_string"` evaluator ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.scoring.eval_chain.ScoreStringEvalChain.html#langchain.evaluation.scoring.eval_chain.ScoreStringEvalChain)) has the LLM score the prediction on a numeric scale (default 1-10) based on how well it satisfies the criteria - -, - data="", - evaluators=[ - criteria_evaluator, - score_evaluator - ], - metadata={"revision_id": "the version of your pipeline you are testing"}, -)`), - ]} - groupId="client-language" -/> - -::::tip Supported Criteria -Default criteria are implemented for the following aspects: conciseness, relevance, correctness, coherence, harmfulness, maliciousness, helpfulness, controversiality, misogyny, and criminality. -To specify custom criteria, write a mapping of a criterion name to its description, such as: - -``` - criterion = {"creativity": "Is this submission creative, imaginative, or novel?"} - criteria_evaluator = LangChainStringEvaluator( - "labeled_criteria", - config={"criteria": criterion} - ) -``` - -:::: -::::tip Interpreting the Score -Evaluation scores don't have an inherent "direction" (i.e., higher is not necessarily better). -The direction of the score depends on the criteria being evaluated. For example, a score of 1 for "helpfulness" means that the prediction was deemed to be helpful by the model. -However, a score of 1 for "maliciousness" means that the prediction contains malicious content, which, of course, is "bad". -:::: - -## Criteria Evaluators (With Labels) - -If you have ground truth reference labels, you can evaluate your run against custom criteria while also providing that reference information to the LLM using the `"labeled_criteria"` or `"labeled_score_string"` evaluators. - -- The `"labeled_criteria"` evaluator ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.criteria.eval_chain.LabeledCriteriaEvalChain.html#langchain.evaluation.criteria.eval_chain.LabeledCriteriaEvalChain)) instructs an LLM to assess if a prediction satisfies the criteria, taking into account the reference label -- The `"labeled_score_string"` evaluator ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.scoring.eval_chain.LabeledScoreStringEvalChain.html#langchain.evaluation.scoring.eval_chain.LabeledScoreStringEvalChain)) has the LLM score the prediction on a numeric scale based on how well it satisfies the criteria compared to the reference - -, - data="", - evaluators=[ - labeled_criteria_evaluator, - labeled_score_evaluator - ], - metadata={"revision_id": "the version of your pipeline you are testing"}, -)`), - ]} - groupId="client-language" -/> - -## JSON Evaluators - -Evaluating extraction and function calling applications often comes down to validating that the LLM's string output can be parsed correctly and comparing it to a reference object. 
The JSON evaluators provide functionality to check your model's output consistency: - -- The `"json_validity"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.parsing.base.JsonValidityEvaluator.html#langchain.evaluation.parsing.base.JsonValidityEvaluator)) evaluator checks if a prediction is valid JSON -- The `"json_equality"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.parsing.base.JsonEqualityEvaluator.html#langchain.evaluation.parsing.base.JsonEqualityEvaluator)) evaluator checks if a JSON prediction exactly matches a JSON reference, after normalization -- The `"json_edit_distance"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.parsing.json_distance.JsonEditDistanceEvaluator.html#langchain.evaluation.parsing.json_distance.JsonEditDistanceEvaluator)) evaluator computes the normalized edit distance between a JSON prediction and reference -- The `"json_schema"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.parsing.json_schema.JsonSchemaEvaluator.html#langchain.evaluation.parsing.json_schema.JsonSchemaEvaluator)) evaluator checks if a JSON prediction satisfies a provided JSON schema - -, - data="", - evaluators=[ - json_validity_evaluator, - json_equality_evaluator, - json_edit_distance_evaluator, - json_schema_evaluator - ], -)`), - ]} - groupId="client-language" -/> - -## String or Embedding Distance - -To measure the similarity between a predicted string and a reference, you can use string distance metrics: - -- The `"string_distance"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.string_distance.base.StringDistanceEvalChain.html#langchain.evaluation.string_distance.base.StringDistanceEvalChain)) evaluator computes a normalized string edit distance between the prediction and reference -- The `"embedding_distance"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.embedding_distance.base.EmbeddingDistance.html#langchain.evaluation.embedding_distance.base.EmbeddingDistance)) evaluator computes the distance between the text embeddings of the prediction and reference -- The `"exact_match"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.exact_match.base.ExactMatchStringEvaluator.html#langchain.evaluation.exact_match.base.ExactMatchStringEvaluator)) evaluator checks for an exact string match between prediction and reference - -, - data="", - evaluators=[ - string_distance_evaluator, - embedding_distance_evaluator, - exact_match_evaluator - ], -)`), - ]} - groupId="client-language" -/> - -## Regex Match - -To evaluate predictions against a reference regular expression pattern, you can use the `"regex_match"` ([reference](https://api.python.langchain.com/en/latest/evaluation/langchain.evaluation.regex_match.base.RegexMatchStringEvaluator.html#langchain.evaluation.regex_match.base.RegexMatchStringEvaluator)) evaluator. -The pattern is provided as a string in the example outputs of the dataset. The evaluator checks if the prediction matches the pattern. - -, - data="", - evaluators=[regex_evaluator], -)`), - ]} - groupId="client-language" -/> - -## Don't see what you're looking for? - -These implementations are just a starting point. We want to work with you to build better off-the-shelf evaluation tools for everyone. -We'd love feedback and contributions! 
Send us feedback at support@langchain.dev, check out the [Evaluators](https://python.langchain.com/docs/guides/evaluation/) in LangChain or submit PRs or issues directly to better address your needs. diff --git a/versioned_docs/version-old/evaluation/faq/experiments-app.mdx b/versioned_docs/version-old/evaluation/faq/experiments-app.mdx deleted file mode 100644 index a74b3ac39..000000000 --- a/versioned_docs/version-old/evaluation/faq/experiments-app.mdx +++ /dev/null @@ -1,54 +0,0 @@ ---- -sidebar_label: Run Experiments in Browser (no code) -sidebar_position: 8 ---- - -# How to run experiments in the prompt playground (no code) - -While you can kick off experiments easily using the sdk, as outlined [here](../quickstart), it's often useful to run experiments directly in the [prompt playground](../../hub/quickstart#2-try-out-a-prompt-in-the-playground). - -This allows you to test your prompt / model configuration over a series of inputs to see how well it generalizes across different contexts or scenarios, without having to write any code. - -## Kicking off an experiment in the prompt playground - -1. **Navigate to the prompt playground** by clicking on "Hub" in the sidebar, then selecting a prompt from the list of available prompts or creating a new one. -2. **Select the "Switch to dataset" button** to switch to the dataset you want to use for the experiment. Please note that the dataset keys of the dataset inputs must match the input variables of the prompt. In the below sections, note that the selected dataset has inputs with keys "text", which correctly match the input variable of the prompt. Also note that there is a max capacity of 15 inputs for the prompt playground. - ![Switch to dataset](../static/switch_to_dataset.png) -3. **Click on the "Start" button** or CMD+Enter to start the experiment. This will run the prompt over all the examples in the dataset and create an entry for the experiment in the dataset details page. Note that you need to commit the prompt to the prompt hub before you can start the experiment to ensure it can be referenced in the experiment. The result for each input will be streamed and displayed inline for each input in the dataset. - ![Input variables](../static/input_variables_playground.png) -4. **View the results** by clicking on the "View Dataset Run Table" button. This will take you to the experiment details page where you can see the results of the experiment. - ![View results](../static/view_results.png) -5. **Navigate back to the commit page** by clicking on the "View Commit" button. This will take you back to the prompt page where you can make changes to the prompt and run more experiments. The "View Commit" button is available to all experiments that were run from the prompt playground. The experiment is prefixed with the prompt repository name, a unique identifier, and the date and time the experiment was run. - ![Playground experiment results](../static/playground_experiment_results.png) - -## Adding evaluation scores to the experiment - -Kicking off an experiment is no fun without actually running evaluations on the results. You can add evaluation scores to the experiment by configuring an automation rule for the dataset, again without writing any code. This will allow you to add evaluation scores to the experiment and compare the results across different experiments. -It's also possible to add human annotations to the runs of any experiment. 
- -We currently support configuring LLM-as-a-judge evaluators on datasets that will evaluate the results of each run in each experiment kicked off from that dataset. - -The process for configuring this is very similar to the process for configuring an [online evaluator](../../monitoring/faq/online_evaluation) for your tracing projects. - -1. **Navigate to the dataset details page** by clicking "Datasets and Testing" in the sidebar and selecting the dataset you want to configure the evaluator for. -2. **Click on the "Add Evaluator" button** to add an evaluator to the dataset. This will open a modal you can use to configure the evaluator. - - ![Add Evaluator](../static/add_evaluator.png) - -3. **Give your evaluator a name** and **set an inline prompt or load a prompt from the prompt hub** that will be used to evaluate the results of the runs in the experiment. - - ![Add evaluator name and prompt](../static/create_evaluator.png) - - Importantly, evaluator prompts can only contain the following input variables: - - - `input` (required): the input to the target you are evaluating - - `output` (required): the output of the target you are evaluating - - `reference`: the reference output, taken from the dataset - - You can specify the scoring criteria in the "schema" field. In this example, we are asking the LLM to grade on "correctness" of the output with respect to the reference, with a boolean output of 0 or 1. The name of the field in the schema will be interpreted as the feedback key and the type will be the type of the score. - - ![Evaluator prompt](../static/evaluator_prompt.png) - -4. **Save the evaluator** and navigate back to the dataset details page. Each subsequent experiment run from the dataset will now be evaluated by the evaluator you configured. Note that in the below image, each run in the experiment has a "correctness" score. - - ![Playground evaluator results](../static/playground_evaluator_results.png) diff --git a/versioned_docs/version-old/evaluation/faq/index.mdx b/versioned_docs/version-old/evaluation/faq/index.mdx deleted file mode 100644 index c12707503..000000000 --- a/versioned_docs/version-old/evaluation/faq/index.mdx +++ /dev/null @@ -1,26 +0,0 @@ ---- -sidebar_label: How-To Guides -sidebar_position: 0 ---- - -# How-To Guides - -In this section you will find guides for how to do specific evaluation related things. 
- -**Datasets** - -- [How to manage datasets in the app](faq/manage-datasets) -- [How to manage datasets programmatically](faq/manage-datasets#manage-datasets-programmatically) -- [How to list datasets from the client](faq/manage-datasets#list-datasets-from-the-client) -- [How to version datasets](faq/version-datasets) -- [How to list datapoints from the client](faq/manage-datasets#list-examples-from-the-client) -- [How to use synthetic data](faq/synthetic-data) - -**Evaluators** - -- [How to create custom evaluators](faq/custom-evaluators) -- [How to use off-the-shelf LangChain evaluators](faq/evaluator-implementations) - -**Experiments** - -- [How to run experiments in the prompt playground](faq/experiments-app) diff --git a/versioned_docs/version-old/evaluation/faq/manage-datasets.mdx b/versioned_docs/version-old/evaluation/faq/manage-datasets.mdx deleted file mode 100644 index 7f02ea2d5..000000000 --- a/versioned_docs/version-old/evaluation/faq/manage-datasets.mdx +++ /dev/null @@ -1,362 +0,0 @@ ---- -sidebar_label: Manage Datasets -sidebar_position: 5 ---- - -import { - CodeTabs, - ShellBlock, - PythonBlock, - TypeScriptBlock, -} from "@site/src/components/InstructionsWithCode"; - -# Managing Datasets - -## In LangSmith - -The easiest way to interact with datasets is directly in the LangSmith app. Here, you can create and edit datasets and example rows. Below are a few ways to interact with them. - -### From Existing Runs - -We typically construct datasets over time by collecting representative examples from debugging or other runs. To do this, we first filter the runs to find the ones we want to add to the dataset. Then, we create a dataset and add the runs as examples. - -You can do this from any 'run' details page by clicking the 'Add to Dataset' button in the top right-hand corner. - -![Add to Dataset](../static/add_to_dataset.png) - -From there, we select the dataset to organize it in and update the ground truth output values if necessary. - -![Modify example](../static/modify_example.png) - -### Upload a CSV - -The easiest way to create a dataset from your own data is by clicking the 'upload a CSV dataset' button on the home page or in the top right-hand corner of the 'Datasets & Testing' page. - -![Upload CSV](../static/create_dataset_csv.png) - -Select a name and description for the dataset, and then confirm that the inferred input and output columns are correct. - -![Confirm Columns](../static/select_columns.png) - -### Exporting datasets to other formats - -You can export your LangSmith dataset to CSV or OpenAI evals format directly from the web application. - -To do so, click "Export Dataset" from the homepage. -To do so, select a dataset, click on "Examples", and then click the "Export Dataset" button at the top of the examples table. - -![Export Dataset Button](../static/export-dataset-button.png) - -This will open a modal where you can select the format you want to export to. - -![Export Dataset Modal](../static/export-dataset-modal.png) - -## How to manage datasets programmatically - -You can create a dataset from existing runs or upload a CSV file (or pandas dataframe in python). - -Once you have a dataset created, you can continue to add new runs to it as examples. We recommend that you organize datasets to target a single "task", usually served by a single chain or LLM. For more discussions on datasets and evaluations, check out the [recommendations](../recommendations). 
- -### Create from list of values - -The most flexible way to make a dataset using the client is by creating examples from a list of inputs and optional outputs. Below is an example. - -Note that you can add arbitrary metadata to each example, such as a note or a source. The metadata is stored as a dictionary. - - - -### Create from existing runs - -To create datasets from existing runs, you can use the same approach. Below is an example: - - - -### Create dataset from CSV - -In this section, we will demonstrate how you can create a dataset by uploading a CSV file. - -First, ensure your CSV file is properly formatted with columns that represent your input and output keys. These keys will be utilized to map your data properly during the upload. You can specify an optional name and description for your dataset. Otherwise, the file name will be used as the dataset name and no description will be provided. - - - -### Create dataset from pandas dataframe - -The python client offers an additional convenience method to upload a dataset from a pandas dataframe. - -```python -from langsmith import Client -import os -import pandas as pd - -os.environ["LANGCHAIN_ENDPOINT"] = "https://api.smith.langchain.com" -os.environ["LANGCHAIN_API_KEY"] = "" -client = Client() - -df = pd.read_parquet('path/to/your/myfile.parquet') -input_keys = ['column1', 'column2'] # replace with your input column names -output_keys = ['output1', 'output2'] # replace with your output column names - -dataset = client.upload_dataframe( - df=df, - input_keys=input_keys, - output_keys=output_keys, - name="My Parquet Dataset", - description="Dataset created from a parquet file", - data_type="kv" # The default -) -``` - -## List datasets from the client - -You can programmatically fetch the datasets from LangSmith using the `list_datasets` method in the client. Below are some common examples: - -### Query all datasets - - - -### List datasets by name - -If you want to search by the exact name, you can do the following: - - - -If you want to do a case-invariant substring search, try the following: - - - -### List datasets by type - -You can filter datasets by type. Below is an example querying for chat datasets. - - - -## List Examples from the client - -Once you have a dataset created, you may want to download the examples. You can fetch dataset examples using the `list_examples` method on the LangSmith client. Below are some common calls: - -### List all examples for a dataset - -You can filter by dataset ID: - - - -Or you can filter by dataset name (this must exactly match the dataset name you want to query) - - - -### List examples by id - -You can also list multiple examples all by ID. - - diff --git a/versioned_docs/version-old/evaluation/faq/regression-testing.mdx b/versioned_docs/version-old/evaluation/faq/regression-testing.mdx deleted file mode 100644 index 6b0c750c2..000000000 --- a/versioned_docs/version-old/evaluation/faq/regression-testing.mdx +++ /dev/null @@ -1,40 +0,0 @@ ---- -sidebar_label: Regression Testing -sidebar_position: 3 ---- - -# Regression Testing - -When evaluating LLM applications, it is important to be able to track how your system performs over time. In this guide, we will show you how to use LangSmith's comparison view in -order to track regressions in your application, and drill down to inspect the specific runs that improved/regressed over time. 
- -## Overview - -In the LangSmith comparison view, runs that _regressed_ on your specified feedback key against your baseline experiment will be highlighted in red, while runs that _improved_ -will be highlighted in green. At the top of each column, you can see how many runs in that experiment did better and and how many did worse than your baseline experiment. - -![Regressions](../static/regression_view.png) - -## Baseline Experiment - -In order to track regressions, you need a baseline experiment against which to compare. This will be automatically assigned as the first experiment in your comparison, but you can -change it from the dropdown at the top of the page. - -![Baseline](../static/select_baseline.png) - -## Select Feedback Key - -You will also want to select the feedback key on which you would like focus. This can be selected via another dropdown at the top. Again, one will be assigned by -default, but you can adjust as needed. - -![Feedback](../static/select_feedback.png) - -## Filter to Regressions or Improvements - -Click on the regressions or improvements buttons on the top of each column to filter to the runs that regressed or improved in that specific experiment. - -![Regressions Filter](../static/filter_to_regressions.png) - -## Try it out - -To get started with regression testing, try [running a no-code experiment in our prompt playground](experiments-app) or check out the [Evaluation Quick Start Guide](../quickstart) to get started with the SDK. diff --git a/versioned_docs/version-old/evaluation/faq/synthetic-data.mdx b/versioned_docs/version-old/evaluation/faq/synthetic-data.mdx deleted file mode 100644 index a994d1c62..000000000 --- a/versioned_docs/version-old/evaluation/faq/synthetic-data.mdx +++ /dev/null @@ -1,155 +0,0 @@ ---- -sidebar_label: Synthetic Data for Evaluation -sidebar_position: 9 ---- - -# Synthetic Data for Evaluation - -When prototyping a system, you may not have enough real data to thoroughly evaluate how the component will behave. This guide will walk you through two techniques for generating synthetic data to augment your dataset: - -1. **Paraphrasing Existing Inputs**: Generate semantically similar variations of your existing examples to test your system's consistency. - -2. **Generating New Inputs**: Create entirely new, plausible inputs to test the how your system generalizes to other scenarios. - -:::note Reliability -Synthetic data is not a full substitute for real data. The quality of the data generated by these methods depends on factors like the model, prompt, and existing data. Always inspect synthetic datasets to ensure they capture the information you want to model and align with your use case. -::: - -### Prerequisites - -This guide assumes you've already connected to LangSmith and have a starter dataset. Though we will use LangChain core below, the technique is simple enough to apply using whatever tools you're comfortable with. - -```python -pip install langsmith langchain_openai -``` - -## Paraphrasing - -Paraphrasing existing inputs helps check if your chain's behavior is consistent across similar inputs. Since paraphrasing is a semantically invariant transformation, the outputs should remain the same as the original. Here's how to set it up: - -#### Step 1: Define the Paraphrase Generator - -Create a chain for generating paraphrases using the `ChatOpenAI` model with custom system prompts. 
- -```python -import re -from typing import List - -from langchain_openai import ChatOpenAI -from langchain_core.prompts import ( - ChatPromptTemplate, -) - -paraphrase_llm = ChatOpenAI(temperature=0.5) -prompt_template = ChatPromptTemplate.from_messages( - [ - ("system", - "You are a helpful paraphrasing assistant tasked with rephrasing text." - ), - ("system", "Input: {query}"), - ("user", - "What are {n_paraphrases} different ways you could paraphrase the INPUT text?" - " Do not significantly change the meaning." - " Respond using numbered bullets. If you cannot think of any," - " just say 'I don't know.'" - ), - ] -) - -def parse(output: str) -> List[str]: - return re.findall(r"\d+\.\s+(.*?)\n", output) - -paraphrase_chain = prompt | llm | parse -``` - -#### Step 2: Paraphrase the Dataset - -Use the `Client` from LangSmith to access your dataset and generate paraphrases for it. - -```python -from langsmith import Client - -client = Client() -n_paraphrases = 3 -dataset_name = "Your Dataset Name" - -examples = client.list_examples(dataset_name=dataset_name) -results = paraphrase_chain.batch( - [{"query": next(iter(example.inputs.values())), "n_paraphrases": n_paraphrases} - for example in examples] -) -inputs, outputs = [], [] -for example, batch_r in zip(examples, results): - input_key = next(iter(example.inputs)) - for r in result: - inputs.append({input_key: r}) - outputs.append(example.outputs) -client.create_examples( - inputs=inputs, - outputs=outputs, - dataset_name=dataset_name, -) -``` - -After running, your dataset should be roughly 3x the original size, with paraphrased variations of your original inputs. - -## Generating New Inputs - -To expand your dataset's semantic range and test your system's robustness, you can generate entirely new, plausible inputs. This method examines a random set of 5 existing examples and creates 6 novel ones that align with the inferred system but are distinct enough to have likely originated from different individuals. - -#### Step 1: Define the New Input Generator - -Create a chain for generating new inputs using the `ChatOpenAI` model with custom system prompts. - -```python -input_gen_llm = ChatOpenAI(temperature=0.5) -input_gen_prompt_template = ChatPromptTemplate.from_messages( - [ - ("system", - # Update this prompt to more closely match your use case - "You are a creative assistant tasked with coming up with new inputs for an application." - "\nThe following are some examples you can use to understand the domain:\n\n{examples}" - ), - ("user", - "Can you generate {n_inputs} unique and plausible inputs that could be asked by different users?" - ), - ] -) - -input_gen_chain = prompt | llm | parse -``` - -#### Step 2: Generate New Inputs for the Dataset - -Use the Client from LangSmith to access your dataset, sample a set of existing inputs, and generate new inputs based on them. Note that new inputs don't come with corresponding outputs, so you may need to manually label them or use a separate model to generate the outputs. 
- -```python -import random - -client = Client() -n_inputs = 6 -dataset_name = "Your Dataset Name" -sample_size = 5 - -examples = list(client.list_examples(dataset_name=dataset_name)) -example_inputs = [next(iter(example.inputs.values())) for example in random.sample(examples, sample_size)] -example_inputs_str = '\n'.join(f"- {input}" for input in example_inputs) -results = input_gen_chain.batch( - [{"examples": example_inputs_str, "n_inputs": n_inputs}] -) -inputs = [{"input": r} for r in results[0]] -outputs = [{}] * len(inputs) -client.create_examples( - inputs=inputs, - outputs=outputs, - dataset_name=dataset_name, -) -``` - -After running, your dataset should contain new examples that differ more significantly from the original ones, helping you test your system's robustness to a wider range of inputs. - -### Considerations - -Remember that the quality of the paraphrases and generated inputs will depend on the model and prompt used, and these approaches may not be appropriate for all use cases. Always check your augmented data to ensure it maintains the original meaning, aligns with the system's context, and is suitable for your application. - -Synthetic data is most useful early in the development process, when you're trying to gauge how sensitive your chain or model is to input variations. By combining paraphrasing, new input generation, and other augmentation methods, you can expand and diversify your dataset to verify the feasibility and robustness of a feature before deploying it to production. diff --git a/versioned_docs/version-old/evaluation/faq/unit-testing.mdx b/versioned_docs/version-old/evaluation/faq/unit-testing.mdx deleted file mode 100644 index 3bec87a10..000000000 --- a/versioned_docs/version-old/evaluation/faq/unit-testing.mdx +++ /dev/null @@ -1,324 +0,0 @@ ---- -sidebar_label: Unit Test -sidebar_position: 4 ---- - -# Unit Tests - -LangSmith unit tests are assertions and expectations designed to **quickly** identify obvious bugs and regressions in your AI system. Relative to evaluations, tests are designed to be **fast** and **cheap** to run, focusing on **specific** functionality and edge cases. -We recommend using LangSmith to track any unit tests that touch an LLM or other non-deterministic part of your AI system. - -:::note -`@unit` currently requires `langsmith` python version `>=0.1.42`. If you are interested in unit testing functionality in TypeScript or other languages, please let us know at [support@langchain.dev](mailto:support@langchain.dev). -::: - -## Write @unit test - -To write a LangSmith unit test, decorate your test function with `@unit`. -If you want to track the full nested trace of the system or component being tested, you can mark those functions with `@traceable`. For example: - -```python -# my_app/main.py -from langsmith import traceable -@traceable # Optional -def generate_sql(user_query): - # Replace with your SQL generation logic - # e.g., my_llm(my_prompt.format(user_query)) - return "SELECT * FROM customers" -``` - -Then define your unit test: - -```python tests/test_my_app.py -# tests/test_my_app.py -from langsmith import unit -from my_app.main import generate_sql - -@unit -def test_sql_generation_select_all(): - user_query = "Get all users from the customers table" - sql = generate_sql(user_query) - # LangSmith logs any exception raised by `assert` / `pytest.fail` / `raise` / etc. 
- # as a test failure - # highlight-next-line - assert sql == "SELECT * FROM customers" -``` - -## Run tests - -You can use a standard unit testing framework such as `pytest` ([docs](https://docs.pytest.org/en/7.1.x/contents.html)) to run. For example: - -```bash -pytest tests/ -``` - -Each time you run this test suite, LangSmith collects the pass/fail rate and other traces as a new `TestSuiteResult`, logging the `pass` rate (1 for pass, 0 for fail) over all the applicable tests. - -The test suite syncs to a corresponding dataset named after your package or github repository. - -![Unit Test Example](../static/unit-test-suite.png) - -## Going Further - -`@unit` is designed to stay out of your way and works well with familiar `pytest` features. For example: - -#### Defining inputs as fixtures - -Pytest fixtures let you define functions that serve as reusable inputs for your tests. LangSmith automatically syncs any test case inputs defined as fixtures. For example: - -```python -import pytest - -@pytest.fixture -def user_query(): - return "Get all users from the customers table" - -@pytest.fixture -def expected_sql(): - return "SELECT * FROM customers" - -# output_keys indicate which test arguments to save as 'outputs' in the dataset (Optional) -# Otherwise, all arguments are saved as 'inputs' -@unit(output_keys=["expected_sql"]) -def test_sql_generation_with_fixture(user_query, expected_sql): - sql = generate_sql(user_query) - assert sql == expected_sql -``` - -#### Parametrizing tests - -Parametrizing tests lets you run the same assertions across multiple sets of inputs. Use `pytest`'s `parametrize` decorator to achieve this. For example: - -```python -@unit -@pytest.mark.parametrize( - "user_query, expected_sql", - [ - ("Get all users from the customers table", "SELECT * FROM customers"), - ("Get all users from the orders table", "SELECT * FROM orders"), - ], -) -def test_sql_generation_parametrized(user_query, expected_sql): - sql = generate_sql(user_query) - assert sql == expected_sql -``` - -**Note:** as the parametrized list grows, you may consider using `evaluate()` instead. This parallelizes the evaluation and makes it easier to control individual experiments and the corresponding dataset. - -#### Expectations - -LangSmith provides an `expect` utility to help define expectations about your LLM output. For example: - -```python -from langsmith import expect - -@unit -def test_sql_generation_select_all(): - user_query = "Get all users from the customers table" - sql = generate_sql(user_query) - expect(sql).to_contain("customers") -``` - -This will log the binary "expectation" score to the experiment results, additionally `assert`ing that the expectation is met possibly triggering a test failure. - -`expect` also provides "fuzzy match" methods. 
For example: - -```python -@unit -@pytest.mark.parametrize( - "query, expectation", - [ - ("what's the capital of France?", "Paris"), - ], -) -def test_embedding_similarity(query, expectation): - prediction = my_chatbot(query) - expect.embedding_distance( - # This step logs the distance as feedback for this run - prediction=prediction, reference=expectation - # Adding a matcher (in this case, 'to_be_*"), logs 'expectation' feedback - ).to_be_less_than(0.5) # Optional predicate to assert against - expect.edit_distance( - # This computes the normalized Damerau-Levenshtein distance between the two strings - prediction=prediction, reference=expectation - # If no predicate is provided below, 'assert' isn't called, but the score is still logged - ) -``` - -This test case will be assigned 4 scores: - -1. The `embedding_distance` between the prediction and the expectation -2. The binary `expectation` score (1 if cosine distance is less than 0.5, 0 if not) -3. The `edit_distance` between the prediction and the expectation -4. The overall test pass/fail score (binary) - -The `expect` utility is modeled off of [Jest](https://jestjs.io/docs/expect)'s expect API, with some off-the-shelf functionality to make it easier to grade your LLMs. - -#### Dry-run mode - -If you want to run the tests without syncing the results to LangSmith, you can set `LANGCHAIN_TEST_TRACKING=false` in your environment. - -```bash -LANGCHAIN_TEST_TRACKING=false pytest tests/ -``` - -The tests will run as normal, but the experiment logs will not be sent to LangSmith. - -#### Caching - -LLMs on every commit in CI can get expensive. To save time and resources, LangSmith lets you cache results to disk. Any identical inputs will be loaded from the cache so you don't have to call out to your LLM provider unless there are changes to the model, prompt, or retrieved data. - -To enable caching, run with `LANGCHAIN_TEST_CACHE=/my/cache/path`. For example: - -```bash -LANGCHAIN_TEST_CACHE=tests/cassettes pytest tests/my_llm_tests -``` - -All requests will be cached to `tests/cassettes` and loaded from there on subsequent runs. If you check this in to your repository, your CI will be able to use the cache as well. - -#### Using `watch` mode - -With caching enabled, you can iterate quickly on your tests using `watch` mode without worrying about unnecessarily hitting your LLM provider. For example, using [`pytest-watch`](https://pypi.org/project/pytest-watch/): - -```bash -pip install pytest-watch -LANGCHAIN_TEST_CACHE=tests/cassettes ptw tests/my_llm_tests -``` - -## Explanations - -The `@unit` test decorator converts any unit test into a parametrized LangSmith example. By default, all unit tests within a given file will be grouped as a single "test suite" with a corresponding dataset. 
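If you want tests from several files to roll up into one suite, or simply want a more descriptive suite name, you can pass `test_suite_name` to the decorator (see the `unit` API reference below). A minimal sketch, reusing the `generate_sql` function from earlier with an illustrative suite name:

```python
from langsmith import unit

from my_app.main import generate_sql

# "SQL generation suite" is an assumed name chosen for illustration; use any name you like.
@unit(test_suite_name="SQL generation suite")
def test_sql_generation_names_table():
    sql = generate_sql("Get all users from the customers table")
    # The suite name only changes where results are grouped; assertions work as usual.
    assert "customers" in sql
```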
- -The following metrics are available off-the-shelf: - -| Feedback | Description | Example | -| -------------------- | ----------------------------------------------------------- | --------------------------------------------------------------------------------------------------------------------- | -| `pass` | Binary pass/fail score, 1 for pass, 0 for fail | `assert False` # Fails | -| `expectation` | Binary expectation score, 1 if expectation is met, 0 if not | `expect(prediction).against(lambda x: re.search(r"\b[a-f\d]{8}-[a-f\d]{4}-[a-f\d]{4}-[a-f\d]{4}-[a-f\d]{12}\b", x)` ) | -| `embedding_distance` | Cosine distance between two embeddings | expect.embedding_distance(prediction=prediction, reference=expectation) | -| `edit_distance` | Edit distance between two strings | expect.edit_distance(prediction=prediction, reference=expectation) | - -You can also log any arbitrary feeback within a unit test manually using the `client`. - -```python -from langsmith import unit, Client -from langsmith.run_helpers import get_current_run_tree - -client = Client() - -@unit -def test_foo(): - run_tree = get_current_run_tree() - client.create_feedback(run_id=run_tree.id, key="my_custom_feedback", score=1) -``` - -## Reference - -### `expect` - -`expect` makes it easy to make approximate assertions on test results and log scores to LangSmith. -Off-the-shelf, it allows you to compute and compare embedding distances, edit distances, and make custom assertions on values. - -#### `expect.embedding_distance(prediction, reference, *, config=None)` - -Compute the embedding distance between the prediction and reference. - -This logs the embedding distance to LangSmith and returns a [`Matcher`](#matcher) instance for making assertions on the distance value. - -By default, this uses the OpenAI API for computing embeddings. - -**Parameters** - -- `prediction` (str): The predicted string to compare. -- `reference` (str): The reference string to compare against. -- `config` (Optional[EmbeddingConfig]): Optional configuration for the embedding distance evaluator. Supported options: - - `encoder`: A custom encoder function to encode the list of input strings to embeddings. Defaults to the OpenAI API. - - `metric`: The distance metric to use for comparison. Supported values: "cosine", "euclidean", "manhattan", "chebyshev", "hamming". - -**Returns** - -A [`Matcher`](#matcher) instance for the embedding distance value. - -#### `expect.edit_distance(prediction, reference, *, config=None)` - -Compute the string distance between the prediction and reference. - -This logs the string distance (Damerau-Levenshtein) to LangSmith and returns a [`Matcher`](#matcher) instance for making assertions on the distance value. - -This depends on the `rapidfuzz` package for string distance computation. - -**Parameters** - -- `prediction` (str): The predicted string to compare. -- `reference` (str): The reference string to compare against. -- `config` (Optional[EditDistanceConfig]): Optional configuration for the string distance evaluator. Supported options: - - `metric`: The distance metric to use for comparison. Supported values: "damerau_levenshtein", "levenshtein", "jaro", "jaro_winkler", "hamming", "indel". - - `normalize_score`: Whether to normalize the score between 0 and 1. - -**Returns** - -A [`Matcher`](#matcher) instance for the string distance value. - -#### `expect.value(value)` - -Create a [`Matcher`](#matcher) instance for making assertions on the given value. 
- -**Parameters** - -- `value` (Any): The value to make assertions on. - -**Returns** - -A [`Matcher`](#matcher) instance for the given value. - -#### `Matcher` - -A class for making assertions on expectation values. - -**`to_be_less_than(value)`** - -Assert that the expectation value is less than the given value. - -**`to_be_greater_than(value)` ** - -Assert that the expectation value is greater than the given value. - -**`to_be_between(min_value, max_value)`** - -Assert that the expectation value is between the given min and max values. - -**`to_be_approximately(value, precision=2)`** - -Assert that the expectation value is approximately equal to the given value. - -**`to_equal(value)`** - -Assert that the expectation value equals the given value. - -**`to_contain(value)`** - -Assert that the expectation value contains the given value. - -**`against(func)`** - -Assert the expectation value against a custom function. - -### `unit` API - -The `unit` decorator is used to mark a function as a test case for LangSmith. It ensures that the necessary example data is created and associated with the test function. The decorated function will be executed as a test case, and the results will be recorded and reported by LangSmith. - -#### `@unit(id=None, output_keys=None, client=None, test_suite_name=None)` - -Create a unit test case in LangSmith. - -**Parameters** - -- `id` (Optional[uuid.UUID]): A unique identifier for the test case. If not provided, an ID will be generated based on the test function's module and name. -- `output_keys` (Optional[Sequence[str]]): A list of keys to be considered as the output keys for the test case. These keys will be extracted from the test function's inputs and stored as the expected outputs. -- `client` (Optional[ls_client.Client]): An instance of the LangSmith client to be used for communication with the LangSmith service. If not provided, a default client will be used. -- `test_suite_name` (Optional[str]): The name of the test suite to which the test case belongs. If not provided, the test suite name will be determined based on the environment or the package name. - -**Environment Variables** - -- `LANGSMITH_TEST_CACHE`: If set, API calls will be cached to disk to save time and costs during testing. Recommended to commit the cache files to your repository for faster CI/CD runs. Requires the 'langsmith[vcr]' package to be installed. -- `LANGSMITH_TEST_TRACKING`: Set this variable to the path of a directory to enable caching of test results. This is useful for re-running tests without re-executing the code. Requires the 'langsmith[vcr]' package. diff --git a/versioned_docs/version-old/evaluation/faq/version-datasets.mdx b/versioned_docs/version-old/evaluation/faq/version-datasets.mdx deleted file mode 100644 index a2558e242..000000000 --- a/versioned_docs/version-old/evaluation/faq/version-datasets.mdx +++ /dev/null @@ -1,66 +0,0 @@ ---- -sidebar_label: Version Datasets -sidebar_position: 6 ---- - -# How to version datasets - -## Basics - -Any time you _add_, _update_, or _delete_ examples in your dataset, a new version of your dataset is created. This allows you to track changes to your dataset over time and to understand how your dataset has evolved. - -By default, the version is defined by the timestamp of the change. When you click on a particular version of a dataset (by timestamp) in the "Examples" tab, you can see the state of the dataset at that point in time. 
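The screenshot below shows this view in the UI. If you prefer to inspect a past version programmatically, one approach (a sketch; the dataset name and timestamp are placeholders) is to pass a timestamp to the `as_of` parameter of `list_examples`:

```python
from datetime import datetime

from langsmith import Client

client = Client()

# Placeholder dataset name and timestamp for illustration.
as_of_time = datetime(2024, 1, 1, 0, 0, 0)
examples_at_version = list(
    client.list_examples(dataset_name="my_dataset", as_of=as_of_time)
)
print(f"{len(examples_at_version)} examples as of {as_of_time}")
```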
- -![Version Datasets](../static/version_dataset.png) - -Note that examples are read-only when viewing a past version of the dataset. You will also see the operations that were applied between this version of the dataset and the "latest" version of the dataset. Also, by default the **latest version of the dataset is shown in the "Examples" tab** and experiments from **all versions are shown in the "Tests" tab**. - -In the "Tests" tab, you can see the results of tests run on the dataset at different versions. - -![Version Datasets](../static/version_dataset_tests.png) - -## Tagging versions - -You can also tag versions of your dataset to give them a more human-readable name. This can be useful for marking important milestones in your dataset's history. - -For example, you might tag a version of your dataset as "prod" and use it to run tests against your LLM pipeline. - -Tagging can be done in the UI by clicking on "+ Tag this version" in the "Examples" tab. - -![Tagging Datasets](../static/tag_this_version.png) - -You can also tag versions of your dataset using the SDK. Here's an example of how to tag a version of a dataset using the Python SDK: - -```python -from langsmith import Client -from datetime import datetime - -client = Client() - -initial_time = datetime(2024, 1, 1, 0, 0, 0) # The timestamp of the version you want to tag - -# You can tag a specific dataset version with a semantic name, like "prod" -client.update_dataset_tag( -    dataset_name="my_dataset", as_of=initial_time, tag="prod" -) -``` - -## Running experiments on specific versions of datasets - -You can execute an experiment on a specific version of a dataset in the SDK by using the `as_of` parameter in `list_examples`, which accepts either a timestamp or a version tag. - -Here is an example of how to run an experiment on a specific version of a dataset using the Python SDK: - -```python -from langsmith.evaluation import evaluate -from langsmith import Client - -client = Client() - -result = evaluate( -    lambda inputs: label_query(**inputs), # Your target to evaluate, [defined elsewhere] -    data=client.list_examples(dataset_name="my_dataset", as_of="prod"), -    evaluators=[correct_label], # Your evaluators, [defined elsewhere] -    experiment_prefix="dataset versioning example", -) -``` diff --git a/versioned_docs/version-old/evaluation/index.mdx b/versioned_docs/version-old/evaluation/index.mdx deleted file mode 100644 index 77985cc02..000000000 --- a/versioned_docs/version-old/evaluation/index.mdx +++ /dev/null @@ -1,142 +0,0 @@ ---- -sidebar_label: Overview -sidebar_position: 0 ---- - -import ThemedImage from "@theme/ThemedImage"; - -# Evaluation Overview - -## What are evaluations? - -Evaluations allow you to understand the performance of your LLM application over time. At its core, an evaluation is a function that takes in a set of inputs and outputs from your chain, agent, or model, -and returns a score (or multiple scores). This score may be based on comparing the outputs with reference outputs (e.g. with string matching or using an LLM as a judge). -However, there are also evaluators that don't require a reference output - for example, one that checks if the output is valid JSON, which is a common requirement in LLM applications. -LangSmith allows you to run evaluations on your application via `Datasets`, which are made up of `Examples`. - -## Components of an evaluation pipeline - -The following diagram outlines the building blocks for evaluations in LangSmith. 
`Datasets` define the inputs over which you run your chain, model, or agent (the `Task`), -and optionally the reference outputs against which your evaluator will compare the outputs of your `Task`. These datasets can be from any number of sources - -you might manually curate them, collect them from user input/feedback, or generate them via LLM. Your `Evaluator` can be any arbitrary function which returns a score -based on the inputs and outputs of your `Task`, and the reference output if desired. You can also use [one of LangSmith's off-the-shelf -evaluators](evaluation/faq/evaluator-implementations) to get started quickly! - - - -## Datasets - -`Datasets` are collections of `Examples`, the core building block for the evaluation workflow in LangSmith. -Examples provide the inputs over which you will be running your pipeline, -and, if applicable, the outputs that you will be comparing against. -All examples in a given dataset should follow the same schema. Examples contain an `"inputs"` dict and an `"output"` dict, -along with (optionally) a `metadata` dict. - -![Example](static/sample_langsmith_example.png) - -
- An Example in the LangSmith UI -
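As a rough sketch (with made-up values), a single example might look like this when represented as plain dictionaries, following the dataset schema of an `inputs` dict, an `outputs` dict, and optional `metadata`:

```python
# Hypothetical example record; the question, answer, and metadata values are placeholders.
example = {
    "inputs": {"question": "What is LangSmith?"},
    "outputs": {"answer": "A platform for tracing, testing, and evaluating LLM applications."},
    "metadata": {"source": "manually curated"},  # optional
}
```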
- -A single run of all your example inputs through your `Task` is called an `Experiment`. In LangSmith, you can easily view all the experiments that are associated -with your dataset, and track your application's performance over time! - -![Dataset](static/sample_langsmith_dataset.png) - -
- A Dataset in the LangSmith UI -
- -### Creating Datasets - -Datasets in LangSmith can be created in two main ways: - -- [In the LangSmith SDK](evaluation/faq/manage-datasets#how-to-manage-datasets-programmatically) with `create_dataset`. -- [In the LangSmith UI](evaluation/faq/manage-datasets) by clicking "New Dataset" from the [LangSmith datasets page](https://smith.langchain.com/datasets). These can - be uploaded as a CSV, or you can manually create examples in the UI. - -### Types of Datasets - -Dataset types communicate common input and output schemas. There are three types of datasets in LangSmith: `kv`, `llm`, and `chat`. `kv` datasets are the default type, and are -sufficient for almost all use-cases. `llm` and `chat` datasets can be useful to conveniently export datasets into known fine-tuning formats. - -- `kv`: In `kv` datasets, inputs and outputs can be arbitrary key-value pairs. These are useful when evaluating chains and agents that require - multiple inputs or that return multiple outputs. - The tradeoff with these datasets is that running evaluations on them can be a bit more involved. If there are multiple keys, you will have to manually specify the `prepare_data` - function in any off-the-shelf evaluators so they know what information to consider in generating a score. -- `llm`: `llm` datasets correspond to the string inputs and outputs from the "completion" style LLMS (string in, string out). The `"inputs"` dictionary contains a single `"input"` key mapped to a single prompt string. Similarly, the `"outputs"` dictionary contains a single `"output"` key mapped to a single response string. -- `chat`: `chat` datasets correspond to messages and generations from LLMs that expect structured "chat" messages as inputs and outputs. Each example row - expects an `"inputs"` dictionary containing a single `"input"` key mapped to a list of serialized chat messages. The `"outputs"` dictionary contains a single `"output"` key mapped to a single list of serialized chat messages. - -## Evaluators - -Evaluators are functions that help score how well your system did on a particular example. When running an evaluation, -your example inputs are run through your `Task` to produce `Runs`, which are then passed into your evaluator along with the `Example`. -The function then returns an `EvaluationResult`, which specifies your metric name and score. Evaluations in LangSmith are run via the `evaluate()` function. -The following diagram gives an overview of the data flow in an evaluation: - - -
- -The inputs to an evaluator consist of: - -1. An `Example` - the inputs for your pipeline and optionally the reference outputs or labels -2. A `Run` - observed output gathered from running the inputs through the `Task` - -An evaluator will then return an `EvaluationResult` (or similarly shaped dictionary), which is made up of: - -- `key`: The name the metric being evaluated -- `score`: The value of the metric on this example -- `comment`: the reasoning trajectory or other string information motivating the score - -### Types of Evaluators - -The evaluator itself can be any arbitrary function. There are a few different types of evaluators that are commonly used: - -- **Heuristics**: A heuristic evaluator is a hard-coded function that does some computation to determine a score. For example, you might write an - evaluator that checks whether the output of the system is an empty string, or determines if it is valid JSON. These would be considered **reference-free** evaluators, - as they don't consider any example output when making their decision. You might also want to check that the output of the system matches the reference output exactly, - which would be considered a **ground truth** evaluator because it compares the output to a reference. See [How to create custom evaluators](evaluation/faq/custom-evaluators). -- **LLM-as-judge**: An LLM-as-judge evaluator uses an LLM to score system output. For example, you might want to check whether your system is outputting - offensive content. This is **reference-free**, as there is no comparison to an example output. You might also want to check whether the system output has the same - meaning as the example output, which would be a **ground truth** evaluator. To get started with LLM-as-a-judge, try out LangSmith's [off-the-shelf evaluators](evaluation/faq/evaluator-implementations)! -- **Human**: You can also evaluate your runs manually. This can be done in LangSmith [via the SDK](tracing/faq/logging_feedback#capturing-feedback-programmatically), - or [in the LangSmith UI](tracing/faq/logging_feedback#annotating-traces-with-feedback). - -## Next steps - -To get started with code, check out the [Quick Start Guide](evaluation/quickstart). - -If you want to learn how to accomplish a particular task, check out our comprehensive [How-To Guides](evaluation/faq) - -For a higher-level set of recommendations on how to think about testing and evaluating your LLM app, check out the [evaluation recommendations](evaluation/recommendations) page. diff --git a/versioned_docs/version-old/evaluation/migration.mdx b/versioned_docs/version-old/evaluation/migration.mdx deleted file mode 100644 index 9aac37fce..000000000 --- a/versioned_docs/version-old/evaluation/migration.mdx +++ /dev/null @@ -1,199 +0,0 @@ ---- -sidebar_label: Migrating to `evaluate` -sidebar_position: 7 ---- - -# Migrating from `run_on_dataset` to `evaluate` - -In python, we've introduced a cleaner `evaluate()` function to replace the `run_on_dataset` function. While we are not deprecating the `run_on_dataset` function, the new function lets you get started and without needing to install `langchain` in your local environment. - -This guide will walk you through the process of migrating your existing code from using `run_on_dataset` to leveraging the benefits of `evaluate`. - -## Key Differences - -#### 1. `llm_or_chain_factory` -> first positional argument - -The "thing you are evaluating" (pipeline, target, model, chain, agent, etc.) 
is **always** the first positional argument and **always** has the following signature: - -```python -def predict(inputs: dict) -> dict: -    """Call your model or pipeline with the given inputs and return the predictions.""" -    # Example: -    # result = client.chat.completions.create(...) -    # response = result.choices[0].message.content -    return {"output": ...} -``` - -No need to specify the confusing "`llm_or_chain_factory`". If you need to create a new version of your object for each data point, initialize it within the `predict()` function. -If you want to evaluate a LangChain object (runnable, etc.), you can directly call `evaluate(chain.invoke, data=..., ...)`. - -#### 2. `dataset_name` -> `data` - -The data field accepts a broader range of inputs, including the dataset name, id, or an iterator over examples. This lets you easily evaluate over a subset of the data to quickly debug. - -If you were previously specifying a `dataset_version`, you can directly pass the target version like so: - -```python -dataset_version = "latest" # your tagged version - -results = evaluate( -    ..., -    data=client.list_examples(dataset_name="my_dataset", as_of=dataset_version), -    ... -) - -``` - -#### 3. `RunEvalConfig` -> `List[RunEvaluator]` - -The config has been deprecated (removing the LangChain dependency). Instead, directly provide a list of evaluators to the `evaluators` argument. - - a. Custom evaluators are simple functions that take a `Run` and an `Example` and return a dictionary with the evaluation results. For example: - -```python -def exact_match(run: Run, example: Example) -> dict: -    """Calculate the exact match score of the run.""" -    expected = example.outputs["answer"] -    predicted = run.outputs["output"] -    return {"score": expected.lower() == predicted.lower(), "key": "exact_match"} - -evaluate( -    ..., -    evaluators=[exact_match], - -) -``` - -Anything that subclasses `RunEvaluator` still works as it did before; we will automatically promote compatible functions to `RunEvaluator` instances. - - b. `LangChain` evaluators can be incorporated using the `LangChainStringEvaluator` wrapper. - -For example, if you were previously using the "Criteria" evaluator, this evaluation: - -```python -eval_config = RunEvalConfig( -    evaluators=[RunEvalConfig.Criteria( -        criteria={"usefulness": "The prediction is useful if..."}, -        llm=my_eval_llm, -    )] -) - -client.run_on_dataset(..., eval_config=eval_config) -``` - -becomes: - -```python -from langsmith.evaluation import LangChainStringEvaluator - -evaluators=[ -    LangChainStringEvaluator( -        "labeled_criteria", -        config={ -            "criteria": { -                "usefulness": "The prediction is useful if...", -            }, -            "llm": my_eval_llm, -        }, -    ), -] -``` - -c. For evaluating multi-key datasets using off-the-shelf LangChain evaluators, replace any `input_key`, `reference_key`, `prediction_key` with a custom `prepare_data` function. - -If your dataset has a single key for the inputs and reference answer, and if your target pipeline returns a response in a single key, the evaluators can automatically use these responses directly without any additional configuration. - -For multi-key datasets, you must specify which values to use for the model prediction (and optionally for the expected answer and/or inputs). This is done by providing a `prepare_data` function that converts a run and example to a dictionary of `{"input": ..., "prediction": ..., "reference": ...}`. 
- -```python -def prepare_data(run: Run, example: Example) -> dict: -    # Run is the trace of your pipeline -    # Example is a dataset record -    return { -        "prediction": run.outputs["output"], -        "input": example.inputs["input"], -        "reference": example.outputs["answer"], -    } - -qa_evaluator = LangChainStringEvaluator( -    "qa", -    prepare_data=prepare_data, -    config={"llm": my_qa_llm}, -) -``` - -#### 4. `batch_evaluators` -> `summary_evaluators`. - -These let you compute custom metrics over the whole dataset. For example, precision: - -```python -def precision(runs: List[Run], examples: List[Example]) -> dict: -    """Calculate the precision of the runs.""" -    expected = [example.outputs["answer"] for example in examples] -    predictions = [run.outputs["output"] for run in runs] -    tp = sum([p == e for p, e in zip(predictions, expected) if p == "yes"]) -    fp = sum([p == "yes" and e == "no" for p, e in zip(predictions, expected)]) -    return {"score": tp / (tp + fp), "key": "precision"} -``` - -#### 5. `project_metadata` -> `metadata`. - -#### 6. `project_name` -> `experiment_prefix`. - -`evaluate()` always appends an experiment uuid to the prefix to ensure uniqueness, so you don't have to -run into those confusing "project already exists" errors. - -#### 7. `concurrency_level` -> `max_concurrency`. - -## Migration Steps - -#### 1. Update your imports: - -```python -from langsmith.evaluation import evaluate -``` - -#### 2. Change your `run_on_dataset` call to `evaluate`: - -```python -results = evaluate( -    ..., -    data=..., -    evaluators=[...], -    summary_evaluators=[...], -    metadata=..., -    experiment_prefix=..., -    max_concurrency=..., -) -``` - -#### 3. If you were using a factory function, replace it with a direct invocation: - -```python -def predict(inputs: dict): -    my_pipeline = ... -    return my_pipeline.invoke(inputs) -``` - -#### 4. If you were using LangChain evaluators, wrap them with `LangChainStringEvaluator`: - -```python -from langsmith.evaluation import LangChainStringEvaluator - -evaluators=[ -    LangChainStringEvaluator("embedding_distance"), -    LangChainStringEvaluator( -        "labeled_criteria", -        config={"criteria": {"usefulness": "The prediction is useful if..."}}, -        prepare_data=prepare_criteria_data -    ), -] -``` - -#### 5. Update any references to `project_metadata`, `project_name`, `dataset_version`, and `concurrency_level` to use the new argument names. - -## Support - -If you encounter any issues during the migration process or have further questions, please don't hesitate to reach out to our support team at [support@langchain.dev](mailto:support@langchain.dev). We're here to help ensure a smooth transition! - -Happy evaluating! diff --git a/versioned_docs/version-old/evaluation/quickstart.mdx b/versioned_docs/version-old/evaluation/quickstart.mdx deleted file mode 100644 index c2836ba58..000000000 --- a/versioned_docs/version-old/evaluation/quickstart.mdx +++ /dev/null @@ -1,193 +0,0 @@ ---- -sidebar_label: Quick Start -sidebar_position: 1 ---- - -import Tabs from "@theme/Tabs"; -import CodeBlock from "@theme/CodeBlock"; -import { -  CodeTabs, -  PythonBlock, -  TypeScriptBlock, -} from "@site/src/components/InstructionsWithCode"; -import { ClientInstallationCodeTabs } from "@site/src/components/ClientInstallation"; - -# Evaluation Quick Start - -This guide helps you get started evaluating your AI system using LangSmith, so you can deploy the best performing model for your needs. It covers the basics. - -## 1. Install LangSmith - - - -## 2. 
Evaluate - -Evalution requires a system to test, [data](faq) to serve as test cases, and optionally evaluators to grade the results. - - dict: - messages = [{"role": "user", "content": inputs["question"]}] - response = openai_client.chat.completions.create(messages=messages, model="gpt-3.5-turbo") - return {"output": response}\n -# Define evaluators -def must_mention(run: Run, example: Example) -> dict: - prediction = run.outputs.get("output") or "" - required = example.outputs.get("must_mention") or [] - score = all(phrase in prediction for phrase in required) - return {"key":"must_mention", "score": score}\n -experiment_results = evaluate( - predict, # Your AI system - data=dataset_name, # The data to predict and grade over - evaluators=[must_mention], # The evaluators to score the results - experiment_prefix="rap-generator", # A prefix for your experiment names to easily identify them - metadata={ - "version": "1.0.0", - }, -)`, - }, - { - value: "typescript", - label: "TypeScript", - language: "typescript", - content: `import { Client } from "langsmith"; -import { Run, Example } from "langsmith"; -import { EvaluationResult } from "langsmith/evaluation"; -// Note: native evaluate() function support coming soon to the LangSmith TS SDK -import { runOnDataset } from "langchain/smith"; -import OpenAI from "openai";\n -const client = new Client(); -// Define dataset: these are your test cases -const datasetName = "Rap Battle Dataset"; -const dataset = await client.createDataset(datasetName, { - description: "Rap battle prompts.", -}); -await client.createExamples({ - inputs: [ - {question: "a rap battle between Atticus Finch and Cicero"}, - {question: "a rap battle between Barbie and Oppenheimer"}, - ], - outputs: [ - {must_mention: ["lawyer", "justice"]}, - {must_mention: ["plastic", "nuclear"]}, - ], - datasetId: dataset.id, -});\n -// Define AI system -const openaiClient = new OpenAI();\n -async function predictResult({ question }: { question: string }) { - const messages = [{ "role": "user", "content": question }]; - const output = await openaiClient.chat.completions.create({ - model: "gpt-3.5-turbo", - messages: messages - }); - return { output }; -}\n -// Define evaluators -const mustMention = async ({ run, example }: { run: Run; example?: Example; }): Promise => { - const mustMention: string[] = example?.outputs?.must_contain ?? []; - const score = mustMention.every((phrase) => - run?.outputs?.output.includes(phrase) - ); - return { - key: "must_mention", - score: score, - }; -};\n -await runOnDataset( - predictResult, // Your AI system - datasetName, // The data to predict and grade over - { - evaluationConfig: {customEvaluators: [mustMention] - }, - projectMetadata: { - version: "1.0.0", - }, -});`, - }, - ]} - groupId="client-language" -/> - -Configure your API key, then run the script to evaluate your system. - -`, - }, - { - value: "typescript", - label: "TypeScript", - language: "bash", - content: `export LANGCHAIN_API_KEY=`, - }, - ]} - groupId="client-language" -/> - -## 3. Review Results - -The evaluation results will be streamed to a new experiment linked to your "Rap Battle Dataset". You can view the results by clicking on the link printed by the `evaluate` function or by navigating to the [Datasets & Testing](https://smith.langchain.com/datasets) page, clicking "Rap Battle Dataset", and viewing the latest test run. - -There, you can inspect the traces and feedback generated from the evaluation configuration. 
- -![Eval test run screenshot](static/eval-test-run.png) - -You can click "Open Run" to view the trace and feedback generated for that example. - -![Eval trace screenshot](static/eval-run-trace.png) - -To compare to another test on this dataset, you can click "Compare Tests". - -![Compare Tests](static/compare-tests.png) - -## More on evaluation - -Congratulations! You've now created a dataset and used it to evaluate your agent or LLM. -To learn how to make your own custom evaluators, review the [Custom Evaluator](faq) guide. To learn more about some pre-built evaluators available in the LangChain open-source library, check out the [LangChain Evaluators](faq/evaluator-implementations) guide. diff --git a/versioned_docs/version-old/evaluation/recommendations.mdx b/versioned_docs/version-old/evaluation/recommendations.mdx deleted file mode 100644 index d6cc0b293..000000000 --- a/versioned_docs/version-old/evaluation/recommendations.mdx +++ /dev/null @@ -1,101 +0,0 @@ ---- -sidebar_label: Recommendations -sidebar_position: 6 ---- - -# Recommendations - -This conceptual guide shares thoughts on how to use testing and evaluations for your LLM applications. There is no one-size-fits-all solution, but we believe the most successful teams will adapt strategies from design, software development, and machine learning to their use cases to deliver better, more reliable results. - -### Test early and often - -While "unit tests" don't truly exist for the model, writing "minimum functionality tests" for each chain during the debugging and prototyping stage will help you scaffold more reliable systems. - -Datasets facilitate this. Using debugging projects, you can log runs while prototyping. From these runs, you can select representative samples to add to a "Functionality Test Dataset" for that component. Evaluators can be run in CI to ensure that individual chains (or other components) still perform as desired for known use cases. - -- Completing a specific structured schema -- Selecting the correct tool for a given question -- Extracting the correct information from a passage -- Generating valid code for a typical input. -- Avoiding unwanted behavior when given leading inputs (e.g., appropriate polite refusals, adversarial inputs, etc.) - -These datasets can range from anywhere between 10-100+ examples and will continue to grow as you capture more example traces and add them as known tests. - -### Create domain-specific evaluators - -LangChain has strong and configurable built-in evaluators for common tasks, and everyone will benefit from your [contributions to these evaluators](https://github.com/langchain-ai/langchain/tree/master/libs/langchain/langchain/evaluation). However, often the best evaluation metrics are domain-specific. Some examples include: - -- Evaluate the validity and efficiency of domain-specific code -- Applying custom rules to check the response output against a proprietary system -- Asserting numerical values are within a certain range - -### Use labels where possible - -When adding examples to a dataset, you can improve the output to represent a "gold standard" label. Evaluators that compare outputs against labels generally are much more reliable than those that have to operate "reference-free." - -Once you have deployed an application, capture and filter user feedback (even in testing deployments) to help improve the signal. 
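As a concrete sketch (the dataset name, inputs, and outputs below are placeholders), a curated "gold standard" label is simply the `outputs` you attach when adding an example via the SDK:

```python
from langsmith import Client

client = Client()

# Placeholder dataset and example content for illustration.
dataset = client.read_dataset(dataset_name="Functionality Test Dataset")
client.create_example(
    inputs={"question": "What is LangSmith?"},
    # The reviewed, corrected answer becomes the reference label evaluators compare against.
    outputs={"answer": "LangSmith is a platform for tracing and evaluating LLM applications."},
    dataset_id=dataset.id,
)
```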
- -### Use aggregate evals - -Testing individual data points is useful for asserting behavior on known examples, but a lot of information can only be measured in aggregate. Aggregating automated feedback over a dataset can help you detect differences in performance across component versions or between configurations. - -These datasets usually contain 100-1000+ examples in order to return statistically significant results. - -### Measure model stability - -LLMs can be non-deterministic. They can also be sensitive to small (even imperceptible) changes in the input. Generating a dataset of synthetic examples is a good way to measure this. Some common approaches to address this usually start from a representative dataset and then: - -- Generate examples using explicit transformations that don't change the meaning of the input, such as changing pronouns or roles, verb tense, misspellings, paraphrasing, etc. These are semantic invariance tests. -- Generate "similar examples" from the model (or differently tokenized LLMs). When evaluating, ensure that the correctness or other metrics don't change, or ask the model to assert whether the outputs are equivalent. -- (If the model's temperature > 0) run the model multiple times and grade whether outputs are consistent. - -### Measure performance on subsets - -Use tags or organize datasets based on cohorts or important properties to return stratified results for different groups. This can help you quantify your application's bias or other issues that might not be apparent when looking at intermingled results. - -### Evaluate production data - -Once you have deployed an application, you can use the same evaluators to measure performance or behavior on real user data. This can help you identify issues that might not be apparent during testing, and it can help quantify signals that are contained in the unstructured data. These can be used alongside other application metrics to help better understand ways to improve your application. - -You can also log proxy metrics (such as click-through/response rate) as feedback to drive better analysis. - -Check out some cookbook examples for this: - -- [Evaluate production runs (batch)](https://github.com/langchain-ai/langsmith-cookbook/blob/main/feedback-examples/algorithmic-feedback/algorithmic_feedback.ipynb): automate feedback metrics for advanced monitoring and performance tuning. -- [Evaluate production runs (real-time)](https://github.com/langchain-ai/langsmith-cookbook/blob/main/feedback-examples/realtime-algorithmic-feedback/realtime_feedback.ipynb): automatically generate feedback metrics for every run using an async callback. - -### Don't train on test datasets - -If you've ever heard of the "train, validation, test" splits in ML, you are well aware that if you use a dataset for optimizing a prompt, fine-tuning an LLM, or picking other configurable parameters in your setup, it's important to keep this separate from the datasets you use for testing. Otherwise, you risk "overfitting" to the test data, which will likely lead to poor performance on new data once you deploy it. - -### Test the model yourself - -Looking at the data remains an effective (albeit time-consuming) evaluation technique in many scenarios. You can evaluate runs yourself and log feedback from your application users. - -LangSmith exposes this in the client via a `create_feedback` method. We recommend adding as many signals as possible and using tags and aggregated feedback to help you understand what is happening in your application. 
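A minimal sketch of logging a manual review score against a run (the run ID and feedback key are placeholders):

```python
from langsmith import Client

client = Client()

# Placeholder run ID and feedback key for illustration.
client.create_feedback(
    run_id="00000000-0000-0000-0000-000000000000",
    key="human_review",
    score=1,
    comment="Reviewer judged the answer accurate and well formatted.",
)
```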
- -### Ask appropriate questions - -When thinking of what evaluator to use, it is helpful to think of "what question I need to answer" to be sure that my application has the desired behavior. Then it's vital to decide "what question can I reasonably answer given the input data". - -Asking a model if an output is "correct" will likely return an unreliable result, unless the model has additional information (such as a ground-truth label) that wasn't available to the evaluated model. - -It can be useful to select evaluators based on whether labels are present and what types of information would be useful for your concerns. Below are a few examples: - -| | Reference Free | With References | -| ----------- | ---------------------------------------------------------------------------------------------------------------------------- | ------------------------------------------------------- | -| Pass/Fail | Exact/fuzzy string match; "Does this output answer the user's question? YES or NO | "Is the generated output equivalent to the answer?" | -| Scoring | Perplexity / Normalized log probs; "On a scale from 1 to 5, 1 being a \_\_\_ and 5 being \_\_\_, how \_\_\_ is this output?" | ROUGE/BLEU; “On a scale from 1 to 5, how similar is …?” | -| Labeling | "Is this output mostly related to sports, finance, pop culture, or other?" | _less useful here_ | -| Comparisons | Which of these outputs best responds to the following input: 1. \_\_\_ 2. \_\_\_ | _less useful here_ | - -You'll notice that we've included some more traditional NLP measurements like "perplexity" or "ROUGE" alongside natural language questions prompted to an LLM. Both techniques have their place and very notable limitations. We recommend using a combination of these approaches to get a more complete picture of your application's performance. - -### Other Resources - -There's a lot of great work that has been done in this space. 
Some resources our community have found useful include: - -- ELeutherAI's [LM Evaluation Harness](https://github.com/EleutherAI/lm-evaluation-harness/) -- HuggingFace [Evaluate](https://huggingface.co/docs/evaluate/index) -- OpenAI's [evals](https://github.com/openai/evals/) repository -- Chatbot Arena [lmsys](https://chat.lmsys.org/) diff --git a/versioned_docs/version-old/evaluation/static/add_evaluator.png b/versioned_docs/version-old/evaluation/static/add_evaluator.png deleted file mode 100644 index 911bee1ad..000000000 Binary files a/versioned_docs/version-old/evaluation/static/add_evaluator.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/add_to_dataset.png b/versioned_docs/version-old/evaluation/static/add_to_dataset.png deleted file mode 100644 index 7692dbd94..000000000 Binary files a/versioned_docs/version-old/evaluation/static/add_to_dataset.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/compare-tests.png b/versioned_docs/version-old/evaluation/static/compare-tests.png deleted file mode 100644 index 9ab260ef7..000000000 Binary files a/versioned_docs/version-old/evaluation/static/compare-tests.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/create_dataset_csv.png b/versioned_docs/version-old/evaluation/static/create_dataset_csv.png deleted file mode 100644 index dfcc0d16f..000000000 Binary files a/versioned_docs/version-old/evaluation/static/create_dataset_csv.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/create_evaluator.png b/versioned_docs/version-old/evaluation/static/create_evaluator.png deleted file mode 100644 index 609384c0e..000000000 Binary files a/versioned_docs/version-old/evaluation/static/create_evaluator.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/eval-run-trace.png b/versioned_docs/version-old/evaluation/static/eval-run-trace.png deleted file mode 100644 index 778d92bb0..000000000 Binary files a/versioned_docs/version-old/evaluation/static/eval-run-trace.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/eval-test-run.png b/versioned_docs/version-old/evaluation/static/eval-test-run.png deleted file mode 100644 index b98455247..000000000 Binary files a/versioned_docs/version-old/evaluation/static/eval-test-run.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/evaluator_prompt.png b/versioned_docs/version-old/evaluation/static/evaluator_prompt.png deleted file mode 100644 index 4f939365a..000000000 Binary files a/versioned_docs/version-old/evaluation/static/evaluator_prompt.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/export-dataset-button.png b/versioned_docs/version-old/evaluation/static/export-dataset-button.png deleted file mode 100644 index 04270d7c7..000000000 Binary files a/versioned_docs/version-old/evaluation/static/export-dataset-button.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/export-dataset-modal.png b/versioned_docs/version-old/evaluation/static/export-dataset-modal.png deleted file mode 100644 index e470e36ff..000000000 Binary files a/versioned_docs/version-old/evaluation/static/export-dataset-modal.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/filter_to_regressions.png b/versioned_docs/version-old/evaluation/static/filter_to_regressions.png deleted file mode 100644 index 86b6c11e1..000000000 
Binary files a/versioned_docs/version-old/evaluation/static/filter_to_regressions.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/input_variables_playground.png b/versioned_docs/version-old/evaluation/static/input_variables_playground.png deleted file mode 100644 index 86a762d24..000000000 Binary files a/versioned_docs/version-old/evaluation/static/input_variables_playground.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_app_flow.png b/versioned_docs/version-old/evaluation/static/langsmith_app_flow.png deleted file mode 100644 index 377d32731..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_app_flow.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_app_flow_dark.png b/versioned_docs/version-old/evaluation/static/langsmith_app_flow_dark.png deleted file mode 100644 index a88f7cecd..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_app_flow_dark.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_evaluation_dark.png b/versioned_docs/version-old/evaluation/static/langsmith_evaluation_dark.png deleted file mode 100644 index 52dcd77fe..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_evaluation_dark.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_evaluators.png b/versioned_docs/version-old/evaluation/static/langsmith_evaluators.png deleted file mode 100644 index 1c530412c..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_evaluators.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_landscape_v2.png b/versioned_docs/version-old/evaluation/static/langsmith_landscape_v2.png deleted file mode 100644 index 132894887..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_landscape_v2.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_landscape_v2_dark.png b/versioned_docs/version-old/evaluation/static/langsmith_landscape_v2_dark.png deleted file mode 100644 index 01858f5f3..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_landscape_v2_dark.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_summary.png b/versioned_docs/version-old/evaluation/static/langsmith_summary.png deleted file mode 100644 index 7855d68b9..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_summary.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/langsmith_summary_dark.png b/versioned_docs/version-old/evaluation/static/langsmith_summary_dark.png deleted file mode 100644 index cf44965a5..000000000 Binary files a/versioned_docs/version-old/evaluation/static/langsmith_summary_dark.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/modify_example.png b/versioned_docs/version-old/evaluation/static/modify_example.png deleted file mode 100644 index 0f034522f..000000000 Binary files a/versioned_docs/version-old/evaluation/static/modify_example.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/playground_evaluator_results.png b/versioned_docs/version-old/evaluation/static/playground_evaluator_results.png deleted file mode 100644 index a7a68f325..000000000 Binary files 
a/versioned_docs/version-old/evaluation/static/playground_evaluator_results.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/playground_experiment_results.png b/versioned_docs/version-old/evaluation/static/playground_experiment_results.png deleted file mode 100644 index 8ee7c986f..000000000 Binary files a/versioned_docs/version-old/evaluation/static/playground_experiment_results.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/regression_view.png b/versioned_docs/version-old/evaluation/static/regression_view.png deleted file mode 100644 index d891593bf..000000000 Binary files a/versioned_docs/version-old/evaluation/static/regression_view.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/sample_langsmith_dataset.png b/versioned_docs/version-old/evaluation/static/sample_langsmith_dataset.png deleted file mode 100644 index a741b571b..000000000 Binary files a/versioned_docs/version-old/evaluation/static/sample_langsmith_dataset.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/sample_langsmith_example.png b/versioned_docs/version-old/evaluation/static/sample_langsmith_example.png deleted file mode 100644 index 9677db78b..000000000 Binary files a/versioned_docs/version-old/evaluation/static/sample_langsmith_example.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/select_baseline.png b/versioned_docs/version-old/evaluation/static/select_baseline.png deleted file mode 100644 index 00b933762..000000000 Binary files a/versioned_docs/version-old/evaluation/static/select_baseline.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/select_columns.png b/versioned_docs/version-old/evaluation/static/select_columns.png deleted file mode 100644 index 2548198c0..000000000 Binary files a/versioned_docs/version-old/evaluation/static/select_columns.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/select_feedback.png b/versioned_docs/version-old/evaluation/static/select_feedback.png deleted file mode 100644 index fa2263ae8..000000000 Binary files a/versioned_docs/version-old/evaluation/static/select_feedback.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/switch_to_dataset.png b/versioned_docs/version-old/evaluation/static/switch_to_dataset.png deleted file mode 100644 index 06a8ce062..000000000 Binary files a/versioned_docs/version-old/evaluation/static/switch_to_dataset.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/tag_this_version.png b/versioned_docs/version-old/evaluation/static/tag_this_version.png deleted file mode 100644 index b257fcaa5..000000000 Binary files a/versioned_docs/version-old/evaluation/static/tag_this_version.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/unit-test-suite.png b/versioned_docs/version-old/evaluation/static/unit-test-suite.png deleted file mode 100644 index aa6da19e6..000000000 Binary files a/versioned_docs/version-old/evaluation/static/unit-test-suite.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/version_dataset.png b/versioned_docs/version-old/evaluation/static/version_dataset.png deleted file mode 100644 index 73ef3af6e..000000000 Binary files a/versioned_docs/version-old/evaluation/static/version_dataset.png and /dev/null differ diff --git 
a/versioned_docs/version-old/evaluation/static/version_dataset_tests.png b/versioned_docs/version-old/evaluation/static/version_dataset_tests.png deleted file mode 100644 index 8f406a616..000000000 Binary files a/versioned_docs/version-old/evaluation/static/version_dataset_tests.png and /dev/null differ diff --git a/versioned_docs/version-old/evaluation/static/view_results.png b/versioned_docs/version-old/evaluation/static/view_results.png deleted file mode 100644 index 9c032b279..000000000 Binary files a/versioned_docs/version-old/evaluation/static/view_results.png and /dev/null differ diff --git a/versioned_docs/version-old/hub/dev-setup.mdx b/versioned_docs/version-old/hub/dev-setup.mdx deleted file mode 100644 index 503c03801..000000000 --- a/versioned_docs/version-old/hub/dev-setup.mdx +++ /dev/null @@ -1,44 +0,0 @@ ---- -sidebar_label: Developer Setup -sidebar_position: 2 ---- - -import { - HubInstallationCodeTabs, - HubPullCodeTabs, - HubPushCodeTabs, -} from "@site/src/components/Hub"; - -# Developer Setup - -This guide will continue from the hub quickstart, using the Python or TypeScript SDK to interact with the hub instead of the Playground UI. - -This guide assumes you've gone through the Hub [Quick Start](./quickstart) including login-required steps. - -If you don't yet have an account, you'll only be able to pull public objects. - -## 1. Install/upgrade packages - -**Note:** You likely need to upgrade even if they're already installed! - - - -## 2. Configuring environment variables - -Get an API key for your **Personal** organization if you have not yet. The hub will not work with your non-personal organization's api key! - -```bash -export LANGCHAIN_HUB_API_KEY="ls_..." -``` - -If you already have `LANGCHAIN_API_KEY` set to a personal organization’s api key from LangSmith, you can skip this. - -## 3. Pull an object from the hub and use it - - - -## 4. Push a prompt to your personal organization - -For this step, you'll need the `handle` for your account! - - diff --git a/versioned_docs/version-old/hub/faq.mdx b/versioned_docs/version-old/hub/faq.mdx deleted file mode 100644 index 7803dfd05..000000000 --- a/versioned_docs/version-old/hub/faq.mdx +++ /dev/null @@ -1,45 +0,0 @@ ---- -sidebar_label: FAQs -sidebar_position: 3 ---- - -# Frequently Asked Questions - -### What is LangChain Hub? - -[LangChain Hub](https://smith.langchain.com/hub) lets you discover, version control, and experiment with different prompts for LangChain and LLMs in general directly in your browser. - -### How do I share a private prompt with my teammates? - -You can share prompts within a LangSmith organization by uploading them within a shared organization. - -First, create an API key for your organization, then set the variable in your development environment: - -```bash -export LANGCHAIN_HUB_API_KEY = "ls__.." -``` - -Then, you can upload prompts to the organization. Assuming your organization's handle is "my-organization": - -```python -from langchain import hub - -prompt = ... -hub.push("my-organization/my-prompt-name", prompt, new_repo_is_public=False) -``` - -Now, all your team-members within your LangSmith organization will be able to view, pull, and open the prompt in the playground. - -### Why can't I push anything other than prompts? - -Hub currently only supports LangChain prompt objects. We are working on adding support for more! - -If you have a specific request, please join the `hub-feedback` [discord](https://discord.gg/6adMQxSpJS) channel and let us know! 
- -### Can I upload a prompt to the hub from a LangSmith Trace? - -Coming soon! - -### Can LangChain Hub do \_\_\_\_? - -Maybe, and we'd love to hear from you! Please join the `hub-feedback` [discord](https://discord.gg/6adMQxSpJS) channel diff --git a/versioned_docs/version-old/hub/quickstart.mdx b/versioned_docs/version-old/hub/quickstart.mdx deleted file mode 100644 index 69837380d..000000000 --- a/versioned_docs/version-old/hub/quickstart.mdx +++ /dev/null @@ -1,126 +0,0 @@ ---- -sidebar_label: Quick Start -sidebar_position: 1 ---- - -# Quick Start - -## What is LangChain Hub? - -<> -
-