From b6a19eb914ca580170b55c5d792ef6c3ec0e4d95 Mon Sep 17 00:00:00 2001
From: anakin87 <stefanofiorucci@gmail.com>
Date: Wed, 10 Jun 2026 14:06:02 +0200
Subject: [PATCH 1/6] update tutorials to use transformers integration

---
 index.toml                                    |   10 +-
 tutorials/27_First_RAG_Pipeline.ipynb         | 2173 ++++++++---------
 tutorials/29_Serializing_Pipelines.ipynb      |  159 +-
 tutorials/33_Hybrid_Retrieval.ipynb           |   26 +-
 tutorials/34_Extractive_QA_Pipeline.ipynb     |  333 +--
 ...r_and_TransformersZeroShotTextRouter.ipynb |  374 +--
 .../44_Creating_Custom_SuperComponents.ipynb  |  121 +-
 ...oQuant_Quantization_with_HuggingFace.ipynb |   74 +-
 8 files changed, 1124 insertions(+), 2146 deletions(-)

diff --git a/index.toml b/index.toml
index d08c6af..69c02fb 100644
--- a/index.toml
+++ b/index.toml
@@ -12,7 +12,7 @@ notebook = "27_First_RAG_Pipeline.ipynb"
 aliases = []
 completion_time = "10 min"
 created_at = 2023-12-05
-dependencies = ["datasets>=2.6.1", "sentence-transformers>=4.1.0", "mistral-haystack"]
+dependencies = ["datasets>=2.6.1", "sentence-transformers>=4.1.0", "mistral-haystack", "transformers-haystack"]
 featured = true
 
 [[tutorial]]
@@ -35,7 +35,7 @@ notebook = "29_Serializing_Pipelines.ipynb"
 aliases = []
 completion_time = "10 min"
 created_at = 2024-01-29
-dependencies = ["transformers[torch]"]
+dependencies = ["transformers-haystack"]
 
 [[tutorial]]
 title = "Preprocessing Different File Types"
@@ -98,7 +98,7 @@ notebook = "34_Extractive_QA_Pipeline.ipynb"
 aliases = []
 completion_time = "10 min"
 created_at = 2024-02-09
-dependencies = ["accelerate", "sentence-transformers", "datasets", "transformers<5"]
+dependencies = ["accelerate", "sentence-transformers", "datasets", "transformers<5", "transformers-haystack"]
 
 [[tutorial]]
 title = "Evaluating RAG Pipelines"
@@ -154,7 +154,7 @@ notebook = "41_Query_Classification_with_TransformersTextRouter_and_Transformers
 aliases = []
 completion_time = "25 min"
 created_at = 2024-10-15
-dependencies = ["sentence-transformers>=4.1.0", "gradio", "torch", "sentencepiece", "datasets", "accelerate", "transformers<5"]
+dependencies = ["sentence-transformers>=4.1.0", "gradio", "torch", "sentencepiece", "datasets", "accelerate", "transformers<5", "transformers-haystack"]
 
 [[tutorial]]
 title = "Retrieving a Context Window Around a Sentence"
@@ -258,6 +258,6 @@ notebook = "49_TurboQuant_Quantization_with_HuggingFace.ipynb"
 aliases = []
 completion_time = "20 min"
 created_at = 2026-03-30
-dependencies = ["haystack-ai", "turboquant-vllm", "transformers"]
+dependencies = ["haystack-ai", "turboquant-vllm", "transformers-haystack"]
 featured = false
 python_version = "3.12"
\ No newline at end of file
diff --git a/tutorials/27_First_RAG_Pipeline.ipynb b/tutorials/27_First_RAG_Pipeline.ipynb
index a83ef1f..ed0518a 100644
--- a/tutorials/27_First_RAG_Pipeline.ipynb
+++ b/tutorials/27_First_RAG_Pipeline.ipynb
@@ -1,1197 +1,1160 @@
 {
-  "cells": [
-    {
-      "cell_type": "markdown",
-      "metadata": {},
-      "source": [
-        "# Tutorial: Creating Your First QA Pipeline with Retrieval-Augmentation\n",
-        "\n",
-        "- **Level**: Beginner\n",
-        "- **Time to complete**: 10 minutes\n",
-        "- **Components Used**: [`InMemoryDocumentStore`](https://docs.haystack.deepset.ai/docs/inmemorydocumentstore), [`SentenceTransformersDocumentEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder), [`SentenceTransformersTextEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), [`ChatPromptBuilder`](https://docs.haystack.deepset.ai/docs/chatpromptbuilder), and a [`ChatGenerator`](https://docs.haystack.deepset.ai/docs/generators) such as [`OpenAIChatGenerator`](https://docs.haystack.deepset.ai/docs/openaichatgenerator), [`MistralChatGenerator`](https://docs.haystack.deepset.ai/docs/mistralchatgenerator), or [`HuggingFaceLocalChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfacelocalchatgenerator).\n",
-        "- **Prerequisites**: Access to a large language model, either an **API key** from a provider or a **locally or on-premises hosted** model (for example on Colab runtime).\n",
-        "- **Goal**: After completing this tutorial, you'll have learned the new prompt syntax and how to use ChatPromptBuilder with a ChatGenerator to build a generative question-answering pipeline with retrieval-augmentation."
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "LFqHcXYPO-qZ"
-      },
-      "source": [
-        "## Overview\n",
-        "\n",
-        "This tutorial shows you how to create a generative question-answering pipeline using the retrieval-augmentation ([RAG](https://www.deepset.ai/blog/llms-retrieval-augmentation)) approach with Haystack. The process involves four main components: [SentenceTransformersTextEmbedder](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder) for creating an embedding for the user query, [InMemoryEmbeddingRetriever](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever) for fetching relevant documents, [ChatPromptBuilder](https://docs.haystack.deepset.ai/docs/chatpromptbuilder) for creating a template prompt, and a [ChatGenerator](https://docs.haystack.deepset.ai/docs/generators) for generating the final answer.\n",
-        "\n",
-        "The LLM behind that generator can be **hosted in the cloud**, for example with [OpenAI](https://haystack.deepset.ai/integrations/openai), [Anthropic](https://haystack.deepset.ai/integrations/anthropic), [Google](https://haystack.deepset.ai/integrations/google-genai), [Mistral](https://haystack.deepset.ai/integrations/mistral), or other providers, usually by setting an API key in the environment or **run locally**, for example via [Ollama](https://haystack.deepset.ai/integrations/ollama) or [vLLM](https://haystack.deepset.ai/integrations/vllm), or **on a Colab VM** by loading an open-weight model from Hugging Face. The *Initialize a ChatGenerator* section shows three concrete options (OpenAI, Mistral, and a local model).\n",
-        "\n",
-        "For this tutorial, you'll use the Wikipedia pages of [Seven Wonders of the Ancient World](https://en.wikipedia.org/wiki/Wonders_of_the_World) as Documents, but you can replace them with any text you want.\n"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "Kww5B_vXO-qZ"
-      },
-      "source": [
-        "## Installing Haystack\n",
-        "\n",
-        "Install Haystack and other required packages with `pip`:"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "UQbU8GUfO-qZ",
-        "outputId": "7a4ef73b-8822-467e-9979-a75169b36729"
-      },
-      "outputs": [],
-      "source": [
-        "%%bash\n",
-        "\n",
-        "pip install haystack-ai mistral-haystack \"datasets>=2.6.1\" \"sentence-transformers>=4.1.0\""
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "_lvfew16O-qa"
-      },
-      "source": [
-        "## Fetching and Indexing Documents\n",
-        "\n",
-        "You'll start creating your question answering system by downloading the data and indexing the data with its embeddings to a DocumentStore.\n",
-        "\n",
-        "In this tutorial, you will take a simple approach to writing documents and their embeddings into the DocumentStore. For a full indexing pipeline with preprocessing, cleaning and splitting, check out our tutorial on [Preprocessing Different File Types](https://haystack.deepset.ai/tutorials/30_file_type_preprocessing_index_pipeline).\n",
-        "\n",
-        "\n",
-        "### Initializing the DocumentStore\n",
-        "\n",
-        "Initialize a DocumentStore to index your documents. A DocumentStore stores the Documents that the question answering system uses to find answers to your questions. In this tutorial, you'll be using the `InMemoryDocumentStore`."
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": 2,
-      "metadata": {
-        "id": "CbVN-s5LO-qa"
-      },
-      "outputs": [],
-      "source": [
-        "from haystack.document_stores.in_memory import InMemoryDocumentStore\n",
-        "\n",
-        "document_store = InMemoryDocumentStore()"
-      ]
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": "# Tutorial: Creating Your First QA Pipeline with Retrieval-Augmentation\n\n- **Level**: Beginner\n- **Time to complete**: 10 minutes\n- **Components Used**: [`InMemoryDocumentStore`](https://docs.haystack.deepset.ai/docs/inmemorydocumentstore), [`SentenceTransformersDocumentEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder), [`SentenceTransformersTextEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), [`ChatPromptBuilder`](https://docs.haystack.deepset.ai/docs/chatpromptbuilder), and a [`ChatGenerator`](https://docs.haystack.deepset.ai/docs/generators) such as [`OpenAIChatGenerator`](https://docs.haystack.deepset.ai/docs/openaichatgenerator), [`MistralChatGenerator`](https://docs.haystack.deepset.ai/docs/mistralchatgenerator), or [`TransformersChatGenerator`](https://docs.haystack.deepset.ai/docs/transformerschatgenerator).\n- **Prerequisites**: Access to a large language model, either an **API key** from a provider or a **locally or on-premises hosted** model (for example on Colab runtime).\n- **Goal**: After completing this tutorial, you'll have learned the new prompt syntax and how to use ChatPromptBuilder with a ChatGenerator to build a generative question-answering pipeline with retrieval-augmentation."
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "LFqHcXYPO-qZ"
+   },
+   "source": [
+    "## Overview\n",
+    "\n",
+    "This tutorial shows you how to create a generative question-answering pipeline using the retrieval-augmentation ([RAG](https://www.deepset.ai/blog/llms-retrieval-augmentation)) approach with Haystack. The process involves four main components: [SentenceTransformersTextEmbedder](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder) for creating an embedding for the user query, [InMemoryEmbeddingRetriever](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever) for fetching relevant documents, [ChatPromptBuilder](https://docs.haystack.deepset.ai/docs/chatpromptbuilder) for creating a template prompt, and a [ChatGenerator](https://docs.haystack.deepset.ai/docs/generators) for generating the final answer.\n",
+    "\n",
+    "The LLM behind that generator can be **hosted in the cloud**, for example with [OpenAI](https://haystack.deepset.ai/integrations/openai), [Anthropic](https://haystack.deepset.ai/integrations/anthropic), [Google](https://haystack.deepset.ai/integrations/google-genai), [Mistral](https://haystack.deepset.ai/integrations/mistral), or other providers, usually by setting an API key in the environment; **run locally**, for example via [Ollama](https://haystack.deepset.ai/integrations/ollama) or [vLLM](https://haystack.deepset.ai/integrations/vllm); or run **on a Colab VM** by loading an open-weight model from Hugging Face. The *Initialize a ChatGenerator* section shows three concrete options (OpenAI, Mistral, and a local model).\n",
+    "\n",
+    "For this tutorial, you'll use the Wikipedia pages of [Seven Wonders of the Ancient World](https://en.wikipedia.org/wiki/Wonders_of_the_World) as Documents, but you can replace them with any text you want.\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "Kww5B_vXO-qZ"
+   },
+   "source": [
+    "## Installing Haystack\n",
+    "\n",
+    "Install Haystack and other required packages with `pip`:"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/"
     },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "yL8nuJdWO-qa"
-      },
-      "source": [
-        "> `InMemoryDocumentStore` is the simplest DocumentStore to get started with. It requires no external dependencies and it's a good option for smaller projects and debugging. But it doesn't scale up so well to larger Document collections, so it's not a good choice for production systems. To learn more about the different types of external databases that Haystack supports, see [DocumentStore Integrations](https://haystack.deepset.ai/integrations?type=Document+Store)."
-      ]
+    "id": "UQbU8GUfO-qZ",
+    "outputId": "7a4ef73b-8822-467e-9979-a75169b36729"
+   },
+   "outputs": [],
+   "source": "%%bash\n\npip install haystack-ai mistral-haystack transformers-haystack \"datasets>=2.6.1\" \"sentence-transformers>=4.1.0\""
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "_lvfew16O-qa"
+   },
+   "source": [
+    "## Fetching and Indexing Documents\n",
+    "\n",
+    "You'll start creating your question answering system by downloading the data and indexing it, together with its embeddings, in a DocumentStore.\n",
+    "\n",
+    "In this tutorial, you will take a simple approach to writing documents and their embeddings into the DocumentStore. For a full indexing pipeline with preprocessing, cleaning and splitting, check out our tutorial on [Preprocessing Different File Types](https://haystack.deepset.ai/tutorials/30_file_type_preprocessing_index_pipeline).\n",
+    "\n",
+    "\n",
+    "### Initializing the DocumentStore\n",
+    "\n",
+    "Initialize a DocumentStore to index your documents. A DocumentStore stores the Documents that the question answering system uses to find answers to your questions. In this tutorial, you'll be using the `InMemoryDocumentStore`."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "id": "CbVN-s5LO-qa"
+   },
+   "outputs": [],
+   "source": [
+    "from haystack.document_stores.in_memory import InMemoryDocumentStore\n",
+    "\n",
+    "document_store = InMemoryDocumentStore()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "yL8nuJdWO-qa"
+   },
+   "source": [
+    "> `InMemoryDocumentStore` is the simplest DocumentStore to get started with. It requires no external dependencies and it's a good option for smaller projects and debugging. But it doesn't scale up so well to larger Document collections, so it's not a good choice for production systems. To learn more about the different types of external databases that Haystack supports, see [DocumentStore Integrations](https://haystack.deepset.ai/integrations?type=Document+Store)."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "XvLVaFHTO-qb"
+   },
+   "source": [
+    "The DocumentStore is now ready. Now it's time to fill it with some Documents."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "HryYZP9ZO-qb"
+   },
+   "source": [
+    "### Fetch the Data\n",
+    "\n",
+    "You'll use the Wikipedia pages of [Seven Wonders of the Ancient World](https://en.wikipedia.org/wiki/Wonders_of_the_World) as Documents. We preprocessed the data and uploaded it to Hugging Face as the [Seven Wonders](https://huggingface.co/datasets/bilgeyucel/seven-wonders) dataset. Thus, you don't need to perform any additional cleaning or splitting.\n",
+    "\n",
+    "Fetch the data and convert it into Haystack Documents:"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/",
+     "height": 256,
+     "referenced_widgets": [
+      "b22af125522742d4a83e95890e582058",
+      "bab24f7e38c54ecca22a5551bc708a8e",
+      "879852bee39a471f86528f0f8afe58f7",
+      "31249898b08240df919cbd951bed2ccd",
+      "8652edf5598542b990aa91472e6d698f",
+      "2690be8f1f744602b9b393e6438fd559",
+      "1fa0537a43e04678880a1d063e4100be",
+      "d8dee92388ae4ddcb1639ae0625d7136",
+      "5b690d1088194714b83d401b7667bdd2",
+      "3137d503b8d34f56ab5c458018d0f575",
+      "5497fb84edbd4332adbff6de18a33015",
+      "c3fca5ba78d2467da72fb1abd0b01ec3",
+      "9f84829b414345a29d5acaf0c0d99bd5",
+      "7ef46645be63425f857db5349da4a3a9",
+      "45aa957278ce483e9ddf1aa3932e8789",
+      "8519f294cae34825afdd69bd03229db3",
+      "cb78d35eb8e741c1b30b33bb42d04621",
+      "6886a8c59b6c4ea693d511b874c12c51",
+      "be5d50edbf2449a59508feab6d3da98c",
+      "9a2686b5238d412a8df69f996429c9b2",
+      "6d4989d458d9420491ea50c2e8923597",
+      "a7adbec1f16f4e39b4aa27373993f532",
+      "041e6870096b4f8e95a10274524065ab",
+      "54169d1347cd41b7845616a98a3b38e8",
+      "db436133e86f425cad8c5cc28eea6c03",
+      "bb419307a3e547ea8455e89d70390c42",
+      "9aab6009b2544ce5994e4e26c9182e36",
+      "2a4c9085eb2348c6a4da76679b390d1f",
+      "d6c7c125d594416b92376b4417246af1",
+      "889f5a03fac949ebbfeb4e840dcb57d3",
+      "5f548252e5b845f9bb54dc7820a8835a",
+      "01707d970b6443c9bc0ea9602b0b1f5e",
+      "70d9add61b3e4c26a278b482a1380e26"
+     ]
     },
+    "id": "INdC3WvLO-qb",
+    "outputId": "d1515765-20ea-44db-c8a8-a68776fafdab"
+   },
+   "outputs": [
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "XvLVaFHTO-qb"
-      },
-      "source": [
-        "The DocumentStore is now ready. Now it's time to fill it with some Documents."
-      ]
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "/usr/local/lib/python3.12/dist-packages/huggingface_hub/utils/_auth.py:94: UserWarning: \n",
+      "The secret `HF_TOKEN` does not exist in your Colab secrets.\n",
+      "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n",
+      "You will be able to reuse this secret in all of your notebooks.\n",
+      "Please note that authentication is recommended but still optional to access public models or datasets.\n",
+      "  warnings.warn(\n"
+     ]
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "HryYZP9ZO-qb"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b22af125522742d4a83e95890e582058",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "### Fetch the Data\n",
-        "\n",
-        "You'll use the Wikipedia pages of [Seven Wonders of the Ancient World](https://en.wikipedia.org/wiki/Wonders_of_the_World) as Documents. We preprocessed the data and uploaded it to Hugging Face as the [Seven Wonders](https://huggingface.co/datasets/bilgeyucel/seven-wonders) dataset. Thus, you don't need to perform any additional cleaning or splitting.\n",
-        "\n",
-        "Fetch the data and convert it into Haystack Documents:"
+      "text/plain": [
+       "README.md:   0%|          | 0.00/46.0 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": 3,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/",
-          "height": 256,
-          "referenced_widgets": [
-            "b22af125522742d4a83e95890e582058",
-            "bab24f7e38c54ecca22a5551bc708a8e",
-            "879852bee39a471f86528f0f8afe58f7",
-            "31249898b08240df919cbd951bed2ccd",
-            "8652edf5598542b990aa91472e6d698f",
-            "2690be8f1f744602b9b393e6438fd559",
-            "1fa0537a43e04678880a1d063e4100be",
-            "d8dee92388ae4ddcb1639ae0625d7136",
-            "5b690d1088194714b83d401b7667bdd2",
-            "3137d503b8d34f56ab5c458018d0f575",
-            "5497fb84edbd4332adbff6de18a33015",
-            "c3fca5ba78d2467da72fb1abd0b01ec3",
-            "9f84829b414345a29d5acaf0c0d99bd5",
-            "7ef46645be63425f857db5349da4a3a9",
-            "45aa957278ce483e9ddf1aa3932e8789",
-            "8519f294cae34825afdd69bd03229db3",
-            "cb78d35eb8e741c1b30b33bb42d04621",
-            "6886a8c59b6c4ea693d511b874c12c51",
-            "be5d50edbf2449a59508feab6d3da98c",
-            "9a2686b5238d412a8df69f996429c9b2",
-            "6d4989d458d9420491ea50c2e8923597",
-            "a7adbec1f16f4e39b4aa27373993f532",
-            "041e6870096b4f8e95a10274524065ab",
-            "54169d1347cd41b7845616a98a3b38e8",
-            "db436133e86f425cad8c5cc28eea6c03",
-            "bb419307a3e547ea8455e89d70390c42",
-            "9aab6009b2544ce5994e4e26c9182e36",
-            "2a4c9085eb2348c6a4da76679b390d1f",
-            "d6c7c125d594416b92376b4417246af1",
-            "889f5a03fac949ebbfeb4e840dcb57d3",
-            "5f548252e5b845f9bb54dc7820a8835a",
-            "01707d970b6443c9bc0ea9602b0b1f5e",
-            "70d9add61b3e4c26a278b482a1380e26"
-          ]
-        },
-        "id": "INdC3WvLO-qb",
-        "outputId": "d1515765-20ea-44db-c8a8-a68776fafdab"
-      },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "/usr/local/lib/python3.12/dist-packages/huggingface_hub/utils/_auth.py:94: UserWarning: \n",
-            "The secret `HF_TOKEN` does not exist in your Colab secrets.\n",
-            "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n",
-            "You will be able to reuse this secret in all of your notebooks.\n",
-            "Please note that authentication is recommended but still optional to access public models or datasets.\n",
-            "  warnings.warn(\n"
-          ]
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "b22af125522742d4a83e95890e582058",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "README.md:   0%|          | 0.00/46.0 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "Warning: You are sending unauthenticated requests to the HF Hub. Please set a HF_TOKEN to enable higher rate limits and faster downloads.\n",
-            "WARNING:huggingface_hub.utils._http:Warning: You are sending unauthenticated requests to the HF Hub. Please set a HF_TOKEN to enable higher rate limits and faster downloads.\n"
-          ]
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "c3fca5ba78d2467da72fb1abd0b01ec3",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "data/train-00000-of-00001-4077bd623d5510(…):   0%|          | 0.00/119k [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "041e6870096b4f8e95a10274524065ab",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "Generating train split:   0%|          | 0/151 [00:00<?, ? examples/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        }
-      ],
-      "source": [
-        "from datasets import load_dataset\n",
-        "from haystack import Document\n",
-        "\n",
-        "dataset = load_dataset(\"bilgeyucel/seven-wonders\", split=\"train\")\n",
-        "docs = [Document(content=doc[\"content\"], meta=doc[\"meta\"]) for doc in dataset]"
-      ]
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Warning: You are sending unauthenticated requests to the HF Hub. Please set a HF_TOKEN to enable higher rate limits and faster downloads.\n",
+      "WARNING:huggingface_hub.utils._http:Warning: You are sending unauthenticated requests to the HF Hub. Please set a HF_TOKEN to enable higher rate limits and faster downloads.\n"
+     ]
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "czMjWwnxPA-3"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c3fca5ba78d2467da72fb1abd0b01ec3",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "### Initialize a Document Embedder\n",
-        "\n",
-        "To store your data in the DocumentStore with embeddings, initialize a [SentenceTransformersDocumentEmbedder](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder) with the model name.\n",
-        "\n",
-        "> If you'd like, you can use a different [Embedder](https://docs.haystack.deepset.ai/docs/embedders) for your documents."
+      "text/plain": [
+       "data/train-00000-of-00001-4077bd623d5510(…):   0%|          | 0.00/119k [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": 4,
-      "metadata": {
-        "id": "EUmAH9sEn3R7"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "041e6870096b4f8e95a10274524065ab",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "outputs": [],
-      "source": [
-        "from haystack.components.embedders import SentenceTransformersDocumentEmbedder\n",
-        "\n",
-        "doc_embedder = SentenceTransformersDocumentEmbedder(model=\"sentence-transformers/all-MiniLM-L6-v2\")"
+      "text/plain": [
+       "Generating train split:   0%|          | 0/151 [00:00<?, ? examples/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "from datasets import load_dataset\n",
+    "from haystack import Document\n",
+    "\n",
+    "dataset = load_dataset(\"bilgeyucel/seven-wonders\", split=\"train\")\n",
+    "docs = [Document(content=doc[\"content\"], meta=doc[\"meta\"]) for doc in dataset]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "czMjWwnxPA-3"
+   },
+   "source": [
+    "### Initialize a Document Embedder\n",
+    "\n",
+    "To store your data in the DocumentStore with embeddings, initialize a [SentenceTransformersDocumentEmbedder](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder) with the model name.\n",
+    "\n",
+    "> If you'd like, you can use a different [Embedder](https://docs.haystack.deepset.ai/docs/embedders) for your documents."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "id": "EUmAH9sEn3R7"
+   },
+   "outputs": [],
+   "source": [
+    "from haystack.components.embedders import SentenceTransformersDocumentEmbedder\n",
+    "\n",
+    "doc_embedder = SentenceTransformersDocumentEmbedder(model=\"sentence-transformers/all-MiniLM-L6-v2\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "9y4iJE_SrS4K"
+   },
+   "source": [
+    "### Write Documents to the DocumentStore\n",
+    "\n",
+    "Run the `doc_embedder` with the Documents. The embedder will create embeddings for each document and store them in that document's `embedding` field. Then, write the Documents to the DocumentStore with the `write_documents()` method."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/",
+     "height": 576,
+     "referenced_widgets": [
+      "2cc35d93724b4e0f9608fe6999e96baa",
+      "769840529f8e48378f568109e008dda7",
+      "5e34616bda1840db92c9afdbcc17b090",
+      "74296c48c5204c26a186d5e6fe2eb389",
+      "6ab0bef578534eb3b326ce3f1c7952cb",
+      "821e521c20eb4952a9f553be1707fe4d",
+      "b627994ed6fb4e419d0d7b042a2d1845",
+      "430c4f94f9704dceb7657fdf54e4e979",
+      "b9f80e63f9f4477e815fb6741e0b7481",
+      "1bb5874fc5424756839b3119ee88c652",
+      "adf3861551a74ac2bfd622fe9a4dd8c4",
+      "f0ab87c57a644c8693e51d2f04a666f3",
+      "9acd8a5fa709457eb1627bdafed3dc90",
+      "a99f41226d8c48978417e050c447cf06",
+      "fa24a76d328e47eeac0c12fc4a50bcd7",
+      "a3cd8b42b2884452b82f56e81b9f23fa",
+      "f4a53626b22f458ab46e2bf3ce91cf1f",
+      "9f2586e4929e47ea8e3ce7788b9d6a09",
+      "0b3d4bc9fc8e4f7d96a04b9728d966c0",
+      "00be43d5e49d4d288757d8c3b4566262",
+      "851f2132407f4602bdb482e09aff7864",
+      "0a73b3d5dd7e4658ac146786039c005c",
+      "efe7818df31b4b4fb4ac23447133add1",
+      "d2b362efd0ad499193b03da90419ee41",
+      "31f44064c8b64cfcb8a305e111c8465a",
+      "77eb3fe2195b43d8aa622f23d009dfd6",
+      "3bc2a31d2fbb4f548c7a7fbbecb4de56",
+      "32bf3855ebea499c97baa448b4d721d5",
+      "3fa909ce952b471e9883a4c32586e111",
+      "23e319859ad64a389e141e6ec6175cb5",
+      "17d53e1b04ba4196b2d0d9ffd8a6fa29",
+      "92248f3c7de0496c8ca16a26f528ab5e",
+      "9fe390e03164438a855d4c041a3e3435",
+      "be6e75733aa44951a9a2f1e76b3d1627",
+      "9e58a463153b4aadac2b54ffac39c0b4",
+      "72f7dd0ba5ce45359b9ed35563b59aee",
+      "75986772e38e4dbea85249f34f52178e",
+      "894070da75a948e8af880e57898e5cb8",
+      "4c903df362c840b5a887a549e86ac62f",
+      "42166f3fba3b400c858d1e10feb4c751",
+      "65deef2a69ee47a698b3b6f3e4a6bce6",
+      "4fd6a3cecf47491bad25a58f563c4a15",
+      "11053c79eb414fc4976cef3966a7fac1",
+      "7f5cbe293ec2416f80c97c91fce7df1e",
+      "132784a9e3d74220abf9748a4d17ca89",
+      "39e35e2d422245ce833481b43416441e",
+      "b38ec117ee1741148e3d5e79167e74fe",
+      "d02863cda9c44772a165b7be9bd2fea9",
+      "41e2ffb4d7a645d5bb5ec794ee21cf86",
+      "a6c11c68ab754703b2c1c8f6816bb96a",
+      "25666b5ff5604b8ba366a529c5025230",
+      "0b4eb164565445b28828357715ef329b",
+      "4d865aefb4ab48448fcf458ad256ca20",
+      "b47bd72419e041ce8cdcc43d263a6686",
+      "f37aad71e98948e480718fa4e3f70217",
+      "7b2b5ad63a0b4775bbb652453c179d19",
+      "252525f805004deca52a9a94f9eae057",
+      "d8d01da923864706b8331af4f361b047",
+      "51770f17bef74ff59a1993abeb82de5f",
+      "bb2fbfbc2dc34f5d87c03e46f551ea98",
+      "836d16710f9e4edbbf6b1233af637928",
+      "35da2a2f76664857b9390b1d80c2ecd2",
+      "9d53c7d71c9e400399cf37b2f37c91af",
+      "2fae67ce866a4e8cb125f8395d96d896",
+      "4813b61b1f1c4adba5b9fe214459cac9",
+      "b47368b719da42aaad46070cf40a7a00",
+      "65d85c964cfb46dab8b9ea69c9506ada",
+      "5589e6aa47c541ce889beda46435a9c7",
+      "4694f52453794bb4b873de48ab7c6b3c",
+      "557161a5e01a40e390c86f344089fc60",
+      "a8185ea16ee54420a17c1cca14468b7c",
+      "86f2d32941e845088ceade417b76424a",
+      "bece87ceb6b04dacb8f01347a9d5bb7d",
+      "02ab1ee2008f4008b5f19346005ce6f7",
+      "73b9187ac82b4adb8117f90fb231434d",
+      "87cd40c733e44790bfa102607827596f",
+      "62431513a3b643839dcd0076b2ed1a9f",
+      "98895c06137b4d80b5451f56f06324a4",
+      "bedd40889bf6433f932729d5db0539f0",
+      "2812a84fd4e14914a93f37a32c7430db",
+      "9003b727e1f64fe19386a725d8a344fa",
+      "952bafd6d58144b28bc2c4ad66ed4f8b",
+      "b21cbd6d566d4ef293ab98e51a1033f1",
+      "17d2ae89093f4d2f9962ffa654ddcbad",
+      "9d9ab19f4caf487694d6483f234aabb7",
+      "5f52c41b56774eefac83864f42dabe28",
+      "4884f6f41f4045b5ba0239898fee50c6",
+      "ff77c736962b458c9341a947cd00a7f3",
+      "8c9072b8a35849cfbda6f5eb9179f528",
+      "7efffcc4356344228af97bb22065c750",
+      "1bc3fd2803e644e284752fb42a92bfc5",
+      "8d9c6c7014a24d719d36210cdb04b89a",
+      "f0312ab0e54c4395ab3b24deaf6ac930",
+      "94bcce13ca63491895532a8b03fbdc50",
+      "29f6e78fa0d64bee95316178f2af26b4",
+      "5ca4298d4a8d41d7ab357ab0d6c41607",
+      "69bb8165fe03447cac2409e52dfb6fba",
+      "b4f131eac5d145ac99773413639efd30",
+      "21c0e13bf8814bf8a7698831a81f40ce",
+      "6ad2981514934ba3a99d9af804b71b83",
+      "8aa676e6e41e4cb68f08b7b6fff394b8",
+      "69b1631b328e408e846e545accda625c",
+      "db375dcc92b04b64a3ece532b7058590",
+      "90fe90981b814463a2106ad7ab9d268e",
+      "ab355a59d76a46f695b4f40132aab760",
+      "7df0ad47f4624fb3a61cff463428e2f5",
+      "5ae61ea745fd4728ac38282300dde003",
+      "f2a66c6cda7346e4b5f1e0b535ebaca1",
+      "a24d5e98caa24cf39fb422dff93c7eca",
+      "8de77145f60b4271b5357abe6a145675",
+      "ba3552f1892e4334a82d7ff298cd3b5b",
+      "b733682eb42347f5906cc121927916e1",
+      "e4cd66a09968401ab56ad2951d4b26d1",
+      "8d1d910a9a1c46fa988835118b626691",
+      "a9ee6367c48540678a00d16948920aad",
+      "7975972153144d30b42aacace4e83274",
+      "2cb85592bf97403fbad9bb8c519cd8bf",
+      "f95a49beeb19460b94e318841aab492f",
+      "0ff989201f644a51adb95470a9292c66",
+      "70390c6a974a4fc583ca457e22140d9f",
+      "babcacf75255494f877706da78a2f6b4",
+      "962f0a845a8141fb9a616a548cf586ae",
+      "4614a496a0e742a1b7012bc5eaf3c846",
+      "be0724b67e1140b292ff67811ecae2e3",
+      "f62e6725df84439c85114851b3bac16b",
+      "85f395657239437bb8714f4cc31e0b47",
+      "f16162d038144049a87d95909db044fe",
+      "78ceb340847a4c10ba8e016746024af8",
+      "b1e5b5b6a98b4c29b6be1a646ff62c7c",
+      "80787ac2994845788981beff20ace5d4",
+      "c848ed8b46d546cfbc8a5a7e92e4ae44",
+      "9bb104726b3449cca9b3a4a5d60ff4eb",
+      "347ff1dbd39d441eb77d5cef02415a5e",
+      "c890c36976494af2b1a161306981b67c",
+      "cbfa575577d5449b8b23dd4a8600c982",
+      "dd686226092a4ebda728440cd72ef649",
+      "08408d415bac43bb82180aeb65e11592",
+      "507b6215a4d04df4ae38250d0ded7ba7",
+      "496aacba74bd42e983ffa1ba00d1c7e2",
+      "00b905e9cfa049f8bc32cb7166489f82",
+      "20cf7cbc45b345e599dc61c80fef33d6",
+      "47e583b278674aa38fc7883c10b44a20",
+      "a0294366add94b328970d7e7b20844d7"
+     ]
     },
+    "id": "ETpQKftLplqh",
+    "outputId": "2b73c450-364e-4483-80b1-449dccff6e6c"
+   },
+   "outputs": [
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "9y4iJE_SrS4K"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "2cc35d93724b4e0f9608fe6999e96baa",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "### Write Documents to the DocumentStore\n",
-        "\n",
-        "Run the `doc_embedder` with the Documents. The embedder will create embeddings for each document and store them in that document's `embedding` field. Then, write the Documents to the DocumentStore with the `write_documents()` method."
+      "text/plain": [
+       "modules.json:   0%|          | 0.00/349 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": 5,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/",
-          "height": 576,
-          "referenced_widgets": [
-            "2cc35d93724b4e0f9608fe6999e96baa",
-            "769840529f8e48378f568109e008dda7",
-            "5e34616bda1840db92c9afdbcc17b090",
-            "74296c48c5204c26a186d5e6fe2eb389",
-            "6ab0bef578534eb3b326ce3f1c7952cb",
-            "821e521c20eb4952a9f553be1707fe4d",
-            "b627994ed6fb4e419d0d7b042a2d1845",
-            "430c4f94f9704dceb7657fdf54e4e979",
-            "b9f80e63f9f4477e815fb6741e0b7481",
-            "1bb5874fc5424756839b3119ee88c652",
-            "adf3861551a74ac2bfd622fe9a4dd8c4",
-            "f0ab87c57a644c8693e51d2f04a666f3",
-            "9acd8a5fa709457eb1627bdafed3dc90",
-            "a99f41226d8c48978417e050c447cf06",
-            "fa24a76d328e47eeac0c12fc4a50bcd7",
-            "a3cd8b42b2884452b82f56e81b9f23fa",
-            "f4a53626b22f458ab46e2bf3ce91cf1f",
-            "9f2586e4929e47ea8e3ce7788b9d6a09",
-            "0b3d4bc9fc8e4f7d96a04b9728d966c0",
-            "00be43d5e49d4d288757d8c3b4566262",
-            "851f2132407f4602bdb482e09aff7864",
-            "0a73b3d5dd7e4658ac146786039c005c",
-            "efe7818df31b4b4fb4ac23447133add1",
-            "d2b362efd0ad499193b03da90419ee41",
-            "31f44064c8b64cfcb8a305e111c8465a",
-            "77eb3fe2195b43d8aa622f23d009dfd6",
-            "3bc2a31d2fbb4f548c7a7fbbecb4de56",
-            "32bf3855ebea499c97baa448b4d721d5",
-            "3fa909ce952b471e9883a4c32586e111",
-            "23e319859ad64a389e141e6ec6175cb5",
-            "17d53e1b04ba4196b2d0d9ffd8a6fa29",
-            "92248f3c7de0496c8ca16a26f528ab5e",
-            "9fe390e03164438a855d4c041a3e3435",
-            "be6e75733aa44951a9a2f1e76b3d1627",
-            "9e58a463153b4aadac2b54ffac39c0b4",
-            "72f7dd0ba5ce45359b9ed35563b59aee",
-            "75986772e38e4dbea85249f34f52178e",
-            "894070da75a948e8af880e57898e5cb8",
-            "4c903df362c840b5a887a549e86ac62f",
-            "42166f3fba3b400c858d1e10feb4c751",
-            "65deef2a69ee47a698b3b6f3e4a6bce6",
-            "4fd6a3cecf47491bad25a58f563c4a15",
-            "11053c79eb414fc4976cef3966a7fac1",
-            "7f5cbe293ec2416f80c97c91fce7df1e",
-            "132784a9e3d74220abf9748a4d17ca89",
-            "39e35e2d422245ce833481b43416441e",
-            "b38ec117ee1741148e3d5e79167e74fe",
-            "d02863cda9c44772a165b7be9bd2fea9",
-            "41e2ffb4d7a645d5bb5ec794ee21cf86",
-            "a6c11c68ab754703b2c1c8f6816bb96a",
-            "25666b5ff5604b8ba366a529c5025230",
-            "0b4eb164565445b28828357715ef329b",
-            "4d865aefb4ab48448fcf458ad256ca20",
-            "b47bd72419e041ce8cdcc43d263a6686",
-            "f37aad71e98948e480718fa4e3f70217",
-            "7b2b5ad63a0b4775bbb652453c179d19",
-            "252525f805004deca52a9a94f9eae057",
-            "d8d01da923864706b8331af4f361b047",
-            "51770f17bef74ff59a1993abeb82de5f",
-            "bb2fbfbc2dc34f5d87c03e46f551ea98",
-            "836d16710f9e4edbbf6b1233af637928",
-            "35da2a2f76664857b9390b1d80c2ecd2",
-            "9d53c7d71c9e400399cf37b2f37c91af",
-            "2fae67ce866a4e8cb125f8395d96d896",
-            "4813b61b1f1c4adba5b9fe214459cac9",
-            "b47368b719da42aaad46070cf40a7a00",
-            "65d85c964cfb46dab8b9ea69c9506ada",
-            "5589e6aa47c541ce889beda46435a9c7",
-            "4694f52453794bb4b873de48ab7c6b3c",
-            "557161a5e01a40e390c86f344089fc60",
-            "a8185ea16ee54420a17c1cca14468b7c",
-            "86f2d32941e845088ceade417b76424a",
-            "bece87ceb6b04dacb8f01347a9d5bb7d",
-            "02ab1ee2008f4008b5f19346005ce6f7",
-            "73b9187ac82b4adb8117f90fb231434d",
-            "87cd40c733e44790bfa102607827596f",
-            "62431513a3b643839dcd0076b2ed1a9f",
-            "98895c06137b4d80b5451f56f06324a4",
-            "bedd40889bf6433f932729d5db0539f0",
-            "2812a84fd4e14914a93f37a32c7430db",
-            "9003b727e1f64fe19386a725d8a344fa",
-            "952bafd6d58144b28bc2c4ad66ed4f8b",
-            "b21cbd6d566d4ef293ab98e51a1033f1",
-            "17d2ae89093f4d2f9962ffa654ddcbad",
-            "9d9ab19f4caf487694d6483f234aabb7",
-            "5f52c41b56774eefac83864f42dabe28",
-            "4884f6f41f4045b5ba0239898fee50c6",
-            "ff77c736962b458c9341a947cd00a7f3",
-            "8c9072b8a35849cfbda6f5eb9179f528",
-            "7efffcc4356344228af97bb22065c750",
-            "1bc3fd2803e644e284752fb42a92bfc5",
-            "8d9c6c7014a24d719d36210cdb04b89a",
-            "f0312ab0e54c4395ab3b24deaf6ac930",
-            "94bcce13ca63491895532a8b03fbdc50",
-            "29f6e78fa0d64bee95316178f2af26b4",
-            "5ca4298d4a8d41d7ab357ab0d6c41607",
-            "69bb8165fe03447cac2409e52dfb6fba",
-            "b4f131eac5d145ac99773413639efd30",
-            "21c0e13bf8814bf8a7698831a81f40ce",
-            "6ad2981514934ba3a99d9af804b71b83",
-            "8aa676e6e41e4cb68f08b7b6fff394b8",
-            "69b1631b328e408e846e545accda625c",
-            "db375dcc92b04b64a3ece532b7058590",
-            "90fe90981b814463a2106ad7ab9d268e",
-            "ab355a59d76a46f695b4f40132aab760",
-            "7df0ad47f4624fb3a61cff463428e2f5",
-            "5ae61ea745fd4728ac38282300dde003",
-            "f2a66c6cda7346e4b5f1e0b535ebaca1",
-            "a24d5e98caa24cf39fb422dff93c7eca",
-            "8de77145f60b4271b5357abe6a145675",
-            "ba3552f1892e4334a82d7ff298cd3b5b",
-            "b733682eb42347f5906cc121927916e1",
-            "e4cd66a09968401ab56ad2951d4b26d1",
-            "8d1d910a9a1c46fa988835118b626691",
-            "a9ee6367c48540678a00d16948920aad",
-            "7975972153144d30b42aacace4e83274",
-            "2cb85592bf97403fbad9bb8c519cd8bf",
-            "f95a49beeb19460b94e318841aab492f",
-            "0ff989201f644a51adb95470a9292c66",
-            "70390c6a974a4fc583ca457e22140d9f",
-            "babcacf75255494f877706da78a2f6b4",
-            "962f0a845a8141fb9a616a548cf586ae",
-            "4614a496a0e742a1b7012bc5eaf3c846",
-            "be0724b67e1140b292ff67811ecae2e3",
-            "f62e6725df84439c85114851b3bac16b",
-            "85f395657239437bb8714f4cc31e0b47",
-            "f16162d038144049a87d95909db044fe",
-            "78ceb340847a4c10ba8e016746024af8",
-            "b1e5b5b6a98b4c29b6be1a646ff62c7c",
-            "80787ac2994845788981beff20ace5d4",
-            "c848ed8b46d546cfbc8a5a7e92e4ae44",
-            "9bb104726b3449cca9b3a4a5d60ff4eb",
-            "347ff1dbd39d441eb77d5cef02415a5e",
-            "c890c36976494af2b1a161306981b67c",
-            "cbfa575577d5449b8b23dd4a8600c982",
-            "dd686226092a4ebda728440cd72ef649",
-            "08408d415bac43bb82180aeb65e11592",
-            "507b6215a4d04df4ae38250d0ded7ba7",
-            "496aacba74bd42e983ffa1ba00d1c7e2",
-            "00b905e9cfa049f8bc32cb7166489f82",
-            "20cf7cbc45b345e599dc61c80fef33d6",
-            "47e583b278674aa38fc7883c10b44a20",
-            "a0294366add94b328970d7e7b20844d7"
-          ]
-        },
-        "id": "ETpQKftLplqh",
-        "outputId": "2b73c450-364e-4483-80b1-449dccff6e6c"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f0ab87c57a644c8693e51d2f04a666f3",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "outputs": [
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "2cc35d93724b4e0f9608fe6999e96baa",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "modules.json:   0%|          | 0.00/349 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "f0ab87c57a644c8693e51d2f04a666f3",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "config_sentence_transformers.json:   0%|          | 0.00/116 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "efe7818df31b4b4fb4ac23447133add1",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "README.md: 0.00B [00:00, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "be6e75733aa44951a9a2f1e76b3d1627",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "sentence_bert_config.json:   0%|          | 0.00/53.0 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "132784a9e3d74220abf9748a4d17ca89",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "config.json:   0%|          | 0.00/612 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "7b2b5ad63a0b4775bbb652453c179d19",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "model.safetensors:   0%|          | 0.00/90.9M [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "65d85c964cfb46dab8b9ea69c9506ada",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "Loading weights:   0%|          | 0/103 [00:00<?, ?it/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "BertModel LOAD REPORT from: sentence-transformers/all-MiniLM-L6-v2\n",
-            "Key                     | Status     |  | \n",
-            "------------------------+------------+--+-\n",
-            "embeddings.position_ids | UNEXPECTED |  | \n",
-            "\n",
-            "Notes:\n",
-            "- UNEXPECTED\t:can be ignored when loading from different task/architecture; not ok if you expect identical arch.\n"
-          ]
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "98895c06137b4d80b5451f56f06324a4",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "tokenizer_config.json:   0%|          | 0.00/350 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "8c9072b8a35849cfbda6f5eb9179f528",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "vocab.txt: 0.00B [00:00, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "6ad2981514934ba3a99d9af804b71b83",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "tokenizer.json: 0.00B [00:00, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "ba3552f1892e4334a82d7ff298cd3b5b",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "special_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "962f0a845a8141fb9a616a548cf586ae",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "config.json:   0%|          | 0.00/190 [00:00<?, ?B/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "347ff1dbd39d441eb77d5cef02415a5e",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "Batches:   0%|          | 0/5 [00:00<?, ?it/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "data": {
-            "text/plain": [
-              "151"
-            ]
-          },
-          "execution_count": null,
-          "metadata": {},
-          "output_type": "execute_result"
-        }
-      ],
-      "source": [
-        "docs_with_embeddings = doc_embedder.run(docs)\n",
-        "document_store.write_documents(docs_with_embeddings[\"documents\"])"
+      "text/plain": [
+       "config_sentence_transformers.json:   0%|          | 0.00/116 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "IdojTxg6uubn"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "efe7818df31b4b4fb4ac23447133add1",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "## Building the RAG Pipeline\n",
-        "\n",
-        "The next step is to build a [Pipeline](https://docs.haystack.deepset.ai/docs/pipelines) to generate answers for the user query following the RAG approach. To create the pipeline, you first need to initialize each component, add them to your pipeline, and connect them."
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "0uyV6-u-u56P"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "be6e75733aa44951a9a2f1e76b3d1627",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "### Initialize a Text Embedder\n",
-        "\n",
-        "Initialize a text embedder to create an embedding for the user query. The created embedding will later be used by the Retriever to retrieve relevant documents from the DocumentStore.\n",
-        "\n",
-        "> ⚠️ Notice that you used `sentence-transformers/all-MiniLM-L6-v2` model to create embeddings for your documents before. This is why you need to use the same model to embed the user queries."
+      "text/plain": [
+       "sentence_bert_config.json:   0%|          | 0.00/53.0 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": 6,
-      "metadata": {
-        "id": "LyJY2yW628dl"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "132784a9e3d74220abf9748a4d17ca89",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "outputs": [],
-      "source": [
-        "from haystack.components.embedders import SentenceTransformersTextEmbedder\n",
-        "\n",
-        "text_embedder = SentenceTransformersTextEmbedder(model=\"sentence-transformers/all-MiniLM-L6-v2\")"
+      "text/plain": [
+       "config.json:   0%|          | 0.00/612 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "0_cj-5m-O-qb"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7b2b5ad63a0b4775bbb652453c179d19",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "### Initialize the Retriever\n",
-        "\n",
-        "Initialize an [InMemoryEmbeddingRetriever](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever) and make it use the `InMemoryDocumentStore` you initialized earlier in this tutorial. This Retriever will fetch the documents most relevant to the query."
+      "text/plain": [
+       "model.safetensors:   0%|          | 0.00/90.9M [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": 7,
-      "metadata": {
-        "id": "-uo-6fjiO-qb"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "65d85c964cfb46dab8b9ea69c9506ada",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "outputs": [],
-      "source": [
-        "from haystack.components.retrievers.in_memory import InMemoryEmbeddingRetriever\n",
-        "\n",
-        "retriever = InMemoryEmbeddingRetriever(document_store)"
+      "text/plain": [
+       "Loading weights:   0%|          | 0/103 [00:00<?, ?it/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "6CEuQpB7O-qb"
-      },
-      "source": [
-        "### Define a Template Prompt\n",
-        "\n",
-        "Create a [ChatMessage](https://docs.haystack.deepset.ai/docs/chatmessage) object with the `from_user` method and pass the custom prompt for a question answering task using the RAG approach. The prompt should take in two parameters: `documents`, which are retrieved from a document store, and a `question` from the user. Use the Jinja2 looping syntax to combine the content of the retrieved documents in the prompt.\n",
-        "\n",
-        "Next, initialize a [ChatPromptBuilder](https://docs.haystack.deepset.ai/docs/chatpromptbuilder) instance with your prompt template. The `ChatPromptBuilder`, when given the necessary values, will automatically fill in the variable values and generate a complete prompt. This approach allows for a more tailored and effective question-answering experience.\n",
-        "\n",
-        "> By default, all prompt variables are treated as optional. Set `required_variables=\"*\"` to ensure that all prompt variables are mandatory for the prompt."
-      ]
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "BertModel LOAD REPORT from: sentence-transformers/all-MiniLM-L6-v2\n",
+      "Key                     | Status     |  | \n",
+      "------------------------+------------+--+-\n",
+      "embeddings.position_ids | UNEXPECTED |  | \n",
+      "\n",
+      "Notes:\n",
+      "- UNEXPECTED\t:can be ignored when loading from different task/architecture; not ok if you expect identical arch.\n"
+     ]
     },
     {
-      "cell_type": "code",
-      "execution_count": 10,
-      "metadata": {
-        "id": "ObahTh45FqOT"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "98895c06137b4d80b5451f56f06324a4",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "outputs": [],
-      "source": [
-        "from haystack.components.builders import ChatPromptBuilder\n",
-        "from haystack.dataclasses import ChatMessage\n",
-        "\n",
-        "template = [\n",
-        "    ChatMessage.from_user(\n",
-        "        \"\"\"\n",
-        "Given the following information, answer the question.\n",
-        "\n",
-        "Context:\n",
-        "{% for document in documents %}\n",
-        "    {{ document.content }}\n",
-        "{% endfor %}\n",
-        "\n",
-        "Question: {{question}}\n",
-        "Answer:\n",
-        "\"\"\"\n",
-        "    )\n",
-        "]\n",
-        "\n",
-        "prompt_builder = ChatPromptBuilder(template=template, required_variables=\"*\")"
+      "text/plain": [
+       "tokenizer_config.json:   0%|          | 0.00/350 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "HR14lbfcFtXj"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "8c9072b8a35849cfbda6f5eb9179f528",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "### Initialize a ChatGenerator\n",
-        "\n",
-        "[ChatGenerators](https://docs.haystack.deepset.ai/docs/generators) are the components that call large language models (LLMs) and return chat completions.\n",
-        "\n",
-        "**Before you run the pipeline, decide how you will access the LLM:**\n",
-        "\n",
-        "- **Hosted provider API** — Create an API key with a provider. In Colab, you can store it under *Secrets* tab or set the matching environment variable (`OPENAI_API_KEY`, `MISTRAL_API_KEY`, …). The cells below prompt for a key if it is not already set.\n",
-        "- **Local or self-hosted (including on Colab)** — If you prefer not to use a remote API, you can run an open-weight model on your machine or the Colab runtime with [`HuggingFaceLocalChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfacelocalchatgenerator). See the [generators documentation](https://docs.haystack.deepset.ai/docs/generators) for more integrations.\n",
-        "\n",
-        "The next three sections show **OpenAI**, **Mistral**, and **Hugging Face** as examples. Run **only one** of them to define `chat_generator`."
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {},
-      "source": [
-        "**Use open-weight models from Hugging Face (no API key required for local inference)**\n",
-        "\n",
-        "Initialize `HuggingFaceLocalChatGenerator` with an open-weight LLM from Hugging Face, such as [Qwen/Qwen3-4B-Instruct-2507](https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507). To call models through the **Hugging Face Inference API** instead, use [`HuggingFaceAPIChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfaceapichatgenerator), which requires a Hugging Face API token."
+      "text/plain": [
+       "vocab.txt: 0.00B [00:00, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {},
-      "outputs": [],
-      "source": [
-        "from haystack.components.generators.chat import HuggingFaceLocalChatGenerator\n",
-        "\n",
-        "chat_generator = HuggingFaceLocalChatGenerator(model=\"Qwen/Qwen3-4B-Instruct-2507\")"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {},
-      "source": [
-        "**Use OpenAI's GPT models (requires an API key)**\n",
-        "\n",
-        "[Get an OpenAI API key](https://platform.openai.com/api-keys) and set it as the `OPENAI_API_KEY` environment variable. Then initialize `OpenAIChatGenerator` with the model name you want to use. "
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "id": "SavE_FAqfApo"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "6ad2981514934ba3a99d9af804b71b83",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "outputs": [],
-      "source": [
-        "import os\n",
-        "from getpass import getpass\n",
-        "from haystack.components.generators.chat import OpenAIChatGenerator\n",
-        "\n",
-        "if \"OPENAI_API_KEY\" not in os.environ:\n",
-        "    os.environ[\"OPENAI_API_KEY\"] = getpass(\"Enter OpenAI API key:\")\n",
-        "    \n",
-        "chat_generator = OpenAIChatGenerator(model=\"gpt-4o-mini\")"
+      "text/plain": [
+       "tokenizer.json: 0.00B [00:00, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {},
-      "source": [
-        "**Use Mistral models (requires a free API key)**\n",
-        "\n",
-        "[Get a Mistral API key](https://docs.mistral.ai/) (free tier available) and set it as the `MISTRAL_API_KEY` environment variable. Then initialize `MistralChatGenerator` with the model name you want to use. "
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "0-zl-0WsZI7T",
-        "outputId": "dffb77e3-8c03-4fc2-d038-692e1d3cc2e7"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ba3552f1892e4334a82d7ff298cd3b5b",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "Enter Mistral API key:··········\n"
-          ]
-        }
-      ],
-      "source": [
-        "import os\n",
-        "from getpass import getpass\n",
-        "from haystack_integrations.components.generators.mistral import MistralChatGenerator\n",
-        "\n",
-        "if \"MISTRAL_API_KEY\" not in os.environ:\n",
-        "  os.environ[\"MISTRAL_API_KEY\"] = getpass(\"Enter Mistral API key:\")\n",
-        "  \n",
-        "chat_generator = MistralChatGenerator(model=\"mistral-small-latest\")"
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "nenbo2SvycHd"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "962f0a845a8141fb9a616a548cf586ae",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "> You can replace the examples above with any Haystack `ChatGenerator` that fits your setup: another API provider or a local / Colab-hosted backend. See the full list of chat generators [here](https://docs.haystack.deepset.ai/docs/generators)."
+      "text/plain": [
+       "config.json:   0%|          | 0.00/190 [00:00<?, ?B/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "1bfHwOQwycHe"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "347ff1dbd39d441eb77d5cef02415a5e",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "### Build the Pipeline\n",
-        "\n",
-        "To build a pipeline, add all components to your pipeline and connect them. Create connections from `text_embedder`'s \"embedding\" output to \"query_embedding\" input of `retriever`, from `retriever` to `prompt_builder` and from `prompt_builder` to `llm`. Explicitly connect the output of `retriever` with \"documents\" input of the `prompt_builder` to make the connection obvious as `prompt_builder` has two inputs (\"documents\" and \"question\").\n",
-        "\n",
-        "For more information on pipelines and creating connections, refer to [Creating Pipelines](https://docs.haystack.deepset.ai/docs/creating-pipelines) documentation."
+      "text/plain": [
+       "Batches:   0%|          | 0/5 [00:00<?, ?it/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": 14,
-      "metadata": {
-        "id": "f6NFmpjEO-qb"
-      },
-      "outputs": [],
-      "source": [
-        "from haystack import Pipeline\n",
-        "\n",
-        "basic_rag_pipeline = Pipeline()\n",
-        "# Add components to your pipeline\n",
-        "basic_rag_pipeline.add_component(\"text_embedder\", text_embedder)\n",
-        "basic_rag_pipeline.add_component(\"retriever\", retriever)\n",
-        "basic_rag_pipeline.add_component(\"prompt_builder\", prompt_builder)\n",
-        "basic_rag_pipeline.add_component(\"llm\", chat_generator)"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": 15,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "CyqzFsp1qWVM",
-        "outputId": "591f9e19-13d6-4232-f00a-d6becd89694b"
-      },
-      "outputs": [
-        {
-          "data": {
-            "text/plain": [
-              "<haystack.core.pipeline.pipeline.Pipeline object at 0x7a7fb2c19730>\n",
-              "🚅 Components\n",
-              "  - text_embedder: SentenceTransformersTextEmbedder\n",
-              "  - retriever: InMemoryEmbeddingRetriever\n",
-              "  - prompt_builder: ChatPromptBuilder\n",
-              "  - llm: MistralChatGenerator\n",
-              "🛤️ Connections\n",
-              "  - text_embedder.embedding -> retriever.query_embedding (list[float])\n",
-              "  - retriever.documents -> prompt_builder.documents (list[Document])\n",
-              "  - prompt_builder.prompt -> llm.messages (list[ChatMessage])"
-            ]
-          },
-          "execution_count": 15,
-          "metadata": {},
-          "output_type": "execute_result"
-        }
-      ],
-      "source": [
-        "# Now, connect the components to each other\n",
-        "basic_rag_pipeline.connect(\"text_embedder.embedding\", \"retriever.query_embedding\")\n",
-        "basic_rag_pipeline.connect(\"retriever\", \"prompt_builder\")\n",
-        "basic_rag_pipeline.connect(\"prompt_builder.prompt\", \"llm.messages\")"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "6NqyLhx7O-qc"
-      },
-      "source": [
-        "That's it! Your RAG pipeline is ready to generate answers to questions!"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "DBAyF5tVO-qc"
-      },
-      "source": [
-        "## Asking a Question\n",
-        "\n",
-        "When asking a question, use the `run()` method of the pipeline. Make sure to provide the question to both the `text_embedder` and the `prompt_builder`. This ensures that the `{{question}}` variable in the template prompt gets replaced with your specific question.\n",
-        "\n",
-        "> ⚠️ If you host the model on the Colab runtime (for example with HuggingFaceLocalChatGenerator), the first pipeline run can take longer as the LLM is loaded and prepared for inference."
+     "data": {
+      "text/plain": [
+       "151"
       ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "docs_with_embeddings = doc_embedder.run(docs)\n",
+    "document_store.write_documents(docs_with_embeddings[\"documents\"])"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "IdojTxg6uubn"
+   },
+   "source": [
+    "## Building the RAG Pipeline\n",
+    "\n",
+    "The next step is to build a [Pipeline](https://docs.haystack.deepset.ai/docs/pipelines) to generate answers for the user query following the RAG approach. To create the pipeline, you first need to initialize each component, add them to your pipeline, and connect them."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "0uyV6-u-u56P"
+   },
+   "source": [
+    "### Initialize a Text Embedder\n",
+    "\n",
+    "Initialize a text embedder to create an embedding for the user query. The created embedding will later be used by the Retriever to retrieve relevant documents from the DocumentStore.\n",
+    "\n",
+    "> ⚠️ Notice that you used the `sentence-transformers/all-MiniLM-L6-v2` model to create embeddings for your documents earlier. This is why you need to use the same model to embed the user queries."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "id": "LyJY2yW628dl"
+   },
+   "outputs": [],
+   "source": [
+    "from haystack.components.embedders import SentenceTransformersTextEmbedder\n",
+    "\n",
+    "text_embedder = SentenceTransformersTextEmbedder(model=\"sentence-transformers/all-MiniLM-L6-v2\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "0_cj-5m-O-qb"
+   },
+   "source": [
+    "### Initialize the Retriever\n",
+    "\n",
+    "Initialize an [InMemoryEmbeddingRetriever](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever) and make it use the `InMemoryDocumentStore` you initialized earlier in this tutorial. This Retriever will fetch the documents most relevant to the query."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {
+    "id": "-uo-6fjiO-qb"
+   },
+   "outputs": [],
+   "source": [
+    "from haystack.components.retrievers.in_memory import InMemoryEmbeddingRetriever\n",
+    "\n",
+    "retriever = InMemoryEmbeddingRetriever(document_store)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "6CEuQpB7O-qb"
+   },
+   "source": [
+    "### Define a Template Prompt\n",
+    "\n",
+    "Create a [ChatMessage](https://docs.haystack.deepset.ai/docs/chatmessage) object with the `from_user` method and pass the custom prompt for a question answering task using the RAG approach. The prompt should take in two parameters: `documents`, which are retrieved from a document store, and a `question` from the user. Use the Jinja2 looping syntax to combine the content of the retrieved documents in the prompt.\n",
+    "\n",
+    "Next, initialize a [ChatPromptBuilder](https://docs.haystack.deepset.ai/docs/chatpromptbuilder) instance with your prompt template. The `ChatPromptBuilder`, when given the necessary values, will automatically fill in the variable values and generate a complete prompt. This approach allows for a more tailored and effective question-answering experience.\n",
+    "\n",
+    "> By default, all prompt variables are treated as optional. Set `required_variables=\"*\"` to ensure that all prompt variables are mandatory for the prompt."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {
+    "id": "ObahTh45FqOT"
+   },
+   "outputs": [],
+   "source": [
+    "from haystack.components.builders import ChatPromptBuilder\n",
+    "from haystack.dataclasses import ChatMessage\n",
+    "\n",
+    "template = [\n",
+    "    ChatMessage.from_user(\n",
+    "        \"\"\"\n",
+    "Given the following information, answer the question.\n",
+    "\n",
+    "Context:\n",
+    "{% for document in documents %}\n",
+    "    {{ document.content }}\n",
+    "{% endfor %}\n",
+    "\n",
+    "Question: {{question}}\n",
+    "Answer:\n",
+    "\"\"\"\n",
+    "    )\n",
+    "]\n",
+    "\n",
+    "prompt_builder = ChatPromptBuilder(template=template, required_variables=\"*\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "HR14lbfcFtXj"
+   },
+   "source": "### Initialize a ChatGenerator\n\n[ChatGenerators](https://docs.haystack.deepset.ai/docs/generators) are the components that call large language models (LLMs) and return chat completions.\n\n**Before you run the pipeline, decide how you will access the LLM:**\n\n- **Hosted provider API** — Create an API key with a provider. In Colab, you can store it under the *Secrets* tab or set the matching environment variable (`OPENAI_API_KEY`, `MISTRAL_API_KEY`, …). The cells below prompt for a key if it is not already set.\n- **Local or self-hosted (including on Colab)** — If you prefer not to use a remote API, you can run an open-weight model on your machine or the Colab runtime with [`TransformersChatGenerator`](https://docs.haystack.deepset.ai/docs/transformerschatgenerator). See the [generators documentation](https://docs.haystack.deepset.ai/docs/generators) for more integrations.\n\nThe next three sections show **Hugging Face**, **OpenAI**, and **Mistral** as examples. Run **only one** of them to define `chat_generator`."
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": "**Use open-weight models from Hugging Face (no API key required for local inference)**\n\nInitialize `TransformersChatGenerator` with an open-weight LLM from Hugging Face, such as [Qwen/Qwen3-4B-Instruct-2507](https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507). `TransformersChatGenerator` is provided by the [`transformers-haystack`](https://haystack.deepset.ai/integrations/huggingface) integration. To call models through the **Hugging Face Inference API** instead, use [`HuggingFaceAPIChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfaceapichatgenerator), which requires a Hugging Face API token."
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": "from haystack_integrations.components.generators.transformers import TransformersChatGenerator\n\nchat_generator = TransformersChatGenerator(model=\"Qwen/Qwen3-4B-Instruct-2507\")"
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "**Use OpenAI's GPT models (requires an API key)**\n",
+    "\n",
+    "[Get an OpenAI API key](https://platform.openai.com/api-keys) and set it as the `OPENAI_API_KEY` environment variable. Then initialize `OpenAIChatGenerator` with the model name you want to use. "
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "id": "SavE_FAqfApo"
+   },
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "from getpass import getpass\n",
+    "from haystack.components.generators.chat import OpenAIChatGenerator\n",
+    "\n",
+    "if \"OPENAI_API_KEY\" not in os.environ:\n",
+    "    os.environ[\"OPENAI_API_KEY\"] = getpass(\"Enter OpenAI API key:\")\n",
+    "    \n",
+    "chat_generator = OpenAIChatGenerator(model=\"gpt-4o-mini\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "**Use Mistral models (requires a free API key)**\n",
+    "\n",
+    "[Get a Mistral API key](https://docs.mistral.ai/) (free tier available) and set it as the `MISTRAL_API_KEY` environment variable. Then initialize `MistralChatGenerator` with the model name you want to use. "
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/"
     },
+    "id": "0-zl-0WsZI7T",
+    "outputId": "dffb77e3-8c03-4fc2-d038-692e1d3cc2e7"
+   },
+   "outputs": [
     {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/",
-          "height": 86,
-          "referenced_widgets": [
-            "4e6e97b6d54f4f80bb7e8b25aba8e616",
-            "1a820c06a7a049d8b6c9ff300284d06e",
-            "58ff4e0603a74978a134f63533859be5",
-            "8bdb8bfae31d4f4cb6c3b0bf43120eed",
-            "39a68d9a5c274e2dafaa2d1f86eea768",
-            "d0cfe5dacdfc431a91b4c4741123e2d0",
-            "e7f1e1a14bb740d18827dd78bbe7b2e3",
-            "3fda06f905b445a488efdd2dd08c0939",
-            "2bc341a780f7498ba9cd475468841bb5",
-            "d7218475e23b420a8c03d00ca4ab8718",
-            "a694abaf765f4d1b82fa0138e59c6793"
-          ]
-        },
-        "id": "Vnt283M5O-qc",
-        "outputId": "d2843a73-3ad5-4daa-8d1e-a58de7aa2bb0"
-      },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "Batches: 100%|██████████| 1/1 [00:00<00:00,  1.77it/s]\n",
-            "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n",
-            "To disable this warning, you can either:\n",
-            "\t- Avoid using `tokenizers` before the fork if possible\n",
-            "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n"
-          ]
-        },
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "The Colossus of Rhodes was a statue of the Greek sun-god Helios, standing approximately 70 cubits (about 33 meters or 108 feet) tall. Although no complete descriptions of its appearance exist, scholars believe it featured the following characteristics:\n",
-            "\n",
-            "1. **Facial Features**: The head of the statue likely had curly hair, with spikes resembling bronze or silver flames radiating outward. This style is similar to depictions found on contemporary Rhodian coins.\n",
-            "\n",
-            "2. **Posture**: While the exact pose is uncertain, it is suggested that the statue may have been constructed in a pose where Helios is depicted shielding his eyes with one hand, a common representation of someone looking toward the sun.\n",
-            "\n",
-            "3. **Construction Materials**: The structure was built using iron tie bars and brass plates, which formed the skin of the statue. The interior was filled with stone blocks.\n",
-            "\n",
-            "4. **Height and Scale**: The Colossus was positioned on a 15-metre-high (49-foot) pedestal, making it one of the tallest statues of the ancient world, towering over the harbor entrance.\n",
-            "\n",
-            "5. **Symbolic Representation**: The statue was meant to symbolize the victory and freedom of the Rhodians after successfully defending their city against an invader.\n",
-            "\n",
-            "Overall, the Colossus of Rhodes was an impressive and monumental statue designed to celebrate and symbolize the strength and resilience of the city of Rhodes.\n"
-          ]
-        }
-      ],
-      "source": [
-        "question = \"What does Rhodes Statue look like?\"\n",
-        "\n",
-        "response = basic_rag_pipeline.run({\"text_embedder\": {\"text\": question}, \"prompt_builder\": {\"question\": question}})\n",
-        "\n",
-        "print(response[\"llm\"][\"replies\"][0].text)"
-      ]
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Enter Mistral API key:··········\n"
+     ]
+    }
+   ],
+   "source": [
+    "import os\n",
+    "from getpass import getpass\n",
+    "from haystack_integrations.components.generators.mistral import MistralChatGenerator\n",
+    "\n",
+    "if \"MISTRAL_API_KEY\" not in os.environ:\n",
+    "  os.environ[\"MISTRAL_API_KEY\"] = getpass(\"Enter Mistral API key:\")\n",
+    "  \n",
+    "chat_generator = MistralChatGenerator(model=\"mistral-small-latest\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "nenbo2SvycHd"
+   },
+   "source": [
+    "> You can replace the examples above with any Haystack `ChatGenerator` that fits your setup: another API provider or a local / Colab-hosted backend. See the full list of chat generators [here](https://docs.haystack.deepset.ai/docs/generators)."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "1bfHwOQwycHe"
+   },
+   "source": [
+    "### Build the Pipeline\n",
+    "\n",
+    "To build a pipeline, add all components to your pipeline and connect them. Create connections from `text_embedder`'s \"embedding\" output to the \"query_embedding\" input of `retriever`, from `retriever` to `prompt_builder`, and from `prompt_builder` to `llm`. Explicitly connect the output of `retriever` with the \"documents\" input of `prompt_builder` to make the connection obvious, as `prompt_builder` has two inputs (\"documents\" and \"question\").\n",
+    "\n",
+    "For more information on pipelines and creating connections, refer to [Creating Pipelines](https://docs.haystack.deepset.ai/docs/creating-pipelines) documentation."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {
+    "id": "f6NFmpjEO-qb"
+   },
+   "outputs": [],
+   "source": [
+    "from haystack import Pipeline\n",
+    "\n",
+    "basic_rag_pipeline = Pipeline()\n",
+    "# Add components to your pipeline\n",
+    "basic_rag_pipeline.add_component(\"text_embedder\", text_embedder)\n",
+    "basic_rag_pipeline.add_component(\"retriever\", retriever)\n",
+    "basic_rag_pipeline.add_component(\"prompt_builder\", prompt_builder)\n",
+    "basic_rag_pipeline.add_component(\"llm\", chat_generator)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/"
     },
+    "id": "CyqzFsp1qWVM",
+    "outputId": "591f9e19-13d6-4232-f00a-d6becd89694b"
+   },
+   "outputs": [
     {
-      "cell_type": "code",
-      "execution_count": 16,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/",
-          "height": 712,
-          "referenced_widgets": [
-            "3a404870f30f48aeb5fce11bcb794a1a",
-            "6b9eb9888076445c92b80f9aa29121ce",
-            "1839264932db40d0a40ccbfc08b50896",
-            "0a893c45730f4ce5a36060dcc880add1",
-            "699de9f0c89e4cc294b341932c4decc7",
-            "d283295d0bec454d9bd84256f14904ea",
-            "b4d7b68ea70b449b95eadc54e37954d6",
-            "0c9be40eb1064e50a70fe4de5cf9c760",
-            "96d50cf0bf05451a91c9eed788d36ed0",
-            "d891ea3f48314c7199f0963277063df8",
-            "24d82ad3686c4616aff7987647485df6"
-          ]
-        },
-        "id": "v6bQceW8ZduN",
-        "outputId": "f8ca4d07-ca67-4810-d07c-354c7888f80f"
-      },
-      "outputs": [
-        {
-          "data": {
-            "application/vnd.jupyter.widget-view+json": {
-              "model_id": "3a404870f30f48aeb5fce11bcb794a1a",
-              "version_major": 2,
-              "version_minor": 0
-            },
-            "text/plain": [
-              "Batches:   0%|          | 0/1 [00:00<?, ?it/s]"
-            ]
-          },
-          "metadata": {},
-          "output_type": "display_data"
-        },
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "The **Colossus of Rhodes** was a massive bronze statue of the Greek sun-god **Helios**, the patron deity of Rhodes. While no surviving images or detailed descriptions of the statue exist, historians and archaeologists have pieced together its likely appearance based on:\n",
-            "\n",
-            "### **1. General Description**\n",
-            "- **Height**: Approximately **32–33 meters (105–108 feet)** tall (about the height of the Statue of Liberty from feet to crown).\n",
-            "- **Material**: Constructed with **iron tie bars** for structural support, covered in **bronze plates** (likely hammered bronze sheets).\n",
-            "- **Pose**: Most scholars believe it stood in a **contrapposto pose** (weight on one leg, with the other slightly bent), possibly with one hand raised to shield its eyes from the sun (similar to depictions on Rhodian coins).\n",
-            "- **Head & Face**: Based on contemporary Rhodian coins, Helios was depicted with **curly hair** and **radiant spikes** (possibly representing sun rays) on his head.\n",
-            "\n",
-            "### **2. Possible Depictions**\n",
-            "- **Torch or Crown?**\n",
-            "  - Some ancient texts mention the Rhodians \"kindled the torch of freedom\" after the siege, leading to speculation that the statue may have held a **torch aloft** (like the Statue of Liberty).\n",
-            "  - However, no direct evidence supports this; it may have been a symbolic reference rather than a physical torch.\n",
-            "- **Helios’ Standard Pose**:\n",
-            "  - A **relief in a nearby temple** shows Helios standing with one hand shielding his eyes, suggesting the Colossus may have been in a similar pose.\n",
-            "\n",
-            "### **3. Comparison to Other Ancient Statues**\n",
-            "- Similar to other **Hellenistic bronze statues** (e.g., the **Zeus at Olympia** or **Athena Parthenos**), the Colossus likely had:\n",
-            "  - A **muscular, idealized human form** (Helios was often depicted as youthful and athletic).\n",
-            "  - **Detailed drapery** (if wearing a robe, though no records confirm this).\n",
-            "  - **A crown or radiant headpiece** (symbolizing the sun).\n",
-            "\n",
-            "### **4. Controversies & Alternative Theories**\n",
-            "- **Harbour-Straddling Myth**:\n",
-            "  - Ancient accounts of the Colossus **spanning the harbor entrance** are considered **unrealistic** by modern scholars due to engineering constraints (the statue would collapse under its own weight).\n",
-            "- **Location**:\n",
-            "  - Likely stood near the **harbor entrance** (possibly on a **15-meter marble pedestal**), but not straddling it.\n",
-            "  - Some propose it was built on a **breakwater** or near the **Fortress of St. Nicholas**.\n",
-            "\n",
-            "### **5. Legacy & Influence**\n",
-            "- The Colossus inspired later monumental statues, including the **Statue of Liberty** (which shares its height and torch symbolism).\n",
-            "- Its **fall and destruction** (after the 226 BC earthquake) left a lasting myth, with debates over whether its ruins blocked the harbor.\n",
-            "\n",
-            "### **Conclusion**\n",
-            "The Colossus of Rhodes was a **towering bronze statue of Helios**, likely standing in a **heroic, contrapposto pose** with a **radiant headpiece**, possibly with one hand raised. While its exact appearance remains speculative, it was one of the most impressive feats of ancient engineering—a testament to Rhodes' wealth and devotion to its patron god.\n",
-            "\n",
-            "Would you like details on how it was constructed or its cultural significance?\n"
-          ]
-        }
-      ],
-      "source": [
-        "question = \"What does Rhodes Statue look like?\"\n",
-        "\n",
-        "response = basic_rag_pipeline.run({\"text_embedder\": {\"text\": question}, \"prompt_builder\": {\"question\": question}})\n",
-        "\n",
-        "print(response[\"llm\"][\"replies\"][0].text)"
+     "data": {
+      "text/plain": [
+       "<haystack.core.pipeline.pipeline.Pipeline object at 0x7a7fb2c19730>\n",
+       "🚅 Components\n",
+       "  - text_embedder: SentenceTransformersTextEmbedder\n",
+       "  - retriever: InMemoryEmbeddingRetriever\n",
+       "  - prompt_builder: ChatPromptBuilder\n",
+       "  - llm: MistralChatGenerator\n",
+       "🛤️ Connections\n",
+       "  - text_embedder.embedding -> retriever.query_embedding (list[float])\n",
+       "  - retriever.documents -> prompt_builder.documents (list[Document])\n",
+       "  - prompt_builder.prompt -> llm.messages (list[ChatMessage])"
       ]
+     },
+     "execution_count": 15,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Now, connect the components to each other\n",
+    "basic_rag_pipeline.connect(\"text_embedder.embedding\", \"retriever.query_embedding\")\n",
+    "basic_rag_pipeline.connect(\"retriever\", \"prompt_builder\")\n",
+    "basic_rag_pipeline.connect(\"prompt_builder.prompt\", \"llm.messages\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "6NqyLhx7O-qc"
+   },
+   "source": [
+    "That's it! Your RAG pipeline is ready to generate answers to questions!"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "DBAyF5tVO-qc"
+   },
+   "source": "## Asking a Question\n\nWhen asking a question, use the `run()` method of the pipeline. Make sure to provide the question to both the `text_embedder` and the `prompt_builder`. This ensures that the `{{question}}` variable in the template prompt gets replaced with your specific question.\n\n> ⚠️ If you host the model on the Colab runtime (for example, with `TransformersChatGenerator`), the first pipeline run can take longer as the LLM is loaded and prepared for inference."
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/",
+     "height": 86,
+     "referenced_widgets": [
+      "4e6e97b6d54f4f80bb7e8b25aba8e616",
+      "1a820c06a7a049d8b6c9ff300284d06e",
+      "58ff4e0603a74978a134f63533859be5",
+      "8bdb8bfae31d4f4cb6c3b0bf43120eed",
+      "39a68d9a5c274e2dafaa2d1f86eea768",
+      "d0cfe5dacdfc431a91b4c4741123e2d0",
+      "e7f1e1a14bb740d18827dd78bbe7b2e3",
+      "3fda06f905b445a488efdd2dd08c0939",
+      "2bc341a780f7498ba9cd475468841bb5",
+      "d7218475e23b420a8c03d00ca4ab8718",
+      "a694abaf765f4d1b82fa0138e59c6793"
+     ]
     },
+    "id": "Vnt283M5O-qc",
+    "outputId": "d2843a73-3ad5-4daa-8d1e-a58de7aa2bb0"
+   },
+   "outputs": [
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "IWQN-aoGO-qc"
-      },
-      "source": [
-        "Here are some other example questions to test:"
-      ]
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Batches: 100%|██████████| 1/1 [00:00<00:00,  1.77it/s]\n",
+      "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n",
+      "To disable this warning, you can either:\n",
+      "\t- Avoid using `tokenizers` before the fork if possible\n",
+      "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n"
+     ]
     },
     {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "id": "_OHUQ5xxO-qc"
-      },
-      "outputs": [],
-      "source": [
-        "examples = [\n",
-        "    \"Where is Gardens of Babylon?\",\n",
-        "    \"Why did people build Great Pyramid of Giza?\",\n",
-        "    \"What does Rhodes Statue look like?\",\n",
-        "    \"Why did people visit the Temple of Artemis?\",\n",
-        "    \"What is the importance of Colossus of Rhodes?\",\n",
-        "    \"What happened to the Tomb of Mausolus?\",\n",
-        "    \"How did Colossus of Rhodes collapse?\",\n",
-        "]"
-      ]
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "The Colossus of Rhodes was a statue of the Greek sun-god Helios, standing approximately 70 cubits (about 33 meters or 108 feet) tall. Although no complete descriptions of its appearance exist, scholars believe it featured the following characteristics:\n",
+      "\n",
+      "1. **Facial Features**: The head of the statue likely had curly hair, with spikes resembling bronze or silver flames radiating outward. This style is similar to depictions found on contemporary Rhodian coins.\n",
+      "\n",
+      "2. **Posture**: While the exact pose is uncertain, it is suggested that the statue may have been constructed in a pose where Helios is depicted shielding his eyes with one hand, a common representation of someone looking toward the sun.\n",
+      "\n",
+      "3. **Construction Materials**: The structure was built using iron tie bars and brass plates, which formed the skin of the statue. The interior was filled with stone blocks.\n",
+      "\n",
+      "4. **Height and Scale**: The Colossus was positioned on a 15-metre-high (49-foot) pedestal, making it one of the tallest statues of the ancient world, towering over the harbor entrance.\n",
+      "\n",
+      "5. **Symbolic Representation**: The statue was meant to symbolize the victory and freedom of the Rhodians after successfully defending their city against an invader.\n",
+      "\n",
+      "Overall, the Colossus of Rhodes was an impressive and monumental statue designed to celebrate and symbolize the strength and resilience of the city of Rhodes.\n"
+     ]
+    }
+   ],
+   "source": [
+    "question = \"What does Rhodes Statue look like?\"\n",
+    "\n",
+    "response = basic_rag_pipeline.run({\"text_embedder\": {\"text\": question}, \"prompt_builder\": {\"question\": question}})\n",
+    "\n",
+    "print(response[\"llm\"][\"replies\"][0].text)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/",
+     "height": 712,
+     "referenced_widgets": [
+      "3a404870f30f48aeb5fce11bcb794a1a",
+      "6b9eb9888076445c92b80f9aa29121ce",
+      "1839264932db40d0a40ccbfc08b50896",
+      "0a893c45730f4ce5a36060dcc880add1",
+      "699de9f0c89e4cc294b341932c4decc7",
+      "d283295d0bec454d9bd84256f14904ea",
+      "b4d7b68ea70b449b95eadc54e37954d6",
+      "0c9be40eb1064e50a70fe4de5cf9c760",
+      "96d50cf0bf05451a91c9eed788d36ed0",
+      "d891ea3f48314c7199f0963277063df8",
+      "24d82ad3686c4616aff7987647485df6"
+     ]
     },
+    "id": "v6bQceW8ZduN",
+    "outputId": "f8ca4d07-ca67-4810-d07c-354c7888f80f"
+   },
+   "outputs": [
     {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "XueCK3y4O-qc"
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3a404870f30f48aeb5fce11bcb794a1a",
+       "version_major": 2,
+       "version_minor": 0
       },
-      "source": [
-        "## What's next\n",
-        "\n",
-        "🎉 Congratulations! You've learned how to create a generative QA system for your documents with the RAG approach.\n",
-        "\n",
-        "If you liked this tutorial, you may also enjoy:\n",
-        "- [Filtering Documents with Metadata](https://haystack.deepset.ai/tutorials/31_metadata_filtering)\n",
-        "- [Preprocessing Different File Types](https://haystack.deepset.ai/tutorials/30_file_type_preprocessing_index_pipeline)\n",
-        "- [Creating a Hybrid Retrieval Pipeline](https://haystack.deepset.ai/tutorials/33_hybrid_retrieval)\n",
-        "\n",
-        "To stay up to date on the latest Haystack developments, you can [subscribe to our newsletter](https://landing.deepset.ai/haystack-community-updates) and [join the Haystack Discord community](https://discord.com/invite/xYvH6drSmA).\n",
-        "\n",
-        "Thanks for reading!"
+      "text/plain": [
+       "Batches:   0%|          | 0/1 [00:00<?, ?it/s]"
       ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "id": "pwWunnaubzFD"
-      },
-      "outputs": [],
-      "source": []
-    }
-  ],
-  "metadata": {
-    "accelerator": "GPU",
-    "colab": {
-      "gpuType": "T4",
-      "provenance": []
-    },
-    "kernelspec": {
-      "display_name": "Python 3",
-      "name": "python3"
-    },
-    "language_info": {
-      "codemirror_mode": {
-        "name": "ipython",
-        "version": 3
-      },
-      "file_extension": ".py",
-      "mimetype": "text/x-python",
-      "name": "python",
-      "nbconvert_exporter": "python",
-      "pygments_lexer": "ipython3",
-      "version": "3.9.6"
-    },
-    "orig_nbformat": 4,
-    "vscode": {
-      "interpreter": {
-        "hash": "31f2aee4e71d21fbe5cf8b01ff0e069b9275f58929596ceb00d14d90e3e16cd6"
-      }
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "The **Colossus of Rhodes** was a massive bronze statue of the Greek sun-god **Helios**, the patron deity of Rhodes. While no surviving images or detailed descriptions of the statue exist, historians and archaeologists have pieced together its likely appearance based on:\n",
+      "\n",
+      "### **1. General Description**\n",
+      "- **Height**: Approximately **32–33 meters (105–108 feet)** tall (about the height of the Statue of Liberty from feet to crown).\n",
+      "- **Material**: Constructed with **iron tie bars** for structural support, covered in **bronze plates** (likely hammered bronze sheets).\n",
+      "- **Pose**: Most scholars believe it stood in a **contrapposto pose** (weight on one leg, with the other slightly bent), possibly with one hand raised to shield its eyes from the sun (similar to depictions on Rhodian coins).\n",
+      "- **Head & Face**: Based on contemporary Rhodian coins, Helios was depicted with **curly hair** and **radiant spikes** (possibly representing sun rays) on his head.\n",
+      "\n",
+      "### **2. Possible Depictions**\n",
+      "- **Torch or Crown?**\n",
+      "  - Some ancient texts mention the Rhodians \"kindled the torch of freedom\" after the siege, leading to speculation that the statue may have held a **torch aloft** (like the Statue of Liberty).\n",
+      "  - However, no direct evidence supports this; it may have been a symbolic reference rather than a physical torch.\n",
+      "- **Helios’ Standard Pose**:\n",
+      "  - A **relief in a nearby temple** shows Helios standing with one hand shielding his eyes, suggesting the Colossus may have been in a similar pose.\n",
+      "\n",
+      "### **3. Comparison to Other Ancient Statues**\n",
+      "- Similar to other **Hellenistic bronze statues** (e.g., the **Zeus at Olympia** or **Athena Parthenos**), the Colossus likely had:\n",
+      "  - A **muscular, idealized human form** (Helios was often depicted as youthful and athletic).\n",
+      "  - **Detailed drapery** (if wearing a robe, though no records confirm this).\n",
+      "  - **A crown or radiant headpiece** (symbolizing the sun).\n",
+      "\n",
+      "### **4. Controversies & Alternative Theories**\n",
+      "- **Harbour-Straddling Myth**:\n",
+      "  - Ancient accounts of the Colossus **spanning the harbor entrance** are considered **unrealistic** by modern scholars due to engineering constraints (the statue would collapse under its own weight).\n",
+      "- **Location**:\n",
+      "  - Likely stood near the **harbor entrance** (possibly on a **15-meter marble pedestal**), but not straddling it.\n",
+      "  - Some propose it was built on a **breakwater** or near the **Fortress of St. Nicholas**.\n",
+      "\n",
+      "### **5. Legacy & Influence**\n",
+      "- The Colossus inspired later monumental statues, including the **Statue of Liberty** (which shares its height and torch symbolism).\n",
+      "- Its **fall and destruction** (after the 226 BC earthquake) left a lasting myth, with debates over whether its ruins blocked the harbor.\n",
+      "\n",
+      "### **Conclusion**\n",
+      "The Colossus of Rhodes was a **towering bronze statue of Helios**, likely standing in a **heroic, contrapposto pose** with a **radiant headpiece**, possibly with one hand raised. While its exact appearance remains speculative, it was one of the most impressive feats of ancient engineering—a testament to Rhodes' wealth and devotion to its patron god.\n",
+      "\n",
+      "Would you like details on how it was constructed or its cultural significance?\n"
+     ]
     }
+   ],
+   "source": [
+    "question = \"What does Rhodes Statue look like?\"\n",
+    "\n",
+    "response = basic_rag_pipeline.run({\"text_embedder\": {\"text\": question}, \"prompt_builder\": {\"question\": question}})\n",
+    "\n",
+    "print(response[\"llm\"][\"replies\"][0].text)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "IWQN-aoGO-qc"
+   },
+   "source": [
+    "Here are some other example questions to test:"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "id": "_OHUQ5xxO-qc"
+   },
+   "outputs": [],
+   "source": [
+    "examples = [\n",
+    "    \"Where is Gardens of Babylon?\",\n",
+    "    \"Why did people build Great Pyramid of Giza?\",\n",
+    "    \"What does Rhodes Statue look like?\",\n",
+    "    \"Why did people visit the Temple of Artemis?\",\n",
+    "    \"What is the importance of Colossus of Rhodes?\",\n",
+    "    \"What happened to the Tomb of Mausolus?\",\n",
+    "    \"How did Colossus of Rhodes collapse?\",\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "XueCK3y4O-qc"
+   },
+   "source": [
+    "## What's next\n",
+    "\n",
+    "🎉 Congratulations! You've learned how to create a generative QA system for your documents with the RAG approach.\n",
+    "\n",
+    "If you liked this tutorial, you may also enjoy:\n",
+    "- [Filtering Documents with Metadata](https://haystack.deepset.ai/tutorials/31_metadata_filtering)\n",
+    "- [Preprocessing Different File Types](https://haystack.deepset.ai/tutorials/30_file_type_preprocessing_index_pipeline)\n",
+    "- [Creating a Hybrid Retrieval Pipeline](https://haystack.deepset.ai/tutorials/33_hybrid_retrieval)\n",
+    "\n",
+    "To stay up to date on the latest Haystack developments, you can [subscribe to our newsletter](https://landing.deepset.ai/haystack-community-updates) and [join the Haystack Discord community](https://discord.com/invite/xYvH6drSmA).\n",
+    "\n",
+    "Thanks for reading!"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "id": "pwWunnaubzFD"
+   },
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "accelerator": "GPU",
+  "colab": {
+   "gpuType": "T4",
+   "provenance": []
+  },
+  "kernelspec": {
+   "display_name": "Python 3",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.6"
   },
-  "nbformat": 4,
-  "nbformat_minor": 0
-}
+  "orig_nbformat": 4,
+  "vscode": {
+   "interpreter": {
+    "hash": "31f2aee4e71d21fbe5cf8b01ff0e069b9275f58929596ceb00d14d90e3e16cd6"
+   }
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}
\ No newline at end of file
diff --git a/tutorials/29_Serializing_Pipelines.ipynb b/tutorials/29_Serializing_Pipelines.ipynb
index ed1e65c..64fc550 100644
--- a/tutorials/29_Serializing_Pipelines.ipynb
+++ b/tutorials/29_Serializing_Pipelines.ipynb
@@ -5,15 +5,7 @@
    "metadata": {
     "id": "cFFW8D-weE2S"
    },
-   "source": [
-    "# Tutorial: Serializing LLM Pipelines\n",
-    "\n",
-    "- **Level**: Beginner\n",
-    "- **Time to complete**: 10 minutes\n",
-    "- **Components Used**: [`HuggingFaceLocalChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfacelocalchatgenerator), [`ChatPromptBuilder`](https://docs.haystack.deepset.ai/docs/chatpromptbuilder)\n",
-    "- **Prerequisites**: None\n",
-    "- **Goal**: After completing this tutorial, you'll understand how to serialize and deserialize between YAML and Python code."
-   ]
+   "source": "# Tutorial: Serializing LLM Pipelines\n\n- **Level**: Beginner\n- **Time to complete**: 10 minutes\n- **Components Used**: [`TransformersChatGenerator`](https://docs.haystack.deepset.ai/docs/transformerschatgenerator), [`ChatPromptBuilder`](https://docs.haystack.deepset.ai/docs/chatpromptbuilder)\n- **Prerequisites**: None\n- **Goal**: After completing this tutorial, you'll understand how to serialize and deserialize pipelines between YAML and Python code."
   },
   {
    "cell_type": "markdown",
@@ -35,11 +27,7 @@
    "metadata": {
     "id": "TLaHxdJcfWtI"
    },
-   "source": [
-    "## Installing Haystack\n",
-    "\n",
-    "Install Haystack with `pip`:"
-   ]
+   "source": "## Installing Haystack\n\nInstall Haystack and the [`transformers-haystack`](https://haystack.deepset.ai/integrations/huggingface) integration (which provides `TransformersChatGenerator`) with `pip`:"
   },
   {
    "cell_type": "code",
@@ -52,11 +40,7 @@
     "outputId": "e304450a-24e3-4ef8-e642-1fbb573e7d55"
    },
    "outputs": [],
-   "source": [
-    "%%bash\n",
-    "\n",
-    "pip install haystack-ai"
-   ]
+   "source": "%%bash\n\npip install haystack-ai transformers-haystack"
   },
   {
    "cell_type": "markdown",
@@ -71,51 +55,12 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": null,
    "metadata": {
     "id": "odZJjD7KgO1g"
    },
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "<haystack.core.pipeline.pipeline.Pipeline object at 0x13cc77370>\n",
-       "🚅 Components\n",
-       "  - builder: ChatPromptBuilder\n",
-       "  - llm: HuggingFaceLocalChatGenerator\n",
-       "🛤️ Connections\n",
-       "  - builder.prompt -> llm.messages (List[ChatMessage])"
-      ]
-     },
-     "execution_count": 3,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "from haystack import Pipeline\n",
-    "from haystack.components.builders import ChatPromptBuilder\n",
-    "from haystack.dataclasses import ChatMessage\n",
-    "from haystack.components.generators.chat import HuggingFaceLocalChatGenerator\n",
-    "\n",
-    "template = [\n",
-    "    ChatMessage.from_user(\n",
-    "        \"\"\"\n",
-    "Please create a summary about the following topic:\n",
-    "{{ topic }}\n",
-    "\"\"\"\n",
-    "    )\n",
-    "]\n",
-    "\n",
-    "builder = ChatPromptBuilder(template=template)\n",
-    "llm = HuggingFaceLocalChatGenerator(model=\"Qwen/Qwen2.5-1.5B-Instruct\", generation_kwargs={\"max_new_tokens\": 150})\n",
-    "\n",
-    "pipeline = Pipeline()\n",
-    "pipeline.add_component(name=\"builder\", instance=builder)\n",
-    "pipeline.add_component(name=\"llm\", instance=llm)\n",
-    "\n",
-    "pipeline.connect(\"builder.prompt\", \"llm.messages\")"
-   ]
+   "outputs": [],
+   "source": "from haystack import Pipeline\nfrom haystack.components.builders import ChatPromptBuilder\nfrom haystack.dataclasses import ChatMessage\nfrom haystack_integrations.components.generators.transformers import TransformersChatGenerator\n\ntemplate = [\n    ChatMessage.from_user(\n        \"\"\"\nPlease create a summary about the following topic:\n{{ topic }}\n\"\"\"\n    )\n]\n\nbuilder = ChatPromptBuilder(template=template)\nllm = TransformersChatGenerator(model=\"Qwen/Qwen2.5-1.5B-Instruct\", generation_kwargs={\"max_new_tokens\": 150})\n\npipeline = Pipeline()\npipeline.add_component(name=\"builder\", instance=builder)\npipeline.add_component(name=\"llm\", instance=llm)\n\npipeline.connect(\"builder.prompt\", \"llm.messages\")"
   },
   {
    "cell_type": "code",
@@ -225,54 +170,7 @@
    "metadata": {
     "id": "0C7zGsUCGszq"
    },
-   "source": [
-    "You should get a pipeline YAML that looks like the following:\n",
-    "\n",
-    "```yaml\n",
-    "components:\n",
-    "  builder:\n",
-    "    init_parameters:\n",
-    "      required_variables: null\n",
-    "      template:\n",
-    "      - _content:\n",
-    "        - text: '\n",
-    "\n",
-    "            Please create a summary about the following topic:\n",
-    "\n",
-    "            {{ topic }}\n",
-    "\n",
-    "            '\n",
-    "        _meta: {}\n",
-    "        _name: null\n",
-    "        _role: user\n",
-    "      variables: null\n",
-    "    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n",
-    "  llm:\n",
-    "    init_parameters:\n",
-    "      init_parameters:\n",
-    "      generation_kwargs:\n",
-    "        max_new_tokens: 150\n",
-    "        stop_sequences: []\n",
-    "      huggingface_pipeline_kwargs:\n",
-    "        device: cpu\n",
-    "        model: Qwen/Qwen2.5-1.5B-Instruct\n",
-    "        task: text-generation\n",
-    "      streaming_callback: null\n",
-    "      token:\n",
-    "        env_vars:\n",
-    "        - HF_API_TOKEN\n",
-    "        - HF_TOKEN\n",
-    "        strict: false\n",
-    "        type: env_var\n",
-    "    type: haystack.components.generators.chat.hugging_face_local.HuggingFaceLocalChatGenerator\n",
-    "connections:\n",
-    "- receiver: llm.messages\n",
-    "  sender: builder.prompt\n",
-    "max_runs_per_component: 100\n",
-    "metadata: {}\n",
-    "\n",
-    "```"
-   ]
+   "source": "You should get a pipeline YAML that looks like the following:\n\n```yaml\ncomponents:\n  builder:\n    init_parameters:\n      required_variables: null\n      template:\n      - _content:\n        - text: '\n\n            Please create a summary about the following topic:\n\n            {{ topic }}\n\n            '\n        _meta: {}\n        _name: null\n        _role: user\n      variables: null\n    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n  llm:\n    init_parameters:\n      chat_template: null\n      enable_thinking: false\n      generation_kwargs:\n        max_new_tokens: 150\n      huggingface_pipeline_kwargs:\n        device: cpu\n        model: Qwen/Qwen2.5-1.5B-Instruct\n        task: text-generation\n      streaming_callback: null\n      token:\n        env_vars:\n        - HF_API_TOKEN\n        - HF_TOKEN\n        strict: false\n        type: env_var\n      tool_parsing_function: haystack_integrations.components.generators.transformers.chat.chat_generator.default_tool_parser\n      tools: null\n    type: haystack_integrations.components.generators.transformers.chat.chat_generator.TransformersChatGenerator\nconnections:\n- receiver: llm.messages\n  sender: builder.prompt\nmax_runs_per_component: 100\nmetadata: {}\n\n```"
   },
   {
    "cell_type": "markdown",
@@ -287,49 +185,12 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": null,
    "metadata": {
     "id": "U332-VjovFfn"
    },
    "outputs": [],
-   "source": [
-    "yaml_pipeline = \"\"\"\n",
-    "components:\n",
-    "  builder:\n",
-    "    init_parameters:\n",
-    "      template:\n",
-    "      - _content:\n",
-    "        - text: 'Please translate the following to French: \\n{{ sentence }}\\n'\n",
-    "        _meta: {}\n",
-    "        _name: null\n",
-    "        _role: user\n",
-    "      variables: null\n",
-    "    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n",
-    "  llm:\n",
-    "    init_parameters:\n",
-    "      generation_kwargs:\n",
-    "        max_new_tokens: 150\n",
-    "        stop_sequences: []\n",
-    "      huggingface_pipeline_kwargs:\n",
-    "        device: cpu\n",
-    "        model: Qwen/Qwen2.5-1.5B-Instruct\n",
-    "        task: text-generation\n",
-    "      streaming_callback: null\n",
-    "      chat_template : \"{% for message in messages %}{% if message['role'] == 'user' %}{{ ' ' }}{% endif %}{{ message['content'] }}{% if not loop.last %}{{ '  ' }}{% endif %}{% endfor %}{{ eos_token }}\"\n",
-    "      token:\n",
-    "        env_vars:\n",
-    "        - HF_API_TOKEN\n",
-    "        - HF_TOKEN\n",
-    "        strict: false\n",
-    "        type: env_var\n",
-    "    type: haystack.components.generators.chat.hugging_face_local.HuggingFaceLocalChatGenerator\n",
-    "connections:\n",
-    "- receiver: llm.messages\n",
-    "  sender: builder.prompt\n",
-    "max_runs_per_component: 100\n",
-    "metadata: {}\n",
-    "\"\"\""
-   ]
+   "source": "yaml_pipeline = \"\"\"\ncomponents:\n  builder:\n    init_parameters:\n      template:\n      - _content:\n        - text: 'Please translate the following to French: \\n{{ sentence }}\\n'\n        _meta: {}\n        _name: null\n        _role: user\n      variables: null\n    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n  llm:\n    init_parameters:\n      generation_kwargs:\n        max_new_tokens: 150\n        stop_sequences: []\n      huggingface_pipeline_kwargs:\n        device: cpu\n        model: Qwen/Qwen2.5-1.5B-Instruct\n        task: text-generation\n      streaming_callback: null\n      chat_template : \"{% for message in messages %}{% if message['role'] == 'user' %}{{ ' ' }}{% endif %}{{ message['content'] }}{% if not loop.last %}{{ '  ' }}{% endif %}{% endfor %}{{ eos_token }}\"\n      token:\n        env_vars:\n        - HF_API_TOKEN\n        - HF_TOKEN\n        strict: false\n        type: env_var\n    type: haystack_integrations.components.generators.transformers.chat.chat_generator.TransformersChatGenerator\nconnections:\n- receiver: llm.messages\n  sender: builder.prompt\nmax_runs_per_component: 100\nmetadata: {}\n\"\"\""
   },
   {
    "cell_type": "markdown",
@@ -428,4 +289,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
+}
\ No newline at end of file
diff --git a/tutorials/33_Hybrid_Retrieval.ipynb b/tutorials/33_Hybrid_Retrieval.ipynb
index e11df79..febebfd 100644
--- a/tutorials/33_Hybrid_Retrieval.ipynb
+++ b/tutorials/33_Hybrid_Retrieval.ipynb
@@ -5,15 +5,7 @@
    "metadata": {
     "id": "kTas9ZQ7lXP7"
    },
-   "source": [
-    "# Tutorial: Creating a Hybrid Retrieval Pipeline\n",
-    "\n",
-    "- **Level**: Intermediate\n",
-    "- **Time to complete**: 15 minutes\n",
-    "- **Components Used**: [`DocumentSplitter`](https://docs.haystack.deepset.ai/docs/documentsplitter), [`SentenceTransformersDocumentEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder), [`InMemoryDocumentStore`](https://docs.haystack.deepset.ai/docs/inmemorydocumentstore), [`InMemoryBM25Retriever`](https://docs.haystack.deepset.ai/docs/inmemorybm25retriever), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), and [`TransformersSimilarityRanker`](https://docs.haystack.deepset.ai/docs/transformerssimilarityranker)\n",
-    "- **Prerequisites**: None\n",
-    "- **Goal**: After completing this tutorial, you will have learned about creating a hybrid retrieval and when it's useful."
-   ]
+   "source": "# Tutorial: Creating a Hybrid Retrieval Pipeline\n\n- **Level**: Intermediate\n- **Time to complete**: 15 minutes\n- **Components Used**: [`DocumentSplitter`](https://docs.haystack.deepset.ai/docs/documentsplitter), [`SentenceTransformersDocumentEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder), [`InMemoryDocumentStore`](https://docs.haystack.deepset.ai/docs/inmemorydocumentstore), [`InMemoryBM25Retriever`](https://docs.haystack.deepset.ai/docs/inmemorybm25retriever), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), and [`SentenceTransformersSimilarityRanker`](https://docs.haystack.deepset.ai/docs/sentencetransformerssimilarityranker)\n- **Prerequisites**: None\n- **Goal**: After completing this tutorial, you will have learned how to create a hybrid retrieval pipeline and when it's useful."
   },
   {
    "cell_type": "markdown",
@@ -230,24 +222,16 @@
    "metadata": {
     "id": "r8_jHzmosbC_"
    },
-   "source": [
-    "### 2) Rank the Results\n",
-    "\n",
-    "Use the [TransformersSimilarityRanker](https://docs.haystack.deepset.ai/docs/transformerssimilarityranker) that scores the relevancy of all retrieved documents for the given search query by using a cross encoder model. In this example, you will use [BAAI/bge-reranker-base](https://huggingface.co/BAAI/bge-reranker-base) model to rank the retrieved documents but you can replace this model with other cross-encoder models on Hugging Face."
-   ]
+   "source": "### 2) Rank the Results\n\nUse the [SentenceTransformersSimilarityRanker](https://docs.haystack.deepset.ai/docs/sentencetransformerssimilarityranker), which scores the relevance of all retrieved documents for the given search query using a cross-encoder model. In this example, you will use the [BAAI/bge-reranker-base](https://huggingface.co/BAAI/bge-reranker-base) model to rank the retrieved documents, but you can replace it with other cross-encoder models on Hugging Face."
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": null,
    "metadata": {
     "id": "cN0woIxHs4Ng"
    },
    "outputs": [],
-   "source": [
-    "from haystack.components.rankers import TransformersSimilarityRanker\n",
-    "\n",
-    "ranker = TransformersSimilarityRanker(model=\"BAAI/bge-reranker-base\")"
-   ]
+   "source": "from haystack.components.rankers import SentenceTransformersSimilarityRanker\n\nranker = SentenceTransformersSimilarityRanker(model=\"BAAI/bge-reranker-base\")"
   },
   {
    "cell_type": "markdown",
@@ -533,4 +517,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
+}
\ No newline at end of file
diff --git a/tutorials/34_Extractive_QA_Pipeline.ipynb b/tutorials/34_Extractive_QA_Pipeline.ipynb
index 64cba2f..1ece9a0 100644
--- a/tutorials/34_Extractive_QA_Pipeline.ipynb
+++ b/tutorials/34_Extractive_QA_Pipeline.ipynb
@@ -5,14 +5,7 @@
    "metadata": {
     "id": "2ErVy6A2NisJ"
    },
-   "source": [
-    " ## Tutorial: Build an Extractive QA Pipeline\n",
-    "\n",
-    "- **Level**: Beginner\n",
-    "- **Time to complete**: 15 minutes\n",
-    "- **Components Used**: [`ExtractiveReader`](https://docs.haystack.deepset.ai/docs/extractivereader), [`InMemoryDocumentStore`](https://docs.haystack.deepset.ai/docs/inmemorydocumentstore), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), [`DocumentWriter`](https://docs.haystack.deepset.ai/docs/documentwriter), [`SentenceTransformersDocumentEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder), [`SentenceTransformersTextEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder)\n",
-    "- **Goal**: After completing this tutorial, you'll have learned how to build a Haystack pipeline that uses an extractive model to display where the answer to your query is."
-   ]
+   "source": " ## Tutorial: Build an Extractive QA Pipeline\n\n- **Level**: Beginner\n- **Time to complete**: 15 minutes\n- **Components Used**: [`TransformersExtractiveReader`](https://docs.haystack.deepset.ai/docs/transformersextractivereader), [`InMemoryDocumentStore`](https://docs.haystack.deepset.ai/docs/inmemorydocumentstore), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), [`DocumentWriter`](https://docs.haystack.deepset.ai/docs/documentwriter), [`SentenceTransformersDocumentEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformersdocumentembedder), [`SentenceTransformersTextEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder)\n- **Goal**: After completing this tutorial, you'll have learned how to build a Haystack pipeline that uses an extractive model to display where the answer to your query is."
   },
   {
    "cell_type": "markdown",
@@ -45,11 +38,7 @@
     "id": "rwgpwV4eHVoo"
    },
    "outputs": [],
-   "source": [
-    "%%bash\n",
-    "\n",
-    "pip install haystack-ai accelerate \"sentence-transformers>=4.1.0\" \"datasets>=2.6.1\" \"transformers<5\""
-   ]
+   "source": "%%bash\n\npip install haystack-ai transformers-haystack accelerate \"sentence-transformers>=4.1.0\" \"datasets>=2.6.1\" \"transformers<5\""
   },
   {
    "cell_type": "markdown",
@@ -256,284 +245,15 @@
     "id": "ttuq7kLtaV5b",
     "outputId": "01877b76-f083-4a94-a90e-6717bcecc3d3"
    },
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_token.py:88: UserWarning: \n",
-      "The secret `HF_TOKEN` does not exist in your Colab secrets.\n",
-      "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n",
-      "You will be able to reuse this secret in all of your notebooks.\n",
-      "Please note that authentication is recommended but still optional to access public models or datasets.\n",
-      "  warnings.warn(\n"
-     ]
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "7003e95fe7594baa9dcf3b78001dae8c",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "Downloading readme:   0%|          | 0.00/46.0 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "f0128d87740d449eb7e5efcc3045f44e",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "Downloading data:   0%|          | 0.00/119k [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "518a021bc14546388ffc719adaa45c18",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "Generating train split: 0 examples [00:00, ? examples/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "0ca27757f7c64134931aef12165f4d74",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "modules.json:   0%|          | 0.00/229 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "30f823aaa04f4fc78ca022339c60bea7",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "config_sentence_transformers.json:   0%|          | 0.00/116 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "5b0ad080573e40919752004106dcd523",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "README.md:   0%|          | 0.00/8.66k [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "a2768619988240c591a4aa2d6fc8e4b6",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "sentence_bert_config.json:   0%|          | 0.00/53.0 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "fdb7c19e3e2a4408ac6ed1a1dd69d0e2",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "config.json:   0%|          | 0.00/571 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "a9f74674fc7b42aab231ba01aa112636",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "pytorch_model.bin:   0%|          | 0.00/438M [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "b95eac15198143c0a559320d8ba233e4",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "tokenizer_config.json:   0%|          | 0.00/363 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "0a5717f7492c4749a7bf9f5bf7c87181",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "vocab.txt:   0%|          | 0.00/232k [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "bf5a8dcb41694fd6a27ed94c5e132ff5",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "tokenizer.json:   0%|          | 0.00/466k [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "dbd79d2df046429bb10cbd9b52b4e5c3",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "special_tokens_map.json:   0%|          | 0.00/239 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "d2c569dd2a9b4287ab4af93dad846998",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "1_Pooling/config.json:   0%|          | 0.00/190 [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "31e2d766917c4e6fa927e6605e6e1b88",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "Batches:   0%|          | 0/5 [00:00<?, ?it/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "text/plain": [
-       "{'writer': {'documents_written': 151}}"
-      ]
-     },
-     "execution_count": 5,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "from datasets import load_dataset\n",
-    "from haystack import Document\n",
-    "from haystack import Pipeline\n",
-    "from haystack.document_stores.in_memory import InMemoryDocumentStore\n",
-    "from haystack.components.retrievers.in_memory import InMemoryEmbeddingRetriever\n",
-    "from haystack.components.readers import ExtractiveReader\n",
-    "from haystack.components.embedders import SentenceTransformersDocumentEmbedder\n",
-    "from haystack.components.writers import DocumentWriter\n",
-    "\n",
-    "\n",
-    "dataset = load_dataset(\"bilgeyucel/seven-wonders\", split=\"train\")\n",
-    "\n",
-    "documents = [Document(content=doc[\"content\"], meta=doc[\"meta\"]) for doc in dataset]\n",
-    "\n",
-    "model = \"sentence-transformers/multi-qa-mpnet-base-dot-v1\"\n",
-    "\n",
-    "document_store = InMemoryDocumentStore()\n",
-    "\n",
-    "indexing_pipeline = Pipeline()\n",
-    "\n",
-    "indexing_pipeline.add_component(instance=SentenceTransformersDocumentEmbedder(model=model), name=\"embedder\")\n",
-    "indexing_pipeline.add_component(instance=DocumentWriter(document_store=document_store), name=\"writer\")\n",
-    "indexing_pipeline.connect(\"embedder.documents\", \"writer.documents\")\n",
-    "\n",
-    "indexing_pipeline.run({\"documents\": documents})"
-   ]
+   "outputs": [],
+   "source": "from datasets import load_dataset\nfrom haystack import Document\nfrom haystack import Pipeline\nfrom haystack.document_stores.in_memory import InMemoryDocumentStore\nfrom haystack.components.retrievers.in_memory import InMemoryEmbeddingRetriever\nfrom haystack_integrations.components.readers.transformers import TransformersExtractiveReader\nfrom haystack.components.embedders import SentenceTransformersDocumentEmbedder\nfrom haystack.components.writers import DocumentWriter\n\n\ndataset = load_dataset(\"bilgeyucel/seven-wonders\", split=\"train\")\n\ndocuments = [Document(content=doc[\"content\"], meta=doc[\"meta\"]) for doc in dataset]\n\nmodel = \"sentence-transformers/multi-qa-mpnet-base-dot-v1\"\n\ndocument_store = InMemoryDocumentStore()\n\nindexing_pipeline = Pipeline()\n\nindexing_pipeline.add_component(instance=SentenceTransformersDocumentEmbedder(model=model), name=\"embedder\")\nindexing_pipeline.add_component(instance=DocumentWriter(document_store=document_store), name=\"writer\")\nindexing_pipeline.connect(\"embedder.documents\", \"writer.documents\")\n\nindexing_pipeline.run({\"documents\": documents})"
   },
   {
    "cell_type": "markdown",
    "metadata": {
     "id": "r5CL5VXaVQqE"
    },
-   "source": [
-    "## Build an Extractive QA Pipeline\n",
-    "\n",
-    "Your extractive QA pipeline will consist of three components: an embedder, retriever, and reader.\n",
-    "\n",
-    "- The `SentenceTransformersTextEmbedder` turns a query into a vector, using the same embedding model defined above.\n",
-    "\n",
-    "- Vector search allows the retriever to efficiently return relevant documents from the document store. Retrievers are tightly coupled with document stores; thus, you'll use an `InMemoryEmbeddingRetriever`to go with the `InMemoryDocumentStore`.\n",
-    "\n",
-    "- The `ExtractiveReader` returns answers to that query, as well as their location in the source document, and a confidence score.\n"
-   ]
+   "source": "## Build an Extractive QA Pipeline\n\nYour extractive QA pipeline will consist of three components: an embedder, a retriever, and a reader.\n\n- The `SentenceTransformersTextEmbedder` turns a query into a vector, using the same embedding model defined above.\n\n- Vector search allows the retriever to efficiently return relevant documents from the document store. Retrievers are tightly coupled with document stores; thus, you'll use an `InMemoryEmbeddingRetriever` to go with the `InMemoryDocumentStore`.\n\n- The `TransformersExtractiveReader` returns answers to that query, as well as their location in the source document, and a confidence score.\n"
   },
   {
    "cell_type": "code",
@@ -542,25 +262,7 @@
     "id": "xZGGv8yaHZtV"
    },
    "outputs": [],
-   "source": [
-    "from haystack.components.retrievers.in_memory import InMemoryEmbeddingRetriever\n",
-    "from haystack.components.readers import ExtractiveReader\n",
-    "from haystack.components.embedders import SentenceTransformersTextEmbedder\n",
-    "\n",
-    "\n",
-    "retriever = InMemoryEmbeddingRetriever(document_store=document_store)\n",
-    "reader = ExtractiveReader()\n",
-    "reader.warm_up()\n",
-    "\n",
-    "extractive_qa_pipeline = Pipeline()\n",
-    "\n",
-    "extractive_qa_pipeline.add_component(instance=SentenceTransformersTextEmbedder(model=model), name=\"embedder\")\n",
-    "extractive_qa_pipeline.add_component(instance=retriever, name=\"retriever\")\n",
-    "extractive_qa_pipeline.add_component(instance=reader, name=\"reader\")\n",
-    "\n",
-    "extractive_qa_pipeline.connect(\"embedder.embedding\", \"retriever.query_embedding\")\n",
-    "extractive_qa_pipeline.connect(\"retriever.documents\", \"reader.documents\")"
-   ]
+   "source": "from haystack.components.retrievers.in_memory import InMemoryEmbeddingRetriever\nfrom haystack_integrations.components.readers.transformers import TransformersExtractiveReader\nfrom haystack.components.embedders import SentenceTransformersTextEmbedder\n\n\nretriever = InMemoryEmbeddingRetriever(document_store=document_store)\nreader = TransformersExtractiveReader()\nreader.warm_up()\n\nextractive_qa_pipeline = Pipeline()\n\nextractive_qa_pipeline.add_component(instance=SentenceTransformersTextEmbedder(model=model), name=\"embedder\")\nextractive_qa_pipeline.add_component(instance=retriever, name=\"retriever\")\nextractive_qa_pipeline.add_component(instance=reader, name=\"reader\")\n\nextractive_qa_pipeline.connect(\"embedder.embedding\", \"retriever.query_embedding\")\nextractive_qa_pipeline.connect(\"retriever.documents\", \"reader.documents\")"
   },
   {
    "cell_type": "markdown",
@@ -590,26 +292,7 @@
    "metadata": {
     "id": "GOKWgMDCWGRd"
    },
-   "source": [
-    "## `ExtractiveReader`: a closer look\n",
-    "\n",
-    "Here's an example answer:\n",
-    "```python\n",
-    "[ExtractedAnswer(query='Who was Pliny the Elder?', score=0.8306006193161011, data='Roman writer', document=Document(id=bb2c5f3d2e2e2bf28d599c7b686ab47ba10fbc13c07279e612d8632af81e5d71, content: 'The Roman writer Pliny the Elder, writing in the first century AD, argued that the Great Pyramid had...', meta: {'url': 'https://en.wikipedia.org/wiki/Great_Pyramid_of_Giza', '_split_id': 16}\n",
-    "```\n",
-    "\n",
-    "The confidence score ranges from 0 to 1. Higher scores mean the model has more confidence in the answer's relevance.\n",
-    "\n",
-    "The Reader sorts the answers based on their probability scores, with higher probability listed first. You can limit the number of answers the Reader returns in the optional `top_k` parameter.\n",
-    "\n",
-    "By default, the Reader sets a `no_answer=True` parameter. This param returns an `ExtractedAnswer` with no text, and the probability that none of the returned answers are correct.\n",
-    "\n",
-    "```python\n",
-    "ExtractedAnswer(query='Who was Pliny the Elder?', score=0.04606167031102615, data=None, document=None, context=None, document_offset=None, context_offset=None, meta={})]}}\n",
-    "```\n",
-    "\n",
-    "`.0.04606167031102615` means the model is fairly confident the provided answers are correct in this case. You can disable this behavior and return only answers by setting the `no_answer` param to `False` when initializing your `ExtractiveReader`.\n"
-   ]
+   "source": "## `TransformersExtractiveReader`: a closer look\n\nHere's an example answer:\n```python\n[ExtractedAnswer(query='Who was Pliny the Elder?', score=0.8306006193161011, data='Roman writer', document=Document(id=bb2c5f3d2e2e2bf28d599c7b686ab47ba10fbc13c07279e612d8632af81e5d71, content: 'The Roman writer Pliny the Elder, writing in the first century AD, argued that the Great Pyramid had...', meta: {'url': 'https://en.wikipedia.org/wiki/Great_Pyramid_of_Giza', '_split_id': 16}\n```\n\nThe confidence score ranges from 0 to 1. Higher scores mean the model has more confidence in the answer's relevance.\n\nThe Reader sorts the answers based on their probability scores, with higher probability listed first. You can limit the number of answers the Reader returns in the optional `top_k` parameter.\n\nBy default, the Reader sets a `no_answer=True` parameter. This param returns an `ExtractedAnswer` with no text, and the probability that none of the returned answers are correct.\n\n```python\nExtractedAnswer(query='Who was Pliny the Elder?', score=0.04606167031102615, data=None, document=None, context=None, document_offset=None, context_offset=None, meta={})]}}\n```\n\nA score of `0.04606167031102615` means the model is fairly confident the provided answers are correct in this case. You can disable this behavior and return only answers by setting the `no_answer` param to `False` when initializing your `TransformersExtractiveReader`.\n"
   },
   {
    "cell_type": "markdown",
@@ -647,4 +330,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
+}
\ No newline at end of file
diff --git a/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb b/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb
index 10c93d9..ced5902 100644
--- a/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb
+++ b/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb
@@ -50,11 +50,7 @@
    "metadata": {
     "id": "TNlqD5HeN-gc"
    },
-   "source": [
-    "## Installing Haystack\n",
-    "\n",
-    "To start, install the latest release of Haystack with `pip`:"
-   ]
+   "source": "## Installing Haystack\n\n`TransformersTextRouter`, `TransformersZeroShotTextRouter`, and `TransformersExtractiveReader` are provided by the [`transformers-haystack`](https://haystack.deepset.ai/integrations/huggingface) integration. To start, install the latest release of Haystack together with `transformers-haystack` using `pip`:"
   },
   {
    "cell_type": "code",
@@ -64,12 +60,7 @@
     "id": "CjA5n5lMN-gd"
    },
    "outputs": [],
-   "source": [
-    "%%bash\n",
-    "\n",
-    "pip install --upgrade pip\n",
-    "pip install haystack-ai torch sentencepiece datasets sentence-transformers \"transformers<5\""
-   ]
+   "source": "%%bash\n\npip install --upgrade pip\npip install haystack-ai transformers-haystack torch sentencepiece datasets sentence-transformers \"transformers<5\""
   },
   {
    "cell_type": "markdown",
@@ -91,12 +82,7 @@
     "id": "XhPMEqBzxA8V"
    },
    "outputs": [],
-   "source": [
-    "from haystack.components.routers import TransformersTextRouter\n",
-    "\n",
-    "text_router = TransformersTextRouter(model=\"shahrukhx01/bert-mini-finetune-question-detection\")\n",
-    "text_router.warm_up()"
-   ]
+   "source": "from haystack_integrations.components.routers.transformers import TransformersTextRouter\n\ntext_router = TransformersTextRouter(model=\"shahrukhx01/bert-mini-finetune-question-detection\")\ntext_router.warm_up()"
   },
   {
    "cell_type": "markdown",
@@ -1311,12 +1297,7 @@
     "id": "xO7sr516vLgu"
    },
    "outputs": [],
-   "source": [
-    "from haystack.components.routers import TransformersZeroShotTextRouter\n",
-    "\n",
-    "text_router = TransformersZeroShotTextRouter(labels=[\"music\", \"cinema\"])\n",
-    "text_router.warm_up()"
-   ]
+   "source": "from haystack_integrations.components.routers.transformers import TransformersZeroShotTextRouter\n\ntext_router = TransformersZeroShotTextRouter(labels=[\"music\", \"cinema\"])\ntext_router.warm_up()"
   },
   {
    "cell_type": "code",
@@ -1646,7 +1627,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
+   "execution_count": null,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/",
@@ -1655,307 +1636,8 @@
     "id": "1ZULHEBVmqq2",
     "outputId": "50bfdccc-d04c-40f8-d616-9da8f8356b40"
    },
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "Asking to truncate to max_length but no maximum length is provided and the model has no predefined maximum length. Default to no truncation.\n"
-     ]
-    },
-    {
-     "data": {
-      "application/vnd.google.colaboratory.intrinsic+json": {
-       "summary": "{\n  \"name\": \"pd\",\n  \"rows\": 3,\n  \"fields\": [\n    {\n      \"column\": \"Query\",\n      \"properties\": {\n        \"dtype\": \"string\",\n        \"num_unique_values\": 3,\n        \"samples\": [\n          \"Who was the father of Arya Stark\",\n          \"Who was the father of Luke Skywalker\",\n          \"Who was the father of Frodo Baggins\"\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    },\n    {\n      \"column\": \"Output Branch\",\n      \"properties\": {\n        \"dtype\": \"string\",\n        \"num_unique_values\": 3,\n        \"samples\": [\n          \"Game of Thrones\",\n          \"Star Wars\",\n          \"Lord of the Rings\"\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    }\n  ]\n}",
-       "type": "dataframe"
-      },
-      "text/html": [
-       "\n",
-       "  <div id=\"df-d2c38e9b-e8bd-44c9-9509-bf349740a7ed\" class=\"colab-df-container\">\n",
-       "    <div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Query</th>\n",
-       "      <th>Output Branch</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>Who was the father of Arya Stark</td>\n",
-       "      <td>Game of Thrones</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>Who was the father of Luke Skywalker</td>\n",
-       "      <td>Star Wars</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>Who was the father of Frodo Baggins</td>\n",
-       "      <td>Lord of the Rings</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>\n",
-       "    <div class=\"colab-df-buttons\">\n",
-       "\n",
-       "  <div class=\"colab-df-container\">\n",
-       "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-d2c38e9b-e8bd-44c9-9509-bf349740a7ed')\"\n",
-       "            title=\"Convert this dataframe to an interactive table.\"\n",
-       "            style=\"display:none;\">\n",
-       "\n",
-       "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\" viewBox=\"0 -960 960 960\">\n",
-       "    <path d=\"M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z\"/>\n",
-       "  </svg>\n",
-       "    </button>\n",
-       "\n",
-       "  <style>\n",
-       "    .colab-df-container {\n",
-       "      display:flex;\n",
-       "      gap: 12px;\n",
-       "    }\n",
-       "\n",
-       "    .colab-df-convert {\n",
-       "      background-color: #E8F0FE;\n",
-       "      border: none;\n",
-       "      border-radius: 50%;\n",
-       "      cursor: pointer;\n",
-       "      display: none;\n",
-       "      fill: #1967D2;\n",
-       "      height: 32px;\n",
-       "      padding: 0 0 0 0;\n",
-       "      width: 32px;\n",
-       "    }\n",
-       "\n",
-       "    .colab-df-convert:hover {\n",
-       "      background-color: #E2EBFA;\n",
-       "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
-       "      fill: #174EA6;\n",
-       "    }\n",
-       "\n",
-       "    .colab-df-buttons div {\n",
-       "      margin-bottom: 4px;\n",
-       "    }\n",
-       "\n",
-       "    [theme=dark] .colab-df-convert {\n",
-       "      background-color: #3B4455;\n",
-       "      fill: #D2E3FC;\n",
-       "    }\n",
-       "\n",
-       "    [theme=dark] .colab-df-convert:hover {\n",
-       "      background-color: #434B5C;\n",
-       "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
-       "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
-       "      fill: #FFFFFF;\n",
-       "    }\n",
-       "  </style>\n",
-       "\n",
-       "    <script>\n",
-       "      const buttonEl =\n",
-       "        document.querySelector('#df-d2c38e9b-e8bd-44c9-9509-bf349740a7ed button.colab-df-convert');\n",
-       "      buttonEl.style.display =\n",
-       "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
-       "\n",
-       "      async function convertToInteractive(key) {\n",
-       "        const element = document.querySelector('#df-d2c38e9b-e8bd-44c9-9509-bf349740a7ed');\n",
-       "        const dataTable =\n",
-       "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
-       "                                                    [key], {});\n",
-       "        if (!dataTable) return;\n",
-       "\n",
-       "        const docLinkHtml = 'Like what you see? Visit the ' +\n",
-       "          '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
-       "          + ' to learn more about interactive tables.';\n",
-       "        element.innerHTML = '';\n",
-       "        dataTable['output_type'] = 'display_data';\n",
-       "        await google.colab.output.renderOutput(dataTable, element);\n",
-       "        const docLink = document.createElement('div');\n",
-       "        docLink.innerHTML = docLinkHtml;\n",
-       "        element.appendChild(docLink);\n",
-       "      }\n",
-       "    </script>\n",
-       "  </div>\n",
-       "\n",
-       "\n",
-       "<div id=\"df-65429ad9-ffeb-4c0f-b2dd-7f25bc6c8db2\">\n",
-       "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-65429ad9-ffeb-4c0f-b2dd-7f25bc6c8db2')\"\n",
-       "            title=\"Suggest charts\"\n",
-       "            style=\"display:none;\">\n",
-       "\n",
-       "<svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
-       "     width=\"24px\">\n",
-       "    <g>\n",
-       "        <path d=\"M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z\"/>\n",
-       "    </g>\n",
-       "</svg>\n",
-       "  </button>\n",
-       "\n",
-       "<style>\n",
-       "  .colab-df-quickchart {\n",
-       "      --bg-color: #E8F0FE;\n",
-       "      --fill-color: #1967D2;\n",
-       "      --hover-bg-color: #E2EBFA;\n",
-       "      --hover-fill-color: #174EA6;\n",
-       "      --disabled-fill-color: #AAA;\n",
-       "      --disabled-bg-color: #DDD;\n",
-       "  }\n",
-       "\n",
-       "  [theme=dark] .colab-df-quickchart {\n",
-       "      --bg-color: #3B4455;\n",
-       "      --fill-color: #D2E3FC;\n",
-       "      --hover-bg-color: #434B5C;\n",
-       "      --hover-fill-color: #FFFFFF;\n",
-       "      --disabled-bg-color: #3B4455;\n",
-       "      --disabled-fill-color: #666;\n",
-       "  }\n",
-       "\n",
-       "  .colab-df-quickchart {\n",
-       "    background-color: var(--bg-color);\n",
-       "    border: none;\n",
-       "    border-radius: 50%;\n",
-       "    cursor: pointer;\n",
-       "    display: none;\n",
-       "    fill: var(--fill-color);\n",
-       "    height: 32px;\n",
-       "    padding: 0;\n",
-       "    width: 32px;\n",
-       "  }\n",
-       "\n",
-       "  .colab-df-quickchart:hover {\n",
-       "    background-color: var(--hover-bg-color);\n",
-       "    box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
-       "    fill: var(--button-hover-fill-color);\n",
-       "  }\n",
-       "\n",
-       "  .colab-df-quickchart-complete:disabled,\n",
-       "  .colab-df-quickchart-complete:disabled:hover {\n",
-       "    background-color: var(--disabled-bg-color);\n",
-       "    fill: var(--disabled-fill-color);\n",
-       "    box-shadow: none;\n",
-       "  }\n",
-       "\n",
-       "  .colab-df-spinner {\n",
-       "    border: 2px solid var(--fill-color);\n",
-       "    border-color: transparent;\n",
-       "    border-bottom-color: var(--fill-color);\n",
-       "    animation:\n",
-       "      spin 1s steps(1) infinite;\n",
-       "  }\n",
-       "\n",
-       "  @keyframes spin {\n",
-       "    0% {\n",
-       "      border-color: transparent;\n",
-       "      border-bottom-color: var(--fill-color);\n",
-       "      border-left-color: var(--fill-color);\n",
-       "    }\n",
-       "    20% {\n",
-       "      border-color: transparent;\n",
-       "      border-left-color: var(--fill-color);\n",
-       "      border-top-color: var(--fill-color);\n",
-       "    }\n",
-       "    30% {\n",
-       "      border-color: transparent;\n",
-       "      border-left-color: var(--fill-color);\n",
-       "      border-top-color: var(--fill-color);\n",
-       "      border-right-color: var(--fill-color);\n",
-       "    }\n",
-       "    40% {\n",
-       "      border-color: transparent;\n",
-       "      border-right-color: var(--fill-color);\n",
-       "      border-top-color: var(--fill-color);\n",
-       "    }\n",
-       "    60% {\n",
-       "      border-color: transparent;\n",
-       "      border-right-color: var(--fill-color);\n",
-       "    }\n",
-       "    80% {\n",
-       "      border-color: transparent;\n",
-       "      border-right-color: var(--fill-color);\n",
-       "      border-bottom-color: var(--fill-color);\n",
-       "    }\n",
-       "    90% {\n",
-       "      border-color: transparent;\n",
-       "      border-bottom-color: var(--fill-color);\n",
-       "    }\n",
-       "  }\n",
-       "</style>\n",
-       "\n",
-       "  <script>\n",
-       "    async function quickchart(key) {\n",
-       "      const quickchartButtonEl =\n",
-       "        document.querySelector('#' + key + ' button');\n",
-       "      quickchartButtonEl.disabled = true;  // To prevent multiple clicks.\n",
-       "      quickchartButtonEl.classList.add('colab-df-spinner');\n",
-       "      try {\n",
-       "        const charts = await google.colab.kernel.invokeFunction(\n",
-       "            'suggestCharts', [key], {});\n",
-       "      } catch (error) {\n",
-       "        console.error('Error during call to suggestCharts:', error);\n",
-       "      }\n",
-       "      quickchartButtonEl.classList.remove('colab-df-spinner');\n",
-       "      quickchartButtonEl.classList.add('colab-df-quickchart-complete');\n",
-       "    }\n",
-       "    (() => {\n",
-       "      let quickchartButtonEl =\n",
-       "        document.querySelector('#df-65429ad9-ffeb-4c0f-b2dd-7f25bc6c8db2 button');\n",
-       "      quickchartButtonEl.style.display =\n",
-       "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
-       "    })();\n",
-       "  </script>\n",
-       "</div>\n",
-       "\n",
-       "    </div>\n",
-       "  </div>\n"
-      ],
-      "text/plain": [
-       "                                  Query      Output Branch\n",
-       "0      Who was the father of Arya Stark    Game of Thrones\n",
-       "1  Who was the father of Luke Skywalker          Star Wars\n",
-       "2   Who was the father of Frodo Baggins  Lord of the Rings"
-      ]
-     },
-     "execution_count": 14,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "from haystack.components.routers import TransformersZeroShotTextRouter\n",
-    "\n",
-    "text_router = TransformersZeroShotTextRouter(labels=[\"Game of Thrones\", \"Star Wars\", \"Lord of the Rings\"])\n",
-    "text_router.warm_up()\n",
-    "\n",
-    "queries = [\n",
-    "    \"Who was the father of Arya Stark\",  # Game of Thrones\n",
-    "    \"Who was the father of Luke Skywalker\",  # Star Wars\n",
-    "    \"Who was the father of Frodo Baggins\",  # Lord of the Rings\n",
-    "]\n",
-    "\n",
-    "results = {\"Query\": [], \"Output Branch\": []}\n",
-    "\n",
-    "for query in queries:\n",
-    "    result = text_router.run(text=query)\n",
-    "    results[\"Query\"].append(query)\n",
-    "    results[\"Output Branch\"].append(next(iter(result)))\n",
-    "\n",
-    "pd.DataFrame.from_dict(results)"
-   ]
+   "outputs": [],
+   "source": "from haystack_integrations.components.routers.transformers import TransformersZeroShotTextRouter\n\ntext_router = TransformersZeroShotTextRouter(labels=[\"Game of Thrones\", \"Star Wars\", \"Lord of the Rings\"])\ntext_router.warm_up()\n\nqueries = [\n    \"Who was the father of Arya Stark\",  # Game of Thrones\n    \"Who was the father of Luke Skywalker\",  # Star Wars\n    \"Who was the father of Frodo Baggins\",  # Lord of the Rings\n]\n\nresults = {\"Query\": [], \"Output Branch\": []}\n\nfor query in queries:\n    result = text_router.run(text=query)\n    results[\"Query\"].append(query)\n    results[\"Output Branch\"].append(next(iter(result)))\n\npd.DataFrame.from_dict(results)"
   },
   {
    "cell_type": "markdown",
@@ -2384,7 +2066,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 22,
+   "execution_count": null,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -2392,42 +2074,8 @@
     "id": "BIisEJrzDr-9",
     "outputId": "86043b13-a035-4fde-ebc8-d9cdddaedfe8"
    },
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "<haystack.core.pipeline.pipeline.Pipeline object at 0x79e77e697940>\n",
-       "🚅 Components\n",
-       "  - bm25_retriever_0: InMemoryBM25Retriever\n",
-       "  - bm25_retriever_1: InMemoryBM25Retriever\n",
-       "  - text_router: TransformersTextRouter\n",
-       "  - reader: ExtractiveReader\n",
-       "🛤️ Connections\n",
-       "  - bm25_retriever_0.documents -> reader.documents (List[Document])\n",
-       "  - text_router.LABEL_0 -> bm25_retriever_0.query (str)\n",
-       "  - text_router.LABEL_1 -> bm25_retriever_1.query (str)"
-      ]
-     },
-     "execution_count": 22,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "from haystack.components.readers import ExtractiveReader\n",
-    "\n",
-    "query_classification_pipeline = Pipeline()\n",
-    "query_classification_pipeline.add_component(\"bm25_retriever_0\", InMemoryBM25Retriever(document_store))\n",
-    "query_classification_pipeline.add_component(\"bm25_retriever_1\", InMemoryBM25Retriever(document_store))\n",
-    "query_classification_pipeline.add_component(\n",
-    "    \"text_router\", TransformersTextRouter(model=\"shahrukhx01/question-vs-statement-classifier\")\n",
-    ")\n",
-    "query_classification_pipeline.add_component(\"reader\", ExtractiveReader())\n",
-    "\n",
-    "query_classification_pipeline.connect(\"text_router.LABEL_0\", \"bm25_retriever_0\")\n",
-    "query_classification_pipeline.connect(\"bm25_retriever_0\", \"reader\")\n",
-    "query_classification_pipeline.connect(\"text_router.LABEL_1\", \"bm25_retriever_1\")"
-   ]
+   "outputs": [],
+   "source": "from haystack_integrations.components.readers.transformers import TransformersExtractiveReader\n\nquery_classification_pipeline = Pipeline()\nquery_classification_pipeline.add_component(\"bm25_retriever_0\", InMemoryBM25Retriever(document_store))\nquery_classification_pipeline.add_component(\"bm25_retriever_1\", InMemoryBM25Retriever(document_store))\nquery_classification_pipeline.add_component(\n    \"text_router\", TransformersTextRouter(model=\"shahrukhx01/question-vs-statement-classifier\")\n)\nquery_classification_pipeline.add_component(\"reader\", TransformersExtractiveReader())\n\nquery_classification_pipeline.connect(\"text_router.LABEL_0\", \"bm25_retriever_0\")\nquery_classification_pipeline.connect(\"bm25_retriever_0\", \"reader\")\nquery_classification_pipeline.connect(\"text_router.LABEL_1\", \"bm25_retriever_1\")"
   },
   {
    "cell_type": "markdown",
@@ -2696,4 +2344,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
+}
\ No newline at end of file
diff --git a/tutorials/44_Creating_Custom_SuperComponents.ipynb b/tutorials/44_Creating_Custom_SuperComponents.ipynb
index c3f27b0..96fb927 100644
--- a/tutorials/44_Creating_Custom_SuperComponents.ipynb
+++ b/tutorials/44_Creating_Custom_SuperComponents.ipynb
@@ -5,14 +5,7 @@
    "metadata": {
     "id": "2OvkPji9O-qX"
    },
-   "source": [
-    "# Tutorial: Creating Custom SuperComponents\n",
-    "\n",
-    "- **Level**: Intermediate\n",
-    "- **Time to complete**: 20 minutes\n",
-    "- **Concepts and Components Used**: [`@super_component`](https://docs.haystack.deepset.ai/docs/supercomponents), [`Pipeline`](https://docs.haystack.deepset.ai/docs/pipelines), [`DocumentJoiner`](https://docs.haystack.deepset.ai/docs/documentjoiner), [`SentenceTransformersTextEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder), [`InMemoryBM25Retriever`](https://docs.haystack.deepset.ai/docs/inmemorybm25retriever), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), [`TransformersSimilarityRanker`](https://docs.haystack.deepset.ai/docs/transformerssimilarityranker)\n",
-    "- **Goal**: After completing this tutorial, you'll have learned how to create custom SuperComponents using the `@super_component` decorator to simplify complex pipelines and make them reusable as components."
-   ]
+   "source": "# Tutorial: Creating Custom SuperComponents\n\n- **Level**: Intermediate\n- **Time to complete**: 20 minutes\n- **Concepts and Components Used**: [`@super_component`](https://docs.haystack.deepset.ai/docs/supercomponents), [`Pipeline`](https://docs.haystack.deepset.ai/docs/pipelines), [`DocumentJoiner`](https://docs.haystack.deepset.ai/docs/documentjoiner), [`SentenceTransformersTextEmbedder`](https://docs.haystack.deepset.ai/docs/sentencetransformerstextembedder), [`InMemoryBM25Retriever`](https://docs.haystack.deepset.ai/docs/inmemorybm25retriever), [`InMemoryEmbeddingRetriever`](https://docs.haystack.deepset.ai/docs/inmemoryembeddingretriever), [`SentenceTransformersSimilarityRanker`](https://docs.haystack.deepset.ai/docs/sentencetransformerssimilarityranker)\n- **Goal**: After completing this tutorial, you'll have learned how to create custom SuperComponents using the `@super_component` decorator to simplify complex pipelines and make them reusable as components."
   },
   {
    "cell_type": "markdown",
@@ -261,51 +254,9 @@
      "start_time": "2026-05-26T08:59:55.782346Z"
     }
    },
-   "source": [
-    "from haystack import Document, Pipeline, super_component\n",
-    "from haystack.components.joiners import DocumentJoiner\n",
-    "from haystack.components.embedders import SentenceTransformersTextEmbedder\n",
-    "from haystack.components.rankers import TransformersSimilarityRanker\n",
-    "from haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\n",
-    "from haystack.document_stores.in_memory import InMemoryDocumentStore\n",
-    "\n",
-    "from datasets import load_dataset\n",
-    "\n",
-    "\n",
-    "@super_component\n",
-    "class HybridRetrieverWithRanker:\n",
-    "    def __init__(\n",
-    "        self,\n",
-    "        document_store: InMemoryDocumentStore,\n",
-    "        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n",
-    "        ranker_model: str = \"BAAI/bge-reranker-base\",\n",
-    "    ):\n",
-    "        # Create the components\n",
-    "        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n",
-    "        bm25_retriever = InMemoryBM25Retriever(document_store)\n",
-    "        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n",
-    "        document_joiner = DocumentJoiner()\n",
-    "        ranker = TransformersSimilarityRanker(ranker_model)\n",
-    "\n",
-    "        # Create the pipeline\n",
-    "        self.pipeline = Pipeline()\n",
-    "        self.pipeline.add_component(\"text_embedder\", text_embedder)\n",
-    "        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n",
-    "        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n",
-    "        self.pipeline.add_component(\"document_joiner\", document_joiner)\n",
-    "        self.pipeline.add_component(\"ranker\", ranker)\n",
-    "\n",
-    "        # Connect the components\n",
-    "        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n",
-    "        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n",
-    "        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n",
-    "        self.pipeline.connect(\"document_joiner\", \"ranker\")\n",
-    "\n",
-    "        # Define input mapping\n",
-    "        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", \"ranker.query\"]}"
-   ],
+   "source": "from haystack import Document, Pipeline, super_component\nfrom haystack.components.joiners import DocumentJoiner\nfrom haystack.components.embedders import SentenceTransformersTextEmbedder\nfrom haystack.components.rankers import SentenceTransformersSimilarityRanker\nfrom haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\nfrom haystack.document_stores.in_memory import InMemoryDocumentStore\n\nfrom datasets import load_dataset\n\n\n@super_component\nclass HybridRetrieverWithRanker:\n    def __init__(\n        self,\n        document_store: InMemoryDocumentStore,\n        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n        ranker_model: str = \"BAAI/bge-reranker-base\",\n    ):\n        # Create the components\n        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n        bm25_retriever = InMemoryBM25Retriever(document_store)\n        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n        document_joiner = DocumentJoiner()\n        ranker = SentenceTransformersSimilarityRanker(ranker_model)\n\n        # Create the pipeline\n        self.pipeline = Pipeline()\n        self.pipeline.add_component(\"text_embedder\", text_embedder)\n        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n        self.pipeline.add_component(\"document_joiner\", document_joiner)\n        self.pipeline.add_component(\"ranker\", ranker)\n\n        # Connect the components\n        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"document_joiner\", \"ranker\")\n\n        # Define input mapping\n        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", \"ranker.query\"]}",
    "outputs": [],
-   "execution_count": 5
+   "execution_count": null
   },
   {
    "cell_type": "code",
@@ -444,16 +395,7 @@
    "metadata": {
     "id": "xtORWP3_0FAU"
    },
-   "source": [
-    "### Comparing the Two Retrievers\n",
-    "\n",
-    "The main differences between the two retrievers are:\n",
-    "\n",
-    "1. **Added Ranker Component**: The second version includes a `TransformersSimilarityRanker` that re-ranks the documents based on their semantic similarity to the query.\n",
-    "2. **Updated Input Mapping**: We added `\"text_embedder.text\"`, `\"bm25_retriever.query\"` and `\"ranker.query\"` to the input mapping to ensure the input query is sent to all three components while simplifying the `retriever.run` method.\n",
-    "\n",
-    "The ranker can significantly improve the quality of the results by re-ranking the documents based on their semantic similarity to the query, even if they were not ranked highly by the initial retrievers."
-   ]
+   "source": "### Comparing the Two Retrievers\n\nThe main differences between the two retrievers are:\n\n1. **Added Ranker Component**: The second version includes a `SentenceTransformersSimilarityRanker` that re-ranks the documents based on their semantic similarity to the query.\n2. **Updated Input Mapping**: We added `\"text_embedder.text\"`, `\"bm25_retriever.query\"` and `\"ranker.query\"` to the input mapping to ensure the input query is sent to all three components while simplifying the `retriever.run` method.\n\nThe ranker can significantly improve the quality of the results by re-ranking the documents based on their semantic similarity to the query, even if they were not ranked highly by the initial retrievers."
   },
   {
    "cell_type": "markdown",
@@ -560,58 +502,9 @@
      "start_time": "2026-05-26T09:01:35.685324Z"
     }
    },
-   "source": [
-    "from haystack import Document, Pipeline, super_component\n",
-    "from haystack.components.joiners import DocumentJoiner\n",
-    "from haystack.components.embedders import SentenceTransformersTextEmbedder\n",
-    "from haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\n",
-    "from haystack.components.rankers import TransformersSimilarityRanker\n",
-    "from haystack.document_stores.in_memory import InMemoryDocumentStore\n",
-    "\n",
-    "\n",
-    "@super_component\n",
-    "class AdvancedHybridRetriever:\n",
-    "    def __init__(\n",
-    "        self,\n",
-    "        document_store: InMemoryDocumentStore,\n",
-    "        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n",
-    "        ranker_model: str = \"BAAI/bge-reranker-base\",\n",
-    "    ):\n",
-    "        # Create the components\n",
-    "        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n",
-    "        bm25_retriever = InMemoryBM25Retriever(document_store)\n",
-    "        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n",
-    "        document_joiner = DocumentJoiner()\n",
-    "        ranker = TransformersSimilarityRanker(ranker_model)\n",
-    "\n",
-    "        # Create the pipeline\n",
-    "        self.pipeline = Pipeline()\n",
-    "        self.pipeline.add_component(\"text_embedder\", text_embedder)\n",
-    "        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n",
-    "        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n",
-    "        self.pipeline.add_component(\"document_joiner\", document_joiner)\n",
-    "        self.pipeline.add_component(\"ranker\", ranker)\n",
-    "\n",
-    "        # Connect the components\n",
-    "        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n",
-    "        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n",
-    "        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n",
-    "        self.pipeline.connect(\"document_joiner\", \"ranker\")\n",
-    "\n",
-    "        # Define input and output mappings\n",
-    "        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", \"ranker.query\"]}\n",
-    "\n",
-    "        # Expose outputs from multiple components, including non-leaf components\n",
-    "        self.output_mapping = {\n",
-    "            \"bm25_retriever.documents\": \"bm25_documents\",\n",
-    "            \"embedding_retriever.documents\": \"embedding_documents\",\n",
-    "            \"document_joiner.documents\": \"joined_documents\",\n",
-    "            \"ranker.documents\": \"ranked_documents\",\n",
-    "            \"text_embedder.embedding\": \"query_embedding\",\n",
-    "        }"
-   ],
+   "source": "from haystack import Document, Pipeline, super_component\nfrom haystack.components.joiners import DocumentJoiner\nfrom haystack.components.embedders import SentenceTransformersTextEmbedder\nfrom haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\nfrom haystack.components.rankers import SentenceTransformersSimilarityRanker\nfrom haystack.document_stores.in_memory import InMemoryDocumentStore\n\n\n@super_component\nclass AdvancedHybridRetriever:\n    def __init__(\n        self,\n        document_store: InMemoryDocumentStore,\n        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n        ranker_model: str = \"BAAI/bge-reranker-base\",\n    ):\n        # Create the components\n        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n        bm25_retriever = InMemoryBM25Retriever(document_store)\n        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n        document_joiner = DocumentJoiner()\n        ranker = SentenceTransformersSimilarityRanker(ranker_model)\n\n        # Create the pipeline\n        self.pipeline = Pipeline()\n        self.pipeline.add_component(\"text_embedder\", text_embedder)\n        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n        self.pipeline.add_component(\"document_joiner\", document_joiner)\n        self.pipeline.add_component(\"ranker\", ranker)\n\n        # Connect the components\n        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"document_joiner\", \"ranker\")\n\n        # Define input and output mappings\n        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", \"ranker.query\"]}\n\n        # Expose 
outputs from multiple components, including non-leaf components\n        self.output_mapping = {\n            \"bm25_retriever.documents\": \"bm25_documents\",\n            \"embedding_retriever.documents\": \"embedding_documents\",\n            \"document_joiner.documents\": \"joined_documents\",\n            \"ranker.documents\": \"ranked_documents\",\n            \"text_embedder.embedding\": \"query_embedding\",\n        }",
    "outputs": [],
-   "execution_count": 8
+   "execution_count": null
   },
   {
    "cell_type": "code",
@@ -787,4 +680,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
+}
\ No newline at end of file
diff --git a/tutorials/49_TurboQuant_Quantization_with_HuggingFace.ipynb b/tutorials/49_TurboQuant_Quantization_with_HuggingFace.ipynb
index 5532eb0..ce391b7 100644
--- a/tutorials/49_TurboQuant_Quantization_with_HuggingFace.ipynb
+++ b/tutorials/49_TurboQuant_Quantization_with_HuggingFace.ipynb
@@ -3,41 +3,17 @@
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": [
-    "# Compress the KV Cache with TurboQuant and Haystack\n",
-    "\n",
-    "- **Level**: Advanced\n",
-    "- **Time to complete**: 20 min\n",
-    "- **Components Used**: [`HuggingFaceLocalChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfacelocalchatgenerator)\n",
-    "- **Goal**: Apply TurboQuant KV cache compression to a local LLM and measure its memory and throughput impact with Haystack."
-   ]
+   "source": "# Compress the KV Cache with TurboQuant and Haystack\n\n- **Level**: Advanced\n- **Time to complete**: 20 min\n- **Components Used**: [`TransformersChatGenerator`](https://docs.haystack.deepset.ai/docs/transformerschatgenerator)\n- **Goal**: Apply TurboQuant KV cache compression to a local LLM and measure its memory and throughput impact with Haystack."
   },
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": [
-    "## Overview\n",
-    "\n",
-    "Every time an LLM generates a token, it reads and writes a **key-value (KV) cache** - a growing table of intermediate activations that lets the model attend to previous tokens without recomputing them. On long contexts or large models, this cache becomes the dominant consumer of GPU memory.\n",
-    "\n",
-    "[TurboQuant](https://research.google/blog/turboquant-redefining-ai-efficiency-with-extreme-compression/) is a KV cache compression algorithm from Google Research (ICLR 2026) that shrinks those vectors to 3–4 bits per coordinate without any retraining. It works in two stages:\n",
-    "\n",
-    "1. **PolarQuant** - a random orthogonal rotation maps cache vectors to a more uniform distribution, then quantizes them in polar coordinates using Lloyd-Max optimal centroids.\n",
-    "2. **QJL** (Quantized Johnson-Lindenstrauss) - a single extra bit per vector corrects residual errors in attention score computation, preserving accuracy at extreme compression ratios.\n",
-    "\n",
-    "The result: KV memory can drop from 1,639 MiB to 435 MiB (3.76x) on an RTX 4090, with ≥6x reduction validated on server hardware, and near-identical output quality.\n",
-    "\n",
-    "In this tutorial you will use [`turboquant-vllm`](https://github.com/Alberto-Codes/turboquant-vllm), a community implementation of the TurboQuant algorithm, to wire `CompressedDynamicCache` into Haystack's [`HuggingFaceLocalChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfacelocalchatgenerator), run a generation, and measure time-to-first-token, throughput, and live VRAM usage."
-   ]
+   "source": "## Overview\n\nEvery time an LLM generates a token, it reads and writes a **key-value (KV) cache** - a growing table of intermediate activations that lets the model attend to previous tokens without recomputing them. On long contexts or large models, this cache becomes the dominant consumer of GPU memory.\n\n[TurboQuant](https://research.google/blog/turboquant-redefining-ai-efficiency-with-extreme-compression/) is a KV cache compression algorithm from Google Research (ICLR 2026) that shrinks those vectors to 3–4 bits per coordinate without any retraining. It works in two stages:\n\n1. **PolarQuant** - a random orthogonal rotation maps cache vectors to a more uniform distribution, then quantizes them in polar coordinates using Lloyd-Max optimal centroids.\n2. **QJL** (Quantized Johnson-Lindenstrauss) - a single extra bit per vector corrects residual errors in attention score computation, preserving accuracy at extreme compression ratios.\n\nThe result: KV memory can drop from 1,639 MiB to 435 MiB (3.76x) on an RTX 4090, with ≥6x reduction validated on server hardware, and near-identical output quality.\n\nIn this tutorial you will use [`turboquant-vllm`](https://github.com/Alberto-Codes/turboquant-vllm), a community implementation of the TurboQuant algorithm, to wire `CompressedDynamicCache` into Haystack's [`TransformersChatGenerator`](https://docs.haystack.deepset.ai/docs/transformerschatgenerator), run a generation, and measure time-to-first-token, throughput, and live VRAM usage."
   },
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": [
-    "## Installing Haystack and TurboQuant\n",
-    "\n",
-    "First, let's install `haystack-ai` and [`turboquant-vllm`](https://github.com/Alberto-Codes/turboquant-vllm), a community implementation of the TurboQuant algorithm that provides the `CompressedDynamicCache` wrapper."
-   ]
+   "source": "## Installing Haystack and TurboQuant\n\nFirst, let's install `haystack-ai`, the [`transformers-haystack`](https://haystack.deepset.ai/integrations/huggingface) integration (which provides `TransformersChatGenerator`), and [`turboquant-vllm`](https://github.com/Alberto-Codes/turboquant-vllm), a community implementation of the TurboQuant algorithm that provides the `CompressedDynamicCache` wrapper."
   },
   {
    "cell_type": "code",
@@ -47,23 +23,9 @@
      "start_time": "2026-04-03T13:26:24.012627Z"
     }
    },
-   "source": [
-    "%%bash\n",
-    "\n",
-    "pip install -q haystack-ai turboquant-vllm"
-   ],
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "\u001B[1m[\u001B[0m\u001B[34;49mnotice\u001B[0m\u001B[1;39;49m]\u001B[0m\u001B[39;49m A new release of pip is available: \u001B[0m\u001B[31;49m25.0.1\u001B[0m\u001B[39;49m -> \u001B[0m\u001B[32;49m26.0.1\u001B[0m\n",
-      "\u001B[1m[\u001B[0m\u001B[34;49mnotice\u001B[0m\u001B[1;39;49m]\u001B[0m\u001B[39;49m To update, run: \u001B[0m\u001B[32;49mpip install --upgrade pip\u001B[0m\n"
-     ]
-    }
-   ],
-   "execution_count": 1
+   "source": "%%bash\n\npip install -q haystack-ai transformers-haystack turboquant-vllm",
+   "outputs": [],
+   "execution_count": null
   },
   {
    "cell_type": "markdown",
@@ -146,11 +108,7 @@
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": [
-    "## Initializing the Generator\n",
-    "\n",
-    "Now let's set up [`HuggingFaceLocalChatGenerator`](https://docs.haystack.deepset.ai/docs/huggingfacelocalchatgenerator) with a selected model, like `Qwen/Qwen3-4B-Thinking-2507`. We pass the compressed `cache` via `generation_kwargs` so that every decoding step writes through TurboQuant."
-   ]
+   "source": "## Initializing the Generator\n\nNow let's set up [`TransformersChatGenerator`](https://docs.haystack.deepset.ai/docs/transformerschatgenerator) with a selected model, like `Qwen/Qwen3-4B-Thinking-2507`. We pass the compressed `cache` via `generation_kwargs` so that every decoding step writes through TurboQuant."
   },
   {
    "cell_type": "code",
@@ -160,21 +118,9 @@
      "start_time": "2026-04-03T13:27:40.873264Z"
     }
    },
-   "source": [
-    "from haystack.components.generators.chat import HuggingFaceLocalChatGenerator\n",
-    "\n",
-    "generator = HuggingFaceLocalChatGenerator(\n",
-    "    model=\"Qwen/Qwen3-4B-Thinking-2507\",\n",
-    "    task=\"text-generation\",\n",
-    "    generation_kwargs={\n",
-    "        \"past_key_values\": cache,\n",
-    "        \"use_cache\": True,\n",
-    "    },\n",
-    "    streaming_callback=timing_callback,\n",
-    ")"
-   ],
+   "source": "from haystack_integrations.components.generators.transformers import TransformersChatGenerator\n\ngenerator = TransformersChatGenerator(\n    model=\"Qwen/Qwen3-4B-Thinking-2507\",\n    task=\"text-generation\",\n    generation_kwargs={\n        \"past_key_values\": cache,\n        \"use_cache\": True,\n    },\n    streaming_callback=timing_callback,\n)",
    "outputs": [],
-   "execution_count": 4
+   "execution_count": null
   },
   {
    "cell_type": "markdown",
@@ -352,4 +298,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}
+}
\ No newline at end of file

From db9ae7b0ed4126bbb753719c26315bba34d7d15e Mon Sep 17 00:00:00 2001
From: anakin87 <stefanofiorucci@gmail.com>
Date: Wed, 10 Jun 2026 15:12:02 +0200
Subject: [PATCH 2/6] improvements

---
 index.toml                                    |  4 +--
 tutorials/29_Serializing_Pipelines.ipynb      | 30 +++++++++++--------
 tutorials/34_Extractive_QA_Pipeline.ipynb     |  2 +-
 ...r_and_TransformersZeroShotTextRouter.ipynb |  2 +-
 4 files changed, 22 insertions(+), 16 deletions(-)

diff --git a/index.toml b/index.toml
index 69c02fb..2e6932d 100644
--- a/index.toml
+++ b/index.toml
@@ -98,7 +98,7 @@ notebook = "34_Extractive_QA_Pipeline.ipynb"
 aliases = []
 completion_time = "10 min"
 created_at = 2024-02-09
-dependencies = ["accelerate", "sentence-transformers", "datasets", "transformers<5", "transformers-haystack"]
+dependencies = ["accelerate", "sentence-transformers", "datasets", "transformers-haystack"]
 
 [[tutorial]]
 title = "Evaluating RAG Pipelines"
@@ -154,7 +154,7 @@ notebook = "41_Query_Classification_with_TransformersTextRouter_and_Transformers
 aliases = []
 completion_time = "25 min"
 created_at = 2024-10-15
-dependencies = ["sentence-transformers>=4.1.0", "gradio", "torch", "sentencepiece", "datasets", "accelerate", "transformers<5", "transformers-haystack"]
+dependencies = ["sentence-transformers>=4.1.0", "gradio", "datasets", "accelerate", "transformers-haystack"]
 
 [[tutorial]]
 title = "Retrieving a Context Window Around a Sentence"
diff --git a/tutorials/29_Serializing_Pipelines.ipynb b/tutorials/29_Serializing_Pipelines.ipynb
index 64fc550..64449b0 100644
--- a/tutorials/29_Serializing_Pipelines.ipynb
+++ b/tutorials/29_Serializing_Pipelines.ipynb
@@ -102,7 +102,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
+   "execution_count": null,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -120,23 +120,26 @@
       "    init_parameters:\n",
       "      required_variables: null\n",
       "      template:\n",
-      "      - _content:\n",
+      "      - content:\n",
       "        - text: '\n",
       "\n",
-      "          Please create a summary about the following topic:\n",
+      "            Please create a summary about the following topic:\n",
       "\n",
-      "          {{ topic }}\n",
+      "            {{ topic }}\n",
       "\n",
-      "          '\n",
-      "        _meta: {}\n",
-      "        _name: null\n",
-      "        _role: user\n",
+      "            '\n",
+      "        meta: {}\n",
+      "        name: null\n",
+      "        role: user\n",
       "      variables: null\n",
       "    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n",
       "  llm:\n",
       "    init_parameters:\n",
+      "      chat_template: null\n",
+      "      enable_thinking: false\n",
       "      generation_kwargs:\n",
       "        max_new_tokens: 150\n",
+      "        return_full_text: false\n",
       "        stop_sequences: []\n",
       "      huggingface_pipeline_kwargs:\n",
       "        device: cpu\n",
@@ -149,7 +152,10 @@
       "        - HF_TOKEN\n",
       "        strict: false\n",
       "        type: env_var\n",
-      "    type: haystack.components.generators.chat.hugging_face_local.HuggingFaceLocalChatGenerator\n",
+      "      tool_parsing_function: haystack_integrations.components.generators.transformers.chat.chat_generator.default_tool_parser\n",
+      "      tools: null\n",
+      "    type: haystack_integrations.components.generators.transformers.chat.chat_generator.TransformersChatGenerator\n",
+      "connection_type_validation: true\n",
       "connections:\n",
       "- receiver: llm.messages\n",
       "  sender: builder.prompt\n",
@@ -170,7 +176,7 @@
    "metadata": {
     "id": "0C7zGsUCGszq"
    },
-   "source": "You should get a pipeline YAML that looks like the following:\n\n```yaml\ncomponents:\n  builder:\n    init_parameters:\n      required_variables: null\n      template:\n      - _content:\n        - text: '\n\n            Please create a summary about the following topic:\n\n            {{ topic }}\n\n            '\n        _meta: {}\n        _name: null\n        _role: user\n      variables: null\n    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n  llm:\n    init_parameters:\n      chat_template: null\n      enable_thinking: false\n      generation_kwargs:\n        max_new_tokens: 150\n      huggingface_pipeline_kwargs:\n        device: cpu\n        model: Qwen/Qwen2.5-1.5B-Instruct\n        task: text-generation\n      streaming_callback: null\n      token:\n        env_vars:\n        - HF_API_TOKEN\n        - HF_TOKEN\n        strict: false\n        type: env_var\n      tool_parsing_function: haystack_integrations.components.generators.transformers.chat.chat_generator.default_tool_parser\n      tools: null\n    type: haystack_integrations.components.generators.transformers.chat.chat_generator.TransformersChatGenerator\nconnections:\n- receiver: llm.messages\n  sender: builder.prompt\nmax_runs_per_component: 100\nmetadata: {}\n\n```"
+   "source": "You should get a pipeline YAML that looks like the following:\n\n```yaml\ncomponents:\n  builder:\n    init_parameters:\n      required_variables: null\n      template:\n      - content:\n        - text: '\n\n            Please create a summary about the following topic:\n\n            {{ topic }}\n\n            '\n        meta: {}\n        name: null\n        role: user\n      variables: null\n    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n  llm:\n    init_parameters:\n      chat_template: null\n      enable_thinking: false\n      generation_kwargs:\n        max_new_tokens: 150\n        return_full_text: false\n        stop_sequences: []\n      huggingface_pipeline_kwargs:\n        device: cpu\n        model: Qwen/Qwen2.5-1.5B-Instruct\n        task: text-generation\n      streaming_callback: null\n      token:\n        env_vars:\n        - HF_API_TOKEN\n        - HF_TOKEN\n        strict: false\n        type: env_var\n      tool_parsing_function: haystack_integrations.components.generators.transformers.chat.chat_generator.default_tool_parser\n      tools: null\n    type: haystack_integrations.components.generators.transformers.chat.chat_generator.TransformersChatGenerator\nconnection_type_validation: true\nconnections:\n- receiver: llm.messages\n  sender: builder.prompt\nmax_runs_per_component: 100\nmetadata: {}\n\n```"
   },
   {
    "cell_type": "markdown",
@@ -190,7 +196,7 @@
     "id": "U332-VjovFfn"
    },
    "outputs": [],
-   "source": "yaml_pipeline = \"\"\"\ncomponents:\n  builder:\n    init_parameters:\n      template:\n      - _content:\n        - text: 'Please translate the following to French: \\n{{ sentence }}\\n'\n        _meta: {}\n        _name: null\n        _role: user\n      variables: null\n    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n  llm:\n    init_parameters:\n      generation_kwargs:\n        max_new_tokens: 150\n        stop_sequences: []\n      huggingface_pipeline_kwargs:\n        device: cpu\n        model: Qwen/Qwen2.5-1.5B-Instruct\n        task: text-generation\n      streaming_callback: null\n      chat_template : \"{% for message in messages %}{% if message['role'] == 'user' %}{{ ' ' }}{% endif %}{{ message['content'] }}{% if not loop.last %}{{ '  ' }}{% endif %}{% endfor %}{{ eos_token }}\"\n      token:\n        env_vars:\n        - HF_API_TOKEN\n        - HF_TOKEN\n        strict: false\n        type: env_var\n    type: haystack_integrations.components.generators.transformers.chat.chat_generator.TransformersChatGenerator\nconnections:\n- receiver: llm.messages\n  sender: builder.prompt\nmax_runs_per_component: 100\nmetadata: {}\n\"\"\""
+   "source": "yaml_pipeline = \"\"\"\ncomponents:\n  builder:\n    init_parameters:\n      required_variables: null\n      template:\n      - content:\n        - text: 'Please translate the following to French: \\n{{ sentence }}\\n'\n        meta: {}\n        name: null\n        role: user\n      variables: null\n    type: haystack.components.builders.chat_prompt_builder.ChatPromptBuilder\n  llm:\n    init_parameters:\n      chat_template: \"{% for message in messages %}{% if message['role'] == 'user' %}{{ ' ' }}{% endif %}{{ message['content'] }}{% if not loop.last %}{{ '  ' }}{% endif %}{% endfor %}{{ eos_token }}\"\n      enable_thinking: false\n      generation_kwargs:\n        max_new_tokens: 150\n        return_full_text: false\n        stop_sequences: []\n      huggingface_pipeline_kwargs:\n        device: cpu\n        model: Qwen/Qwen2.5-1.5B-Instruct\n        task: text-generation\n      streaming_callback: null\n      token:\n        env_vars:\n        - HF_API_TOKEN\n        - HF_TOKEN\n        strict: false\n        type: env_var\n      tool_parsing_function: haystack_integrations.components.generators.transformers.chat.chat_generator.default_tool_parser\n      tools: null\n    type: haystack_integrations.components.generators.transformers.chat.chat_generator.TransformersChatGenerator\nconnection_type_validation: true\nconnections:\n- receiver: llm.messages\n  sender: builder.prompt\nmax_runs_per_component: 100\nmetadata: {}\n\"\"\""
   },
   {
    "cell_type": "markdown",
@@ -289,4 +295,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
\ No newline at end of file
+}
diff --git a/tutorials/34_Extractive_QA_Pipeline.ipynb b/tutorials/34_Extractive_QA_Pipeline.ipynb
index 1ece9a0..18dc05c 100644
--- a/tutorials/34_Extractive_QA_Pipeline.ipynb
+++ b/tutorials/34_Extractive_QA_Pipeline.ipynb
@@ -38,7 +38,7 @@
     "id": "rwgpwV4eHVoo"
    },
    "outputs": [],
-   "source": "%%bash\n\npip install haystack-ai transformers-haystack accelerate \"sentence-transformers>=4.1.0\" \"datasets>=2.6.1\" \"transformers<5\""
+   "source": "%%bash\n\npip install haystack-ai transformers-haystack accelerate \"sentence-transformers>=4.1.0\" \"datasets>=2.6.1\""
   },
   {
    "cell_type": "markdown",
diff --git a/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb b/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb
index ced5902..395137e 100644
--- a/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb
+++ b/tutorials/41_Query_Classification_with_TransformersTextRouter_and_TransformersZeroShotTextRouter.ipynb
@@ -60,7 +60,7 @@
     "id": "CjA5n5lMN-gd"
    },
    "outputs": [],
-   "source": "%%bash\n\npip install --upgrade pip\npip install haystack-ai transformers-haystack torch sentencepiece datasets sentence-transformers \"transformers<5\""
+   "source": "%%bash\n\npip install --upgrade pip\npip install haystack-ai transformers-haystack datasets sentence-transformers"
   },
   {
    "cell_type": "markdown",

From c7cd9dbc02986e2e780931b2f43d7461f818dd16 Mon Sep 17 00:00:00 2001
From: anakin87 <stefanofiorucci@gmail.com>
Date: Thu, 11 Jun 2026 10:09:55 +0200
Subject: [PATCH 3/6] rm accelerate

---
 index.toml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/index.toml b/index.toml
index 2e6932d..f861d31 100644
--- a/index.toml
+++ b/index.toml
@@ -98,7 +98,7 @@ notebook = "34_Extractive_QA_Pipeline.ipynb"
 aliases = []
 completion_time = "10 min"
 created_at = 2024-02-09
-dependencies = ["accelerate", "sentence-transformers", "datasets", "transformers-haystack"]
+dependencies = ["sentence-transformers", "datasets", "transformers-haystack"]
 
 [[tutorial]]
 title = "Evaluating RAG Pipelines"
@@ -154,7 +154,7 @@ notebook = "41_Query_Classification_with_TransformersTextRouter_and_Transformers
 aliases = []
 completion_time = "25 min"
 created_at = 2024-10-15
-dependencies = ["sentence-transformers>=4.1.0", "gradio", "datasets", "accelerate", "transformers-haystack"]
+dependencies = ["sentence-transformers>=4.1.0", "gradio", "datasets", "transformers-haystack"]
 
 [[tutorial]]
 title = "Retrieving a Context Window Around a Sentence"

From bc9c73a95922822a88b0fe55250c3ab0e0e2bf67 Mon Sep 17 00:00:00 2001
From: anakin87 <stefanofiorucci@gmail.com>
Date: Thu, 11 Jun 2026 12:04:29 +0200
Subject: [PATCH 4/6] exclude transformers haystack from cutoff

---
 uv.toml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/uv.toml b/uv.toml
index 3923704..822d47c 100644
--- a/uv.toml
+++ b/uv.toml
@@ -5,3 +5,4 @@ exclude-newer = "P3D"
 # first-party dependencies can be excluded from the global cutoff by adding entries below
 [exclude-newer-package]
 haystack-ai = false
+transformers-haystack = false

From f4357c965266ba84b2e853d9ef2a69dad05b94e6 Mon Sep 17 00:00:00 2001
From: anakin87 <stefanofiorucci@gmail.com>
Date: Thu, 11 Jun 2026 12:17:53 +0200
Subject: [PATCH 5/6] fix

---
 tutorials/44_Creating_Custom_SuperComponents.ipynb | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tutorials/44_Creating_Custom_SuperComponents.ipynb b/tutorials/44_Creating_Custom_SuperComponents.ipynb
index 96fb927..88149fe 100644
--- a/tutorials/44_Creating_Custom_SuperComponents.ipynb
+++ b/tutorials/44_Creating_Custom_SuperComponents.ipynb
@@ -254,7 +254,7 @@
      "start_time": "2026-05-26T08:59:55.782346Z"
     }
    },
-   "source": "from haystack import Document, Pipeline, super_component\nfrom haystack.components.joiners import DocumentJoiner\nfrom haystack.components.embedders import SentenceTransformersTextEmbedder\nfrom haystack.components.rankers import SentenceTransformersSimilarityRanker\nfrom haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\nfrom haystack.document_stores.in_memory import InMemoryDocumentStore\n\nfrom datasets import load_dataset\n\n\n@super_component\nclass HybridRetrieverWithRanker:\n    def __init__(\n        self,\n        document_store: InMemoryDocumentStore,\n        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n        ranker_model: str = \"BAAI/bge-reranker-base\",\n    ):\n        # Create the components\n        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n        bm25_retriever = InMemoryBM25Retriever(document_store)\n        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n        document_joiner = DocumentJoiner()\n        ranker = SentenceTransformersSimilarityRanker(ranker_model)\n\n        # Create the pipeline\n        self.pipeline = Pipeline()\n        self.pipeline.add_component(\"text_embedder\", text_embedder)\n        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n        self.pipeline.add_component(\"document_joiner\", document_joiner)\n        self.pipeline.add_component(\"ranker\", ranker)\n\n        # Connect the components\n        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"document_joiner\", \"ranker\")\n\n        # Define input mapping\n        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", 
\"ranker.query\"]}",
+   "source": "from haystack import Document, Pipeline, super_component\nfrom haystack.components.joiners import DocumentJoiner\nfrom haystack.components.embedders import SentenceTransformersTextEmbedder\nfrom haystack.components.rankers import SentenceTransformersSimilarityRanker\nfrom haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\nfrom haystack.document_stores.in_memory import InMemoryDocumentStore\n\nfrom datasets import load_dataset\n\n\n@super_component\nclass HybridRetrieverWithRanker:\n    def __init__(\n        self,\n        document_store: InMemoryDocumentStore,\n        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n        ranker_model: str = \"BAAI/bge-reranker-base\",\n    ):\n        # Create the components\n        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n        bm25_retriever = InMemoryBM25Retriever(document_store)\n        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n        document_joiner = DocumentJoiner()\n        ranker = SentenceTransformersSimilarityRanker(model=ranker_model)\n\n        # Create the pipeline\n        self.pipeline = Pipeline()\n        self.pipeline.add_component(\"text_embedder\", text_embedder)\n        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n        self.pipeline.add_component(\"document_joiner\", document_joiner)\n        self.pipeline.add_component(\"ranker\", ranker)\n\n        # Connect the components\n        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"document_joiner\", \"ranker\")\n\n        # Define input mapping\n        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", 
\"ranker.query\"]}",
    "outputs": [],
    "execution_count": null
   },
@@ -502,7 +502,7 @@
      "start_time": "2026-05-26T09:01:35.685324Z"
     }
    },
-   "source": "from haystack import Document, Pipeline, super_component\nfrom haystack.components.joiners import DocumentJoiner\nfrom haystack.components.embedders import SentenceTransformersTextEmbedder\nfrom haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\nfrom haystack.components.rankers import SentenceTransformersSimilarityRanker\nfrom haystack.document_stores.in_memory import InMemoryDocumentStore\n\n\n@super_component\nclass AdvancedHybridRetriever:\n    def __init__(\n        self,\n        document_store: InMemoryDocumentStore,\n        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n        ranker_model: str = \"BAAI/bge-reranker-base\",\n    ):\n        # Create the components\n        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n        bm25_retriever = InMemoryBM25Retriever(document_store)\n        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n        document_joiner = DocumentJoiner()\n        ranker = SentenceTransformersSimilarityRanker(ranker_model)\n\n        # Create the pipeline\n        self.pipeline = Pipeline()\n        self.pipeline.add_component(\"text_embedder\", text_embedder)\n        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n        self.pipeline.add_component(\"document_joiner\", document_joiner)\n        self.pipeline.add_component(\"ranker\", ranker)\n\n        # Connect the components\n        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"document_joiner\", \"ranker\")\n\n        # Define input and output mappings\n        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", \"ranker.query\"]}\n\n        # Expose 
outputs from multiple components, including non-leaf components\n        self.output_mapping = {\n            \"bm25_retriever.documents\": \"bm25_documents\",\n            \"embedding_retriever.documents\": \"embedding_documents\",\n            \"document_joiner.documents\": \"joined_documents\",\n            \"ranker.documents\": \"ranked_documents\",\n            \"text_embedder.embedding\": \"query_embedding\",\n        }",
+   "source": "from haystack import Document, Pipeline, super_component\nfrom haystack.components.joiners import DocumentJoiner\nfrom haystack.components.embedders import SentenceTransformersTextEmbedder\nfrom haystack.components.retrievers import InMemoryBM25Retriever, InMemoryEmbeddingRetriever\nfrom haystack.components.rankers import SentenceTransformersSimilarityRanker\nfrom haystack.document_stores.in_memory import InMemoryDocumentStore\n\n\n@super_component\nclass AdvancedHybridRetriever:\n    def __init__(\n        self,\n        document_store: InMemoryDocumentStore,\n        embedder_model: str = \"BAAI/bge-small-en-v1.5\",\n        ranker_model: str = \"BAAI/bge-reranker-base\",\n    ):\n        # Create the components\n        embedding_retriever = InMemoryEmbeddingRetriever(document_store)\n        bm25_retriever = InMemoryBM25Retriever(document_store)\n        text_embedder = SentenceTransformersTextEmbedder(embedder_model)\n        document_joiner = DocumentJoiner()\n        ranker = SentenceTransformersSimilarityRanker(model=ranker_model)\n\n        # Create the pipeline\n        self.pipeline = Pipeline()\n        self.pipeline.add_component(\"text_embedder\", text_embedder)\n        self.pipeline.add_component(\"embedding_retriever\", embedding_retriever)\n        self.pipeline.add_component(\"bm25_retriever\", bm25_retriever)\n        self.pipeline.add_component(\"document_joiner\", document_joiner)\n        self.pipeline.add_component(\"ranker\", ranker)\n\n        # Connect the components\n        self.pipeline.connect(\"text_embedder\", \"embedding_retriever\")\n        self.pipeline.connect(\"bm25_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"embedding_retriever\", \"document_joiner\")\n        self.pipeline.connect(\"document_joiner\", \"ranker\")\n\n        # Define input and output mappings\n        self.input_mapping = {\"query\": [\"text_embedder.text\", \"bm25_retriever.query\", \"ranker.query\"]}\n\n        # Expose 
outputs from multiple components, including non-leaf components\n        self.output_mapping = {\n            \"bm25_retriever.documents\": \"bm25_documents\",\n            \"embedding_retriever.documents\": \"embedding_documents\",\n            \"document_joiner.documents\": \"joined_documents\",\n            \"ranker.documents\": \"ranked_documents\",\n            \"text_embedder.embedding\": \"query_embedding\",\n        }",
    "outputs": [],
    "execution_count": null
   },

From 878523867008ba10e5c789b82aac4cbcc464eda9 Mon Sep 17 00:00:00 2001
From: anakin87 <stefanofiorucci@gmail.com>
Date: Thu, 11 Jun 2026 12:30:01 +0200
Subject: [PATCH 6/6] update eval guide

---
 tutorials/guide_evaluation.ipynb | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tutorials/guide_evaluation.ipynb b/tutorials/guide_evaluation.ipynb
index 15eacb0..65f32d6 100644
--- a/tutorials/guide_evaluation.ipynb
+++ b/tutorials/guide_evaluation.ipynb
@@ -110,7 +110,7 @@
     "### Methods to Improve Generation:\n",
     "\n",
     "- **Ranking**: Incorporate a ranking mechanism into your retrieved documents before providing the context to your prompt\n",
-    "    - **Order by similarity**: Reorder your retrieved documents by similarity using cross-encoder models from Hugging Face with [TransformersSimilarityRanker](https://docs.haystack.deepset.ai/docs/transformerssimilarityranker), Rerank models from Cohere with [CohereRanker](https://docs.haystack.deepset.ai/docs/cohereranker), or Rerankers from Jina with [JinaRanker](https://docs.haystack.deepset.ai/docs/jinaranker)\n",
+    "    - **Order by similarity**: Reorder your retrieved documents by similarity using cross-encoder models from Hugging Face with [SentenceTransformersSimilarityRanker](https://docs.haystack.deepset.ai/docs/sentencetransformerssimilarityranker), Rerank models from Cohere with [CohereRanker](https://docs.haystack.deepset.ai/docs/cohereranker), or Rerankers from Jina with [JinaRanker](https://docs.haystack.deepset.ai/docs/jinaranker)\n",
     "    - **Increase diversity by ranking**: Maximize the overall diversity among your context using sentence-transformers models with [SentenceTransformersDiversityRanker](https://docs.haystack.deepset.ai/docs/sentencetransformersdiversityranker) to help increase the semantic answer similarity (SAS) in LFQA applications.\n",
     "    - **Address the \"Lost in the Middle\" problem by reordering**: Position the most relevant documents at the beginning and end of the context using [LostInTheMiddleRanker](https://docs.haystack.deepset.ai/docs/lostinthemiddleranker) to increase faithfulness.\n",
     "- **Different Generators**: Try different large language models and benchmark the results. The full list of model providers is in [Generators](https://docs.haystack.deepset.ai/docs/generators).\n",