From d51be9edac914e281502075c5267d3e4b74c42fc Mon Sep 17 00:00:00 2001
From: Vladimir Blagojevic <dovlex@gmail.com>
Date: Thu, 12 Oct 2023 13:52:01 +0200
Subject: [PATCH 1/5] Add top_k to SimilarityRanker (#6036)

---
 .../preview/components/rankers/similarity.py  | 24 ++++++++---
 .../components/rankers/test_similarity.py     | 43 +++++++++++++++++--
 2 files changed, 59 insertions(+), 8 deletions(-)

diff --git a/haystack/preview/components/rankers/similarity.py b/haystack/preview/components/rankers/similarity.py
index 7abb370954..66f620294b 100644
--- a/haystack/preview/components/rankers/similarity.py
+++ b/haystack/preview/components/rankers/similarity.py
@@ -1,6 +1,6 @@
 import logging
 from pathlib import Path
-from typing import List, Union, Dict, Any
+from typing import List, Union, Dict, Any, Optional
 
 from haystack.preview import ComponentError, Document, component, default_from_dict, default_to_dict
 from haystack.preview.lazy_imports import LazyImport
@@ -34,17 +34,24 @@ class SimilarityRanker:
     """
 
     def __init__(
-        self, model_name_or_path: Union[str, Path] = "cross-encoder/ms-marco-MiniLM-L-6-v2", device: str = "cpu"
+        self,
+        model_name_or_path: Union[str, Path] = "cross-encoder/ms-marco-MiniLM-L-6-v2",
+        top_k: int = 10,
+        device: str = "cpu",
     ):
         """
         Creates an instance of SimilarityRanker.
 
         :param model_name_or_path: Path to a pre-trained sentence-transformers model.
+        :param top_k: The maximum number of documents to return per query.
         :param device: torch device (for example, cuda:0, cpu, mps) to limit model inference to a specific device.
         """
         torch_and_transformers_import.check()
 
         self.model_name_or_path = model_name_or_path
+        if top_k <= 0:
+            raise ValueError(f"top_k must be > 0, but got {top_k}")
+        self.top_k = top_k
         self.device = device
         self.model = None
         self.tokenizer = None
@@ -63,7 +70,7 @@ def to_dict(self) -> Dict[str, Any]:
         """
         Serialize this component to a dictionary.
         """
-        return default_to_dict(self, device=self.device, model_name_or_path=self.model_name_or_path)
+        return default_to_dict(self, top_k=self.top_k, device=self.device, model_name_or_path=self.model_name_or_path)
 
     @classmethod
     def from_dict(cls, data: Dict[str, Any]) -> "SimilarityRanker":
@@ -73,17 +80,24 @@ def from_dict(cls, data: Dict[str, Any]) -> "SimilarityRanker":
         return default_from_dict(cls, data)
 
     @component.output_types(documents=List[Document])
-    def run(self, query: str, documents: List[Document]):
+    def run(self, query: str, documents: List[Document], top_k: Optional[int] = None):
         """
         Returns a list of documents ranked by their similarity to the given query
 
         :param query: Query string.
         :param documents: List of Documents.
+        :param top_k: The maximum number of documents to return.
         :return: List of Documents sorted by (desc.) similarity with the query.
         """
         if not documents:
             return {"documents": []}
 
+        if top_k is None:
+            top_k = self.top_k
+
+        elif top_k <= 0:
+            raise ValueError(f"top_k must be > 0, but got {top_k}")
+
         # If a model path is provided but the model isn't loaded
         if self.model_name_or_path and not self.model:
             raise ComponentError(
@@ -105,4 +119,4 @@ def run(self, query: str, documents: List[Document]):
             i = sorted_index_tensor.item()
             documents[i].score = similarity_scores[i].item()
             ranked_docs.append(documents[i])
-        return {"documents": ranked_docs}
+        return {"documents": ranked_docs[:top_k]}
diff --git a/test/preview/components/rankers/test_similarity.py b/test/preview/components/rankers/test_similarity.py
index 5ddb3b18dc..cc2486a2cd 100644
--- a/test/preview/components/rankers/test_similarity.py
+++ b/test/preview/components/rankers/test_similarity.py
@@ -11,7 +11,11 @@ def test_to_dict(self):
         data = component.to_dict()
         assert data == {
             "type": "SimilarityRanker",
-            "init_parameters": {"device": "cpu", "model_name_or_path": "cross-encoder/ms-marco-MiniLM-L-6-v2"},
+            "init_parameters": {
+                "device": "cpu",
+                "top_k": 10,
+                "model_name_or_path": "cross-encoder/ms-marco-MiniLM-L-6-v2",
+            },
         }
 
     @pytest.mark.unit
@@ -20,14 +24,22 @@ def test_to_dict_with_custom_init_parameters(self):
         data = component.to_dict()
         assert data == {
             "type": "SimilarityRanker",
-            "init_parameters": {"device": "cpu", "model_name_or_path": "cross-encoder/ms-marco-MiniLM-L-6-v2"},
+            "init_parameters": {
+                "device": "cpu",
+                "top_k": 10,
+                "model_name_or_path": "cross-encoder/ms-marco-MiniLM-L-6-v2",
+            },
         }
 
     @pytest.mark.integration
     def test_from_dict(self):
         data = {
             "type": "SimilarityRanker",
-            "init_parameters": {"device": "cpu", "model_name_or_path": "cross-encoder/ms-marco-MiniLM-L-6-v2"},
+            "init_parameters": {
+                "device": "cpu",
+                "top_k": 10,
+                "model_name_or_path": "cross-encoder/ms-marco-MiniLM-L-6-v2",
+            },
         }
         component = SimilarityRanker.from_dict(data)
         assert component.model_name_or_path == "cross-encoder/ms-marco-MiniLM-L-6-v2"
@@ -72,3 +84,28 @@ def test_raises_component_error_if_model_not_warmed_up(self):
 
         with pytest.raises(ComponentError):
             sampler.run(query="query", documents=[Document(text="document")])
+
+    @pytest.mark.integration
+    @pytest.mark.parametrize(
+        "query,docs_before_texts,expected_first_text",
+        [
+            ("City in Bosnia and Herzegovina", ["Berlin", "Belgrade", "Sarajevo"], "Sarajevo"),
+            ("Machine learning", ["Python", "Bakery in Paris", "Tesla Giga Berlin"], "Python"),
+            ("Cubist movement", ["Nirvana", "Pablo Picasso", "Coffee"], "Pablo Picasso"),
+        ],
+    )
+    def test_run_top_k(self, query, docs_before_texts, expected_first_text):
+        """
+        Test if the component ranks documents correctly with a custom top_k.
+        """
+        ranker = SimilarityRanker(model_name_or_path="cross-encoder/ms-marco-MiniLM-L-6-v2", top_k=2)
+        ranker.warm_up()
+        docs_before = [Document(text=text) for text in docs_before_texts]
+        output = ranker.run(query=query, documents=docs_before)
+        docs_after = output["documents"]
+
+        assert len(docs_after) == 2
+        assert docs_after[0].text == expected_first_text
+
+        sorted_scores = sorted([doc.score for doc in docs_after], reverse=True)
+        assert [doc.score for doc in docs_after] == sorted_scores

From 2c2549f13d87193725d1441faa27ed9cad7de1e3 Mon Sep 17 00:00:00 2001
From: Stefano Fiorucci <44616784+anakin87@users.noreply.github.com>
Date: Thu, 12 Oct 2023 17:52:28 +0200
Subject: [PATCH 2/5] move embedding backends (#6033)

---
 .../embedders/backends}/__init__.py                |  0
 .../backends}/sentence_transformers_backend.py     |  0
 .../sentence_transformers_document_embedder.py     | 14 ++++++++------
 .../sentence_transformers_text_embedder.py         | 12 +++++++-----
 ...est_sentence_transformers_embedding_backend.py} |  8 ++++----
 5 files changed, 19 insertions(+), 15 deletions(-)
 rename haystack/preview/{embedding_backends => components/embedders/backends}/__init__.py (100%)
 rename haystack/preview/{embedding_backends => components/embedders/backends}/sentence_transformers_backend.py (100%)
 rename test/preview/{embedding_backends/test_sentence_transformers.py => components/embedders/test_sentence_transformers_embedding_backend.py} (78%)

diff --git a/haystack/preview/embedding_backends/__init__.py b/haystack/preview/components/embedders/backends/__init__.py
similarity index 100%
rename from haystack/preview/embedding_backends/__init__.py
rename to haystack/preview/components/embedders/backends/__init__.py
diff --git a/haystack/preview/embedding_backends/sentence_transformers_backend.py b/haystack/preview/components/embedders/backends/sentence_transformers_backend.py
similarity index 100%
rename from haystack/preview/embedding_backends/sentence_transformers_backend.py
rename to haystack/preview/components/embedders/backends/sentence_transformers_backend.py
diff --git a/haystack/preview/components/embedders/sentence_transformers_document_embedder.py b/haystack/preview/components/embedders/sentence_transformers_document_embedder.py
index 40ac170aa9..381a2d7d9b 100644
--- a/haystack/preview/components/embedders/sentence_transformers_document_embedder.py
+++ b/haystack/preview/components/embedders/sentence_transformers_document_embedder.py
@@ -1,7 +1,7 @@
 from typing import List, Optional, Union, Dict, Any
 
 from haystack.preview import component, Document, default_to_dict, default_from_dict
-from haystack.preview.embedding_backends.sentence_transformers_backend import (
+from haystack.preview.components.embedders.backends.sentence_transformers_backend import (
     _SentenceTransformersEmbeddingBackendFactory,
 )
 
@@ -29,11 +29,13 @@ def __init__(
         """
         Create a SentenceTransformersDocumentEmbedder component.
 
-        :param model_name_or_path: Local path or name of the model in Hugging Face's model hub, such as ``'sentence-transformers/all-mpnet-base-v2'``.
-        :param device: Device (like 'cuda' / 'cpu') that should be used for computation. If None, checks if a GPU can be used.
+        :param model_name_or_path: Local path or name of the model in Hugging Face's model hub,
+            such as ``'sentence-transformers/all-mpnet-base-v2'``.
+        :param device: Device (like 'cuda' / 'cpu') that should be used for computation.
+            Defaults to CPU.
         :param use_auth_token: The API token used to download private models from Hugging Face.
-                        If this parameter is set to `True`, then the token generated when running
-                        `transformers-cli login` (stored in ~/.huggingface) will be used.
+            If this parameter is set to `True`, then the token generated when running
+            `transformers-cli login` (stored in ~/.huggingface) will be used.
         :param prefix: A string to add to the beginning of each Document text before embedding.
         :param suffix: A string to add to the end of each Document text before embedding.
         :param batch_size: Number of strings to encode at once.
@@ -95,7 +97,7 @@ def run(self, documents: List[Document]):
         Embed a list of Documents.
         The embedding of each Document is stored in the `embedding` field of the Document.
         """
-        if not isinstance(documents, list) or not isinstance(documents[0], Document):
+        if not isinstance(documents, list) or documents and not isinstance(documents[0], Document):
             raise TypeError(
                 "SentenceTransformersDocumentEmbedder expects a list of Documents as input."
                 "In case you want to embed a list of strings, please use the SentenceTransformersTextEmbedder."
diff --git a/haystack/preview/components/embedders/sentence_transformers_text_embedder.py b/haystack/preview/components/embedders/sentence_transformers_text_embedder.py
index c22e04379a..527191b1d5 100644
--- a/haystack/preview/components/embedders/sentence_transformers_text_embedder.py
+++ b/haystack/preview/components/embedders/sentence_transformers_text_embedder.py
@@ -1,7 +1,7 @@
 from typing import List, Optional, Union, Dict, Any
 
 from haystack.preview import component, default_to_dict, default_from_dict
-from haystack.preview.embedding_backends.sentence_transformers_backend import (
+from haystack.preview.components.embedders.backends.sentence_transformers_backend import (
     _SentenceTransformersEmbeddingBackendFactory,
 )
 
@@ -26,11 +26,13 @@ def __init__(
         """
         Create a SentenceTransformersTextEmbedder component.
 
-        :param model_name_or_path: Local path or name of the model in Hugging Face's model hub, such as ``'sentence-transformers/all-mpnet-base-v2'``.
-        :param device: Device (like 'cuda' / 'cpu') that should be used for computation. If None, checks if a GPU can be used.
+        :param model_name_or_path: Local path or name of the model in Hugging Face's model hub,
+            such as ``'sentence-transformers/all-mpnet-base-v2'``.
+        :param device: Device (like 'cuda' / 'cpu') that should be used for computation.
+            Defaults to CPU.
         :param use_auth_token: The API token used to download private models from Hugging Face.
-                        If this parameter is set to `True`, then the token generated when running
-                        `transformers-cli login` (stored in ~/.huggingface) will be used.
+            If this parameter is set to `True`, then the token generated when running
+            `transformers-cli login` (stored in ~/.huggingface) will be used.
         :param prefix: A string to add to the beginning of each text.
         :param suffix: A string to add to the end of each text.
         :param batch_size: Number of strings to encode at once.
diff --git a/test/preview/embedding_backends/test_sentence_transformers.py b/test/preview/components/embedders/test_sentence_transformers_embedding_backend.py
similarity index 78%
rename from test/preview/embedding_backends/test_sentence_transformers.py
rename to test/preview/components/embedders/test_sentence_transformers_embedding_backend.py
index f9f98d0a02..4ac8c55869 100644
--- a/test/preview/embedding_backends/test_sentence_transformers.py
+++ b/test/preview/components/embedders/test_sentence_transformers_embedding_backend.py
@@ -1,12 +1,12 @@
 from unittest.mock import patch
 import pytest
-from haystack.preview.embedding_backends.sentence_transformers_backend import (
+from haystack.preview.components.embedders.backends.sentence_transformers_backend import (
     _SentenceTransformersEmbeddingBackendFactory,
 )
 
 
 @pytest.mark.unit
-@patch("haystack.preview.embedding_backends.sentence_transformers_backend.SentenceTransformer")
+@patch("haystack.preview.components.embedders.backends.sentence_transformers_backend.SentenceTransformer")
 def test_factory_behavior(mock_sentence_transformer):
     embedding_backend = _SentenceTransformersEmbeddingBackendFactory.get_embedding_backend(
         model_name_or_path="my_model", device="cpu"
@@ -21,7 +21,7 @@ def test_factory_behavior(mock_sentence_transformer):
 
 
 @pytest.mark.unit
-@patch("haystack.preview.embedding_backends.sentence_transformers_backend.SentenceTransformer")
+@patch("haystack.preview.components.embedders.backends.sentence_transformers_backend.SentenceTransformer")
 def test_model_initialization(mock_sentence_transformer):
     _SentenceTransformersEmbeddingBackendFactory.get_embedding_backend(
         model_name_or_path="model", device="cpu", use_auth_token="my_token"
@@ -32,7 +32,7 @@ def test_model_initialization(mock_sentence_transformer):
 
 
 @pytest.mark.unit
-@patch("haystack.preview.embedding_backends.sentence_transformers_backend.SentenceTransformer")
+@patch("haystack.preview.components.embedders.backends.sentence_transformers_backend.SentenceTransformer")
 def test_embedding_function_with_kwargs(mock_sentence_transformer):
     embedding_backend = _SentenceTransformersEmbeddingBackendFactory.get_embedding_backend(model_name_or_path="model")
 

From adf7e49af3d8654b7e325fd82d330c65436a0be6 Mon Sep 17 00:00:00 2001
From: ZanSara <sara.zanzottera@deepset.ai>
Date: Thu, 12 Oct 2023 20:50:53 +0100
Subject: [PATCH 3/5] chore: review `all` extra (#6029)

---
 .github/workflows/tests.yml                   | 35 ++++++++++++++++---
 haystack/pipelines/base.py                    |  2 +-
 pyproject.toml                                |  7 ++--
 .../review-all-extras-42d5a3a3d61f5393.yaml   |  3 ++
 test/pipelines/test_ray.py                    | 16 ++++-----
 5 files changed, 44 insertions(+), 19 deletions(-)
 create mode 100644 releasenotes/notes/review-all-extras-42d5a3a3d61f5393.yaml

diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
index 4ecdd1fe85..8650e94c07 100644
--- a/.github/workflows/tests.yml
+++ b/.github/workflows/tests.yml
@@ -124,10 +124,10 @@ jobs:
         include:
           - topic: document_stores
             os: ubuntu-latest
-            dependencies: elasticsearch8,faiss,weaviate,pinecone,opensearch,inference,audio,crawler,preprocessing,file-conversion,pdf,ocr,ray,onnx,beir,metrics,aws,dev
+            dependencies: elasticsearch8,faiss,weaviate,pinecone,opensearch,inference,crawler,preprocessing,file-conversion,pdf,ocr,metrics,dev
           - topic: document_stores
             os: windows-latest
-            dependencies: elasticsearch8,faiss,weaviate,pinecone,opensearch,inference,audio,crawler,preprocessing,file-conversion,pdf,ocr,ray,onnx,beir,metrics,aws,dev
+            dependencies: elasticsearch8,faiss,weaviate,pinecone,opensearch,inference,crawler,preprocessing,file-conversion,pdf,ocr,metrics,dev
     runs-on: ${{ matrix.os }}
     steps:
       - uses: actions/checkout@v4
@@ -329,7 +329,7 @@ jobs:
     runs-on: ${{ matrix.os }}
     services:
       elasticsearch:
-        image: elasticsearch:8.8.0
+        image: elasticsearch:8.10.2
         env:
           discovery.type: "single-node"
           xpack.security.enabled: "false"
@@ -346,9 +346,36 @@ jobs:
       - name: Install Haystack
         run: pip install .[elasticsearch8,dev,preprocessing,inference]
 
+      - name: Make elasticsearch comfortable with a disk almost full
+        run: |
+          curl -X PUT "localhost:9200/_cluster/settings?pretty" -H 'Content-Type: application/json' -d'
+          {
+            "persistent": {
+              "cluster.routing.allocation.disk.watermark.low": "90%",
+              "cluster.routing.allocation.disk.watermark.low.max_headroom": "100GB",
+              "cluster.routing.allocation.disk.watermark.high": "95%",
+              "cluster.routing.allocation.disk.watermark.high.max_headroom": "20GB",
+              "cluster.routing.allocation.disk.watermark.flood_stage": "97%",
+              "cluster.routing.allocation.disk.watermark.flood_stage.max_headroom": "5GB",
+              "cluster.routing.allocation.disk.watermark.flood_stage.frozen": "97%",
+              "cluster.routing.allocation.disk.watermark.flood_stage.frozen.max_headroom": "5GB"
+            }
+          }
+          '
+          curl -X PUT "localhost:9200/*/_settings?expand_wildcards=all&pretty" -H 'Content-Type: application/json' -d'
+          {
+            "index.blocks.read_only_allow_delete": null
+          }
+          '
+
       - name: Run tests
         run: |
-          pytest --maxfail=5 -m "document_store and integration" test/document_stores/test_elasticsearch.py
+          pytest -x -m"document_store and integration" test/document_stores/test_elasticsearch.py
+
+      - name: logs
+        if: failure()
+        run: |
+          docker logs "${{ job.services.elasticsearch.id }}"
 
       - name: Calculate alert data
         id: calculator
diff --git a/haystack/pipelines/base.py b/haystack/pipelines/base.py
index 982c6b7d29..a5774b5a15 100644
--- a/haystack/pipelines/base.py
+++ b/haystack/pipelines/base.py
@@ -963,7 +963,7 @@ def eval_beir(
             from beir.datasets.data_loader import GenericDataLoader
             from beir.retrieval.evaluation import EvaluateRetrieval
         except ModuleNotFoundError as e:
-            raise HaystackError("beir is not installed. Please run `pip install farm-haystack[beir]`...") from e
+            raise HaystackError("beir is not installed. Please run `pip install beir`") from e
 
         url = f"https://public.ukp.informatik.tu-darmstadt.de/thakur/BEIR/datasets/{dataset}.zip"
         data_path = util.download_and_unzip(url, dataset_dir)
diff --git a/pyproject.toml b/pyproject.toml
index 8ecde0c81b..93bdb17676 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -152,9 +152,6 @@ docstores-gpu = [
 audio = [
   "openai-whisper"
 ]
-beir = [
-  "beir; platform_system != 'Windows'",
-]
 aws = [
   "boto3",
   # Costraint botocore to avoid taking to much time to resolve the dependency tree.
@@ -246,11 +243,11 @@ formatting = [
 ]
 
 all = [
-  "farm-haystack[inference,docstores,audio,crawler,preprocessing,file-conversion,pdf,ocr,ray,onnx,beir,metrics,aws,preview]",
+  "farm-haystack[inference,docstores,crawler,preprocessing,file-conversion,pdf,ocr,metrics,aws,preview]",
 ]
 all-gpu = [
   # beir is incompatible with faiss-gpu: https://github.com/beir-cellar/beir/issues/71
-  "farm-haystack[inference,docstores-gpu,audio,crawler,preprocessing,file-conversion,pdf,ocr,ray,onnx-gpu,metrics,aws,preview]",
+  "farm-haystack[inference,docstores-gpu,crawler,preprocessing,file-conversion,pdf,ocr,metrics,aws,preview]",
 ]
 
 [project.scripts]
diff --git a/releasenotes/notes/review-all-extras-42d5a3a3d61f5393.yaml b/releasenotes/notes/review-all-extras-42d5a3a3d61f5393.yaml
new file mode 100644
index 0000000000..80a9fcddc1
--- /dev/null
+++ b/releasenotes/notes/review-all-extras-42d5a3a3d61f5393.yaml
@@ -0,0 +1,3 @@
+upgrade:
+  - |
+    Removes the `audio`, `ray`, `onnx` and `beir` extras from the extra group `all`.
diff --git a/test/pipelines/test_ray.py b/test/pipelines/test_ray.py
index 1e3379f655..ddb1ebf54a 100644
--- a/test/pipelines/test_ray.py
+++ b/test/pipelines/test_ray.py
@@ -1,17 +1,15 @@
-from pathlib import Path
-
 import pytest
-import ray
 
 from haystack.pipelines import RayPipeline
 
 
-@pytest.fixture(autouse=True)
-def shutdown_ray():
-    yield
+@pytest.fixture()
+def ray():
     try:
         import ray
 
+        yield ray
+
         ray.serve.shutdown()
         ray.shutdown()
     except:
@@ -21,7 +19,7 @@ def shutdown_ray():
 @pytest.mark.integration
 @pytest.mark.parametrize("document_store_with_docs", ["elasticsearch"], indirect=True)
 @pytest.mark.parametrize("serve_detached", [True, False])
-def test_load_pipeline(document_store_with_docs, serve_detached, samples_path):
+def test_load_pipeline(ray, document_store_with_docs, serve_detached, samples_path):
     pipeline = RayPipeline.load_from_yaml(
         samples_path / "pipeline" / "ray.simple.haystack-pipeline.yml",
         pipeline_name="ray_query_pipeline",
@@ -43,7 +41,7 @@ def test_load_pipeline(document_store_with_docs, serve_detached, samples_path):
 
 @pytest.mark.integration
 @pytest.mark.parametrize("document_store_with_docs", ["elasticsearch"], indirect=True)
-def test_load_advanced_pipeline(document_store_with_docs, samples_path):
+def test_load_advanced_pipeline(ray, document_store_with_docs, samples_path):
     pipeline = RayPipeline.load_from_yaml(
         samples_path / "pipeline" / "ray.advanced.haystack-pipeline.yml",
         pipeline_name="ray_query_pipeline",
@@ -71,7 +69,7 @@ def test_load_advanced_pipeline(document_store_with_docs, samples_path):
 @pytest.mark.asyncio
 @pytest.mark.integration
 @pytest.mark.parametrize("document_store_with_docs", ["elasticsearch"], indirect=True)
-async def test_load_advanced_pipeline_async(document_store_with_docs, samples_path):
+async def test_load_advanced_pipeline_async(ray, document_store_with_docs, samples_path):
     pipeline = RayPipeline.load_from_yaml(
         samples_path / "pipeline" / "ray.advanced.haystack-pipeline.yml",
         pipeline_name="ray_query_pipeline",

From 59e89b10313c620655355a30bcfbdfa0ee157bda Mon Sep 17 00:00:00 2001
From: Julian Risch <julian.risch@deepset.ai>
Date: Thu, 12 Oct 2023 22:36:49 +0200
Subject: [PATCH 4/5] test: Remove anthropic from "getting started" example
 test (#6024)

---
 examples/test_getting_started.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/test_getting_started.py b/examples/test_getting_started.py
index ba33e9755c..ee4b99aa98 100644
--- a/examples/test_getting_started.py
+++ b/examples/test_getting_started.py
@@ -6,7 +6,7 @@
 from haystack.schema import Answer, Document
 
 
-@pytest.mark.parametrize("provider", ["anthropic", "cohere", "huggingface", "openai"])
+@pytest.mark.parametrize("provider", ["cohere", "huggingface", "openai"])
 def test_getting_started(provider):
     if provider == "anthropic":
         api_key = os.environ.get("ANTHROPIC_API_KEY", "")

From 988fa61f84dbe00662a3ff0e31ee6029d4b9c507 Mon Sep 17 00:00:00 2001
From: Akash Goyal <akashgoyal2110@gmail.com>
Date: Fri, 13 Oct 2023 12:35:21 +0530
Subject: [PATCH 5/5] =?UTF-8?q?Addition=20to=20the=20text=20in=20ValueErro?=
 =?UTF-8?q?r=20when=20creating=20a=20prompt=20node=20to=20inf=E2=80=A6=20(?=
 =?UTF-8?q?#6000)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* Addition to the text in ValueError when creating a prompt node to inform users to double check they have authorisation for the loaded model and have logged into the huggingface cli

* Update haystack/nodes/prompt/prompt_model.py

Accepted the suggested changes to the value error text

Co-authored-by: Massimiliano Pippi <mpippi@gmail.com>

---------

Co-authored-by: Massimiliano Pippi <mpippi@gmail.com>
Co-authored-by: Stefano Fiorucci <44616784+anakin87@users.noreply.github.com>
---
 haystack/nodes/prompt/prompt_model.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/haystack/nodes/prompt/prompt_model.py b/haystack/nodes/prompt/prompt_model.py
index 100a2b46ea..437b0fdc40 100644
--- a/haystack/nodes/prompt/prompt_model.py
+++ b/haystack/nodes/prompt/prompt_model.py
@@ -98,6 +98,8 @@ def create_invocation_layer(
             f" Currently supported invocation layers are: {PromptModelInvocationLayer.invocation_layer_providers}"
             f" You can implement and provide custom invocation layer for {self.model_name_or_path} by subclassing "
             "PromptModelInvocationLayer."
+            f" Also please ensure you are authorised to load the model {self.model_name_or_path} and you are "
+            "logged-in into the huggingface cli."
         )
 
     def invoke(self, prompt: Union[str, List[str], List[Dict[str, str]]], **kwargs) -> List[str]: