Skip to content

Commit 176db5d

Browse files
initial import (#8635)
1 parent f2b5f12 commit 176db5d

File tree

2 files changed

+2 -4 lines changed

2 files changed

+2 -4 lines changed

Diff for: e2e/pipelines/test_dense_doc_search.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@ def test_dense_doc_search_pipeline(tmp_path, samples_path):
2626
indexing_pipeline.add_component(instance=DocumentJoiner(), name="joiner")
2727
indexing_pipeline.add_component(instance=DocumentCleaner(), name="cleaner")
2828
indexing_pipeline.add_component(
29-
instance=DocumentSplitter(split_by="sentence", split_length=250, split_overlap=30), name="splitter"
29+
instance=DocumentSplitter(split_by="period", split_length=250, split_overlap=30), name="splitter"
3030
)
3131
indexing_pipeline.add_component(
3232
instance=SentenceTransformersDocumentEmbedder(model="sentence-transformers/all-MiniLM-L6-v2"), name="embedder"

Diff for: e2e/pipelines/test_preprocessing_pipeline.py

+1 -3
Original file line number | Diff line number | Diff line change
@@ -25,9 +25,7 @@ def test_preprocessing_pipeline(tmp_path):
2525
instance=MetadataRouter(rules={"en": {"field": "language", "operator": "==", "value": "en"}}), name="router"
2626
)
2727
preprocessing_pipeline.add_component(instance=DocumentCleaner(), name="cleaner")
28-
preprocessing_pipeline.add_component(
29-
instance=DocumentSplitter(split_by="sentence", split_length=1), name="splitter"
30-
)
28+
preprocessing_pipeline.add_component(instance=DocumentSplitter(split_by="period", split_length=1), name="splitter")
3129
preprocessing_pipeline.add_component(
3230
instance=SentenceTransformersDocumentEmbedder(model="sentence-transformers/all-MiniLM-L6-v2"), name="embedder"
3331
)

0 commit comments

Comments (0)