mirror of
https://github.com/deepset-ai/haystack.git
synced 2025-07-20 23:41:36 +00:00

* remove duplicate imports * fix ungrouped-imports * Fix wrong-import-position * Fix unused-import * pyproject.toml * Working on wrong-import-order * Solve wrong-import-order * fix Pool import * Move open_search_index_to_document_store and elasticsearch_index_to_document_store in elasticsearch.py * remove Converter from modeling * Fix mypy issues on adaptive_model.py * create es_converter.py * remove converter import * change import path in tests * Restructure REST API to not rely on global vars from search.apy and improve tests * Fix openapi generator * Move variable initialization * Change type of FilterRequest.filters Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
56 lines
1.9 KiB
Python
56 lines
1.9 KiB
Python
from typing import List
|
|
|
|
import logging
|
|
|
|
from fastapi import FastAPI, APIRouter
|
|
from haystack.document_stores import BaseDocumentStore
|
|
|
|
from rest_api.utils import get_app, get_pipelines
|
|
from rest_api.config import LOG_LEVEL
|
|
from rest_api.schema import FilterRequest, DocumentSerialized
|
|
|
|
|
|
logging.getLogger("haystack").setLevel(LOG_LEVEL)
|
|
logger = logging.getLogger("haystack")
|
|
|
|
|
|
router = APIRouter()
|
|
app: FastAPI = get_app()
|
|
document_store: BaseDocumentStore = get_pipelines().get("document_store", None)
|
|
|
|
|
|
@router.post("/documents/get_by_filters", response_model=List[DocumentSerialized], response_model_exclude_none=True)
|
|
def get_documents(filters: FilterRequest):
|
|
"""
|
|
This endpoint allows you to retrieve documents contained in your document store.
|
|
You can filter the documents to delete by metadata (like the document's name),
|
|
or provide an empty JSON object to clear the document store.
|
|
|
|
Example of filters:
|
|
`'{"filters": {{"name": ["some", "more"], "category": ["only_one"]}}'`
|
|
|
|
To get all documents you should provide an empty dict, like:
|
|
`'{"filters": {}}'`
|
|
"""
|
|
docs = [doc.to_dict() for doc in document_store.get_all_documents(filters=filters.filters)]
|
|
for doc in docs:
|
|
doc["embedding"] = None
|
|
return docs
|
|
|
|
|
|
@router.post("/documents/delete_by_filters", response_model=bool)
|
|
def delete_documents(filters: FilterRequest):
|
|
"""
|
|
This endpoint allows you to delete documents contained in your document store.
|
|
You can filter the documents to delete by metadata (like the document's name),
|
|
or provide an empty JSON object to clear the document store.
|
|
|
|
Example of filters:
|
|
`'{"filters": {{"name": ["some", "more"], "category": ["only_one"]}}'`
|
|
|
|
To get all documents you should provide an empty dict, like:
|
|
`'{"filters": {}}'`
|
|
"""
|
|
document_store.delete_documents(filters=filters.filters)
|
|
return True
|