2023-05-15 08:51:32 +08:00
|
|
|
import logging
|
|
|
|
|
2023-08-21 13:57:18 +08:00
|
|
|
from flask_login import current_user
|
2023-10-08 05:21:32 -05:00
|
|
|
from libs.login import login_required
|
2023-09-27 16:06:32 +08:00
|
|
|
from flask_restful import Resource, reqparse, marshal
|
2023-05-15 08:51:32 +08:00
|
|
|
from werkzeug.exceptions import InternalServerError, NotFound, Forbidden
|
|
|
|
|
|
|
|
import services
|
|
|
|
from controllers.console import api
|
2023-05-22 17:39:28 +08:00
|
|
|
from controllers.console.app.error import ProviderNotInitializeError, ProviderQuotaExceededError, \
|
|
|
|
ProviderModelCurrentlyNotSupportError
|
2023-05-15 08:51:32 +08:00
|
|
|
from controllers.console.datasets.error import HighQualityDatasetOnlyError, DatasetNotInitializedError
|
|
|
|
from controllers.console.setup import setup_required
|
|
|
|
from controllers.console.wraps import account_initialization_required
|
2024-01-02 23:42:00 +08:00
|
|
|
from core.errors.error import ProviderTokenNotInitError, QuotaExceededError, ModelCurrentlyNotSupportError, \
|
2023-08-18 17:37:31 +08:00
|
|
|
LLMBadRequestError
|
2023-09-27 16:06:32 +08:00
|
|
|
from fields.hit_testing_fields import hit_testing_record_fields
|
2023-05-15 08:51:32 +08:00
|
|
|
from services.dataset_service import DatasetService
|
|
|
|
from services.hit_testing_service import HitTestingService
|
|
|
|
|
|
|
|
|
|
|
|
class HitTestingApi(Resource):
|
|
|
|
|
|
|
|
@setup_required
|
|
|
|
@login_required
|
|
|
|
@account_initialization_required
|
|
|
|
def post(self, dataset_id):
|
|
|
|
dataset_id_str = str(dataset_id)
|
|
|
|
|
|
|
|
dataset = DatasetService.get_dataset(dataset_id_str)
|
|
|
|
if dataset is None:
|
|
|
|
raise NotFound("Dataset not found.")
|
|
|
|
|
|
|
|
try:
|
|
|
|
DatasetService.check_dataset_permission(dataset, current_user)
|
|
|
|
except services.errors.account.NoPermissionError as e:
|
|
|
|
raise Forbidden(str(e))
|
|
|
|
|
|
|
|
# only high quality dataset can be used for hit testing
|
|
|
|
if dataset.indexing_technique != 'high_quality':
|
|
|
|
raise HighQualityDatasetOnlyError()
|
|
|
|
|
|
|
|
parser = reqparse.RequestParser()
|
|
|
|
parser.add_argument('query', type=str, location='json')
|
2023-11-17 22:13:37 +08:00
|
|
|
parser.add_argument('retrieval_model', type=dict, required=False, location='json')
|
2023-05-15 08:51:32 +08:00
|
|
|
args = parser.parse_args()
|
|
|
|
|
2023-11-17 22:13:37 +08:00
|
|
|
HitTestingService.hit_testing_args_check(args)
|
2023-05-15 08:51:32 +08:00
|
|
|
|
|
|
|
try:
|
|
|
|
response = HitTestingService.retrieve(
|
|
|
|
dataset=dataset,
|
2023-11-17 22:13:37 +08:00
|
|
|
query=args['query'],
|
2023-05-15 08:51:32 +08:00
|
|
|
account=current_user,
|
2023-11-17 22:13:37 +08:00
|
|
|
retrieval_model=args['retrieval_model'],
|
|
|
|
limit=10
|
2023-05-15 08:51:32 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
return {"query": response['query'], 'records': marshal(response['records'], hit_testing_record_fields)}
|
|
|
|
except services.errors.index.IndexNotInitializedError:
|
|
|
|
raise DatasetNotInitializedError()
|
2023-07-17 00:14:19 +08:00
|
|
|
except ProviderTokenNotInitError as ex:
|
|
|
|
raise ProviderNotInitializeError(ex.description)
|
2023-05-22 17:39:28 +08:00
|
|
|
except QuotaExceededError:
|
|
|
|
raise ProviderQuotaExceededError()
|
|
|
|
except ModelCurrentlyNotSupportError:
|
|
|
|
raise ProviderModelCurrentlyNotSupportError()
|
2023-08-18 17:37:31 +08:00
|
|
|
except LLMBadRequestError:
|
|
|
|
raise ProviderNotInitializeError(
|
2023-11-19 15:12:55 +08:00
|
|
|
f"No Embedding Model or Reranking Model available. Please configure a valid provider "
|
2023-08-18 17:37:31 +08:00
|
|
|
f"in the Settings -> Model Provider.")
|
2023-08-12 00:57:00 +08:00
|
|
|
except ValueError as e:
|
|
|
|
raise ValueError(str(e))
|
2023-05-15 08:51:32 +08:00
|
|
|
except Exception as e:
|
|
|
|
logging.exception("Hit testing failed.")
|
|
|
|
raise InternalServerError(str(e))
|
|
|
|
|
|
|
|
|
|
|
|
api.add_resource(HitTestingApi, '/datasets/<uuid:dataset_id>/hit-testing')
|