hit_testing.py 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990
  1. import logging
  2. from flask_login import current_user
  3. from flask_restful import Resource, marshal, reqparse
  4. from werkzeug.exceptions import Forbidden, InternalServerError, NotFound
  5. import services
  6. from controllers.console import api
  7. from controllers.console.app.error import (
  8. CompletionRequestError,
  9. ProviderModelCurrentlyNotSupportError,
  10. ProviderNotInitializeError,
  11. ProviderQuotaExceededError,
  12. )
  13. from controllers.console.datasets.error import DatasetNotInitializedError, HighQualityDatasetOnlyError
  14. from controllers.console.setup import setup_required
  15. from controllers.console.wraps import account_initialization_required
  16. from core.errors.error import (
  17. LLMBadRequestError,
  18. ModelCurrentlyNotSupportError,
  19. ProviderTokenNotInitError,
  20. QuotaExceededError,
  21. )
  22. from core.model_runtime.errors.invoke import InvokeError
  23. from fields.hit_testing_fields import hit_testing_record_fields
  24. from libs.login import login_required
  25. from services.dataset_service import DatasetService
  26. from services.hit_testing_service import HitTestingService
  27. class HitTestingApi(Resource):
  28. @setup_required
  29. @login_required
  30. @account_initialization_required
  31. def post(self, dataset_id):
  32. dataset_id_str = str(dataset_id)
  33. dataset = DatasetService.get_dataset(dataset_id_str)
  34. if dataset is None:
  35. raise NotFound("Dataset not found.")
  36. try:
  37. DatasetService.check_dataset_permission(dataset, current_user)
  38. except services.errors.account.NoPermissionError as e:
  39. raise Forbidden(str(e))
  40. # only high quality dataset can be used for hit testing
  41. if dataset.indexing_technique != 'high_quality':
  42. raise HighQualityDatasetOnlyError()
  43. parser = reqparse.RequestParser()
  44. parser.add_argument('query', type=str, location='json')
  45. parser.add_argument('retrieval_model', type=dict, required=False, location='json')
  46. args = parser.parse_args()
  47. HitTestingService.hit_testing_args_check(args)
  48. try:
  49. response = HitTestingService.retrieve(
  50. dataset=dataset,
  51. query=args['query'],
  52. account=current_user,
  53. retrieval_model=args['retrieval_model'],
  54. limit=10
  55. )
  56. return {"query": response['query'], 'records': marshal(response['records'], hit_testing_record_fields)}
  57. except services.errors.index.IndexNotInitializedError:
  58. raise DatasetNotInitializedError()
  59. except ProviderTokenNotInitError as ex:
  60. raise ProviderNotInitializeError(ex.description)
  61. except QuotaExceededError:
  62. raise ProviderQuotaExceededError()
  63. except ModelCurrentlyNotSupportError:
  64. raise ProviderModelCurrentlyNotSupportError()
  65. except LLMBadRequestError:
  66. raise ProviderNotInitializeError(
  67. "No Embedding Model or Reranking Model available. Please configure a valid provider "
  68. "in the Settings -> Model Provider.")
  69. except InvokeError as e:
  70. raise CompletionRequestError(e.description)
  71. except ValueError as e:
  72. raise ValueError(str(e))
  73. except Exception as e:
  74. logging.exception("Hit testing failed.")
  75. raise InternalServerError(str(e))
  76. api.add_resource(HitTestingApi, '/datasets/<uuid:dataset_id>/hit-testing')