test_replicate_model.py 2.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475
  1. import json
  2. import os
  3. from unittest.mock import patch, MagicMock
  4. from langchain.schema import Generation
  5. from core.model_providers.models.entity.message import PromptMessage, MessageType
  6. from core.model_providers.models.entity.model_params import ModelKwargs, ModelType
  7. from core.model_providers.models.llm.replicate_model import ReplicateModel
  8. from core.model_providers.providers.replicate_provider import ReplicateProvider
  9. from models.provider import Provider, ProviderType, ProviderModel
  10. def get_mock_provider():
  11. return Provider(
  12. id='provider_id',
  13. tenant_id='tenant_id',
  14. provider_name='replicate',
  15. provider_type=ProviderType.CUSTOM.value,
  16. encrypted_config='',
  17. is_valid=True,
  18. )
  19. def get_mock_model(model_name, model_version, mocker):
  20. model_kwargs = ModelKwargs(
  21. max_tokens=10,
  22. temperature=0.01
  23. )
  24. valid_api_key = os.environ['REPLICATE_API_TOKEN']
  25. model_provider = ReplicateProvider(provider=get_mock_provider())
  26. mock_query = MagicMock()
  27. mock_query.filter.return_value.first.return_value = ProviderModel(
  28. provider_name='replicate',
  29. model_name=model_name,
  30. model_type=ModelType.TEXT_GENERATION.value,
  31. encrypted_config=json.dumps({
  32. 'replicate_api_token': valid_api_key,
  33. 'model_version': model_version
  34. }),
  35. is_valid=True,
  36. )
  37. mocker.patch('extensions.ext_database.db.session.query', return_value=mock_query)
  38. return ReplicateModel(
  39. model_provider=model_provider,
  40. name=model_name,
  41. model_kwargs=model_kwargs
  42. )
  43. def decrypt_side_effect(tenant_id, encrypted_api_key):
  44. return encrypted_api_key
  45. @patch('core.helper.encrypter.decrypt_token', side_effect=decrypt_side_effect)
  46. def test_get_num_tokens(mock_decrypt, mocker):
  47. model = get_mock_model('a16z-infra/llama-2-13b-chat', '2a7f981751ec7fdf87b5b91ad4db53683a98082e9ff7bfd12c8cd5ea85980a52', mocker)
  48. rst = model.get_num_tokens([
  49. PromptMessage(type=MessageType.HUMAN, content='Who is your manufacturer?')
  50. ])
  51. assert rst == 7
  52. @patch('core.helper.encrypter.decrypt_token', side_effect=decrypt_side_effect)
  53. def test_run(mock_decrypt, mocker):
  54. mocker.patch('core.model_providers.providers.base.BaseModelProvider.update_last_used', return_value=None)
  55. model = get_mock_model('a16z-infra/llama-2-13b-chat', '2a7f981751ec7fdf87b5b91ad4db53683a98082e9ff7bfd12c8cd5ea85980a52', mocker)
  56. messages = [PromptMessage(content='Human: 1+1=? \nAnswer: ')]
  57. rst = model.run(
  58. messages
  59. )
  60. assert len(rst.content) > 0