"""Tests for ``LocalAILanguageModel``.

Every test reads the server address from the ``LOCALAI_SERVER_URL``
environment variable via ``os.environ.get`` (which yields ``None`` when the
variable is unset) and passes it to the model as the ``server_url``
credential.
"""
import os
from collections.abc import Generator

import pytest

from core.model_runtime.entities.llm_entities import LLMResult, LLMResultChunk, LLMResultChunkDelta
from core.model_runtime.entities.message_entities import (
    AssistantPromptMessage,
    PromptMessageTool,
    SystemPromptMessage,
    TextPromptMessageContent,
    UserPromptMessage,
)
from core.model_runtime.entities.model_entities import ParameterRule
from core.model_runtime.errors.validate import CredentialsValidateFailedError
from core.model_runtime.model_providers.localai.llm.llm import LocalAILanguageModel


def _server_credentials(completion_type):
    """Build the credentials dict for the server named by LOCALAI_SERVER_URL."""
    return {
        'server_url': os.environ.get('LOCALAI_SERVER_URL'),
        'completion_type': completion_type,
    }


def _sampling_parameters():
    """Return a fresh copy of the model parameters shared by the invoke tests."""
    return {
        'temperature': 0.7,
        'top_p': 1.0,
        'max_tokens': 10,
    }


def _check_blocking_result(result):
    """Assert that a non-streaming invoke produced text and counted tokens."""
    assert isinstance(result, LLMResult)
    assert len(result.message.content) > 0
    assert result.usage.total_tokens > 0


def _check_streamed_result(stream):
    """Assert that a streaming invoke yields well-formed chunks."""
    assert isinstance(stream, Generator)
    for piece in stream:
        assert isinstance(piece, LLMResultChunk)
        assert isinstance(piece.delta, LLMResultChunkDelta)
        assert isinstance(piece.delta.message, AssistantPromptMessage)
        # Only chunks without a finish reason are required to carry content.
        if piece.delta.finish_reason is None:
            assert len(piece.delta.message.content) > 0


def test_validate_credentials_for_chat_model():
    """A bogus server URL must be rejected; the configured one must pass."""
    llm = LocalAILanguageModel()

    bad_credentials = {
        'server_url': 'hahahaha',
        'completion_type': 'completion',
    }
    with pytest.raises(CredentialsValidateFailedError):
        llm.validate_credentials(
            model='chinese-llama-2-7b',
            credentials=bad_credentials,
        )

    # Expected to return without raising for the configured server.
    llm.validate_credentials(
        model='chinese-llama-2-7b',
        credentials=_server_credentials('completion'),
    )


def test_invoke_completion_model():
    """Blocking invoke with the 'completion' completion type."""
    llm = LocalAILanguageModel()

    result = llm.invoke(
        model='chinese-llama-2-7b',
        credentials=_server_credentials('completion'),
        prompt_messages=[UserPromptMessage(content='ping')],
        model_parameters=_sampling_parameters(),
        stop=[],
        user="abc-123",
        stream=False,
    )

    _check_blocking_result(result)


def test_invoke_chat_model():
    """Blocking invoke with the 'chat_completion' completion type."""
    llm = LocalAILanguageModel()

    result = llm.invoke(
        model='chinese-llama-2-7b',
        credentials=_server_credentials('chat_completion'),
        prompt_messages=[UserPromptMessage(content='ping')],
        model_parameters=_sampling_parameters(),
        stop=[],
        user="abc-123",
        stream=False,
    )

    _check_blocking_result(result)


def test_invoke_stream_completion_model():
    """Streaming invoke with the 'completion' completion type."""
    llm = LocalAILanguageModel()

    stream = llm.invoke(
        model='chinese-llama-2-7b',
        credentials=_server_credentials('completion'),
        prompt_messages=[UserPromptMessage(content='Hello World!')],
        model_parameters=_sampling_parameters(),
        stop=['you'],
        stream=True,
        user="abc-123",
    )

    _check_streamed_result(stream)


def test_invoke_stream_chat_model():
    """Streaming invoke with the 'chat_completion' completion type."""
    llm = LocalAILanguageModel()

    stream = llm.invoke(
        model='chinese-llama-2-7b',
        credentials=_server_credentials('chat_completion'),
        prompt_messages=[UserPromptMessage(content='Hello World!')],
        model_parameters=_sampling_parameters(),
        stop=['you'],
        stream=True,
        user="abc-123",
    )

    _check_streamed_result(stream)


def test_get_num_tokens():
    """Token counts are pinned for a prompt with a tool and a bare prompt."""
    llm = LocalAILanguageModel()

    weather_tool = PromptMessageTool(
        name='get_current_weather',
        description='Get the current weather in a given location',
        parameters={
            "type": "object",
            "properties": {
                "location": {
                    "type": "string",
                    "description": "The city and state e.g. San Francisco, CA",
                },
                "unit": {
                    "type": "string",
                    "enum": ["c", "f"],
                },
            },
            "required": ["location"],
        },
    )

    # System + user message together with one tool definition.
    count_with_tool = llm.get_num_tokens(
        model='????',
        credentials=_server_credentials('chat_completion'),
        prompt_messages=[
            SystemPromptMessage(content='You are a helpful AI assistant.'),
            UserPromptMessage(content='Hello World!'),
        ],
        tools=[weather_tool],
    )
    assert isinstance(count_with_tool, int)
    assert count_with_tool == 77

    # A single user message and no tools.
    count_plain = llm.get_num_tokens(
        model='????',
        credentials=_server_credentials('chat_completion'),
        prompt_messages=[UserPromptMessage(content='Hello World!')],
    )
    assert isinstance(count_plain, int)
    assert count_plain == 10