mirror of
				https://github.com/langgenius/dify.git
				synced 2025-10-31 19:03:09 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			113 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			113 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| import os
 | |
| from collections.abc import Generator
 | |
| 
 | |
| import pytest
 | |
| 
 | |
| from core.model_runtime.entities.llm_entities import LLMResult, LLMResultChunk, LLMResultChunkDelta
 | |
| from core.model_runtime.entities.message_entities import AssistantPromptMessage, SystemPromptMessage, UserPromptMessage
 | |
| from core.model_runtime.errors.validate import CredentialsValidateFailedError
 | |
| from core.model_runtime.model_providers.replicate.llm.llm import ReplicateLargeLanguageModel
 | |
| 
 | |
| 
 | |
def test_validate_credentials():
    """Exercise ``validate_credentials`` with a bogus token and with the configured one.

    The bogus token must raise ``CredentialsValidateFailedError``; the token read
    from the ``REPLICATE_API_KEY`` environment variable must pass without raising.
    """
    llm = ReplicateLargeLanguageModel()
    model_name = "meta/llama-2-13b-chat"
    model_version = "f4e2de70d66816a838a89eeeb621910adffb0dd0baba3976c96980970978018d"

    # Negative case: an obviously invalid token is expected to be rejected.
    rejected_credentials = {
        "replicate_api_token": "invalid_key",
        "model_version": model_version,
    }
    with pytest.raises(CredentialsValidateFailedError):
        llm.validate_credentials(model=model_name, credentials=rejected_credentials)

    # Positive case: the call simply has to return without raising.
    accepted_credentials = {
        "replicate_api_token": os.environ.get("REPLICATE_API_KEY"),
        "model_version": model_version,
    }
    llm.validate_credentials(model=model_name, credentials=accepted_credentials)
 | |
| 
 | |
| 
 | |
def test_invoke_model():
    """Invoke the model with ``stream=False`` and expect a non-empty ``LLMResult``."""
    llm = ReplicateLargeLanguageModel()

    credentials = {
        "replicate_api_token": os.environ.get("REPLICATE_API_KEY"),
        "model_version": "f4e2de70d66816a838a89eeeb621910adffb0dd0baba3976c96980970978018d",
    }
    conversation = [
        SystemPromptMessage(content="You are a helpful AI assistant."),
        UserPromptMessage(content="Who are you?"),
    ]
    sampling_parameters = {"temperature": 1.0, "top_k": 2, "top_p": 0.5}

    result = llm.invoke(
        model="meta/llama-2-13b-chat",
        credentials=credentials,
        prompt_messages=conversation,
        model_parameters=sampling_parameters,
        stop=["How"],
        stream=False,
        user="abc-123",
    )

    # With streaming disabled the whole answer is expected in a single result object.
    assert isinstance(result, LLMResult)
    assert len(result.message.content) > 0
 | |
| 
 | |
| 
 | |
def test_invoke_stream_model():
    """Invoke the model with ``stream=True`` and type-check every chunk that is yielded."""
    llm = ReplicateLargeLanguageModel()

    credentials = {
        "replicate_api_token": os.environ.get("REPLICATE_API_KEY"),
        "model_version": "2b56576fcfbe32fa0526897d8385dd3fb3d36ba6fd0dbe033c72886b81ade93e",
    }
    conversation = [
        SystemPromptMessage(content="You are a helpful AI assistant."),
        UserPromptMessage(content="Who are you?"),
    ]
    sampling_parameters = {"temperature": 1.0, "top_k": 2, "top_p": 0.5}

    stream = llm.invoke(
        model="mistralai/mixtral-8x7b-instruct-v0.1",
        credentials=credentials,
        prompt_messages=conversation,
        model_parameters=sampling_parameters,
        stop=["How"],
        stream=True,
        user="abc-123",
    )

    # With streaming enabled the call is expected to hand back a generator.
    assert isinstance(stream, Generator)

    # Check each layer of the chunk: the chunk, its delta, and the delta's message.
    for piece in stream:
        assert isinstance(piece, LLMResultChunk)
        assert isinstance(piece.delta, LLMResultChunkDelta)
        assert isinstance(piece.delta.message, AssistantPromptMessage)
 | |
| 
 | |
| 
 | |
def test_get_num_tokens():
    """Check that ``get_num_tokens`` reports 14 tokens for the fixed two-message prompt."""
    llm = ReplicateLargeLanguageModel()

    credentials = {
        "replicate_api_token": os.environ.get("REPLICATE_API_KEY"),
        "model_version": "2b56576fcfbe32fa0526897d8385dd3fb3d36ba6fd0dbe033c72886b81ade93e",
    }
    conversation = [
        SystemPromptMessage(content="You are a helpful AI assistant."),
        UserPromptMessage(content="Hello World!"),
    ]

    # The model name is passed as an empty string here, exactly as the test was written.
    token_count = llm.get_num_tokens(
        model="",
        credentials=credentials,
        prompt_messages=conversation,
    )

    assert token_count == 14
 | 
