feat: backend model load balancing support (#4927)

This commit is contained in:
takatost
2024-06-05 00:13:04 +08:00
committed by GitHub
parent 52ec152dd3
commit d1dbbc1e33
47 changed files with 2191 additions and 256 deletions

View File

@@ -1,6 +1,6 @@
import os
from core.utils.module_import_helper import import_module_from_source, load_single_subclass_from_source
from core.helper.module_import_helper import import_module_from_source, load_single_subclass_from_source
from tests.integration_tests.utils.parent_class import ParentClass

View File

@@ -92,7 +92,8 @@ def test_execute_llm(setup_openai_mock):
provider=CustomProviderConfiguration(
credentials=credentials
)
)
),
model_settings=[]
),
provider_instance=provider_instance,
model_type_instance=model_type_instance
@@ -206,10 +207,11 @@ def test_execute_llm_with_jinja2(setup_code_executor_mock, setup_openai_mock):
provider=CustomProviderConfiguration(
credentials=credentials
)
)
),
model_settings=[]
),
provider_instance=provider_instance,
model_type_instance=model_type_instance
model_type_instance=model_type_instance,
)
model_instance = ModelInstance(provider_model_bundle=provider_model_bundle, model='gpt-3.5-turbo')

View File

@@ -42,7 +42,8 @@ def get_mocked_fetch_model_config(
provider=CustomProviderConfiguration(
credentials=credentials
)
)
),
model_settings=[]
),
provider_instance=provider_instance,
model_type_instance=model_type_instance