feat: server xinference support (#927)

This commit is contained in:
takatost
2023-08-20 17:46:41 +08:00
committed by GitHub
parent 8c991b5b26
commit da3f10a55e
18 changed files with 456 additions and 17 deletions

View File

@@ -65,6 +65,8 @@ def test_get_num_tokens(mock_decrypt, mocker):
@patch('core.helper.encrypter.decrypt_token', side_effect=decrypt_side_effect)
def test_run(mock_decrypt, mocker):
mocker.patch('core.model_providers.providers.base.BaseModelProvider.update_last_used', return_value=None)
model = get_mock_model('a16z-infra/llama-2-13b-chat', '2a7f981751ec7fdf87b5b91ad4db53683a98082e9ff7bfd12c8cd5ea85980a52', mocker)
messages = [PromptMessage(content='Human: 1+1=? \nAnswer: ')]
rst = model.run(