| .. |
|
__init__.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
|
anthropic_llm.py
|
d75e8aeafa
feat: disable anthropic retry (#1067)
|
2 anni fa |
|
azure_chat_open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
|
azure_open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
|
chat_open_ai.py
|
417c19577a
feat: add LocalAI local embedding model support (#1021)
|
2 anni fa |
|
fake.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
|
huggingface_endpoint_llm.py
|
0796791de5
feat: hf inference endpoint stream support (#1028)
|
2 anni fa |
|
huggingface_hub_llm.py
|
e409895c02
Feat/huggingface embedding support (#1211)
|
2 anni fa |
|
open_ai.py
|
ae3f1ac0a9
feat: support gpt-3.5-turbo-instruct model (#1195)
|
2 anni fa |
|
openllm.py
|
866ee5da91
fix: openllm generate cutoff (#945)
|
2 anni fa |
|
replicate_llm.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
|
spark.py
|
f42e7d1a61
feat: add spark v2 support (#885)
|
2 anni fa |
|
tongyi_llm.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
|
wenxin.py
|
c4d759dfba
fix: wenxin error not raise when stream mode (#884)
|
2 anni fa |
|
xinference_llm.py
|
2d9616c29c
fix: xinference last token being ignored (#1013)
|
2 anni fa |
|
zhipuai_llm.py
|
827c97f0d3
feat: add zhipuai (#1188)
|
2 anni fa |