.. |
__init__.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
anthropic_llm.py
|
d75e8aeafa
feat: disable anthropic retry (#1067)
|
1 anno fa |
azure_chat_open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
azure_open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
chat_open_ai.py
|
417c19577a
feat: add LocalAI local embedding model support (#1021)
|
1 anno fa |
fake.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
huggingface_endpoint_llm.py
|
0796791de5
feat: hf inference endpoint stream support (#1028)
|
1 anno fa |
open_ai.py
|
417c19577a
feat: add LocalAI local embedding model support (#1021)
|
1 anno fa |
openllm.py
|
866ee5da91
fix: openllm generate cutoff (#945)
|
1 anno fa |
replicate_llm.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
spark.py
|
f42e7d1a61
feat: add spark v2 support (#885)
|
2 anni fa |
tongyi_llm.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 anni fa |
wenxin.py
|
c4d759dfba
fix: wenxin error not raise when stream mode (#884)
|
2 anni fa |
xinference_llm.py
|
2d9616c29c
fix: xinference last token being ignored (#1013)
|
1 anno fa |