| .. |
|
__init__.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
azure_chat_open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
azure_open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
chat_open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
fake.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
huggingface_endpoint_llm.py
|
0796791de5
feat: hf inference endpoint stream support (#1028)
|
2 years ago |
|
open_ai.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
openllm.py
|
866ee5da91
fix: openllm generate cutoff (#945)
|
2 years ago |
|
replicate_llm.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
spark.py
|
f42e7d1a61
feat: add spark v2 support (#885)
|
2 years ago |
|
tongyi_llm.py
|
5fa2161b05
feat: server multi models support (#799)
|
2 years ago |
|
wenxin.py
|
c4d759dfba
fix: wenxin error not raise when stream mode (#884)
|
2 years ago |
|
xinference_llm.py
|
2d9616c29c
fix: xinference last token being ignored (#1013)
|
2 years ago |