add deepseek online models #1765

Open · wants to merge 1 commit into base: master
7 changes: 6 additions & 1 deletion config.py
@@ -35,7 +35,7 @@
AVAIL_LLM_MODELS = ["gpt-4-1106-preview", "gpt-4-turbo-preview", "gpt-4-vision-preview", "gpt-4-turbo", "gpt-4-turbo-2024-04-09",
"gpt-3.5-turbo-1106", "gpt-3.5-turbo-16k", "gpt-3.5-turbo", "azure-gpt-3.5",
"gpt-4", "gpt-4-32k", "azure-gpt-4", "glm-4", "glm-4v", "glm-3-turbo",
- "gemini-pro", "chatglm3"
+ "gemini-pro", "chatglm3", "deepseek-chat", "deepseek-coder"
]
# --- --- --- ---
# P.S. Other available models also include
@@ -223,6 +223,8 @@
# Yi Model (零一万物) API KEY
YIMODEL_API_KEY = ""

# DEEPSEEK API KEY
DEEPSEEK_API_KEY = ""

# Mathpix can perform OCR on PDF files, but requires account registration
MATHPIX_APPID = ""
@@ -332,6 +334,9 @@
├── "yi-34b-chat-0205", "yi-34b-chat-200k" and other Yi Model (零一万物) large models
│ └── YIMODEL_API_KEY
├── "deepseek-chat", "deepseek-coder" and other DEEPSEEK large models
│ └── DEEPSEEK_API_KEY
├── "qwen-turbo" and other Tongyi Qianwen (通义千问) large models
│ └── DASHSCOPE_API_KEY
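For reference, a minimal sketch of how a user would switch the new models on in config.py after this change. Only DEEPSEEK_API_KEY and the two model names come from the diff above; the trimmed model list and the key value are illustrative placeholders.

# In config.py (user-edited values; the API key shown is a placeholder)
AVAIL_LLM_MODELS = ["gpt-3.5-turbo", "deepseek-chat", "deepseek-coder"]
DEEPSEEK_API_KEY = "sk-xxxxxxxxxxxxxxxx"  # obtained from the DeepSeek open platform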
28 changes: 28 additions & 0 deletions request_llms/bridge_all.py
@@ -34,6 +34,9 @@
from .bridge_zhipu import predict_no_ui_long_connection as zhipu_noui
from .bridge_zhipu import predict as zhipu_ui

from .bridge_deepseek import predict_no_ui_long_connection as deepseek_noui
from .bridge_deepseek import predict as deepseek_ui

from .bridge_cohere import predict as cohere_ui
from .bridge_cohere import predict_no_ui_long_connection as cohere_noui
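The new request_llms/bridge_deepseek.py module that the two deepseek imports point to is not included in this section's diff. Below is a minimal sketch of what such a bridge could look like, assuming an OpenAI-compatible chat-completions API and function signatures mirroring the other bridges; everything here other than the two exported names is an assumption, not the PR's actual code.

# request_llms/bridge_deepseek.py -- illustrative sketch only, not the PR's implementation.
import requests

def _chat(inputs, history, sys_prompt, llm_kwargs):
    # Build an OpenAI-style message list from the (user, assistant, user, ...) history.
    messages = [{"role": "system", "content": sys_prompt}]
    for i in range(0, len(history) - 1, 2):
        messages.append({"role": "user", "content": history[i]})
        messages.append({"role": "assistant", "content": history[i + 1]})
    messages.append({"role": "user", "content": inputs})
    resp = requests.post(
        llm_kwargs.get("endpoint", "https://api.deepseek.com/chat/completions"),
        headers={"Authorization": "Bearer " + llm_kwargs["api_key"]},  # assumed llm_kwargs layout
        json={"model": llm_kwargs.get("llm_model", "deepseek-chat"), "messages": messages},
        timeout=60,
    )
    resp.raise_for_status()
    return resp.json()["choices"][0]["message"]["content"]

def predict_no_ui_long_connection(inputs, llm_kwargs, history=[], sys_prompt="", observe_window=None, console_slience=False):
    # Non-streaming variant used by background plugins.
    return _chat(inputs, history, sys_prompt, llm_kwargs)

def predict(inputs, llm_kwargs, plugin_kwargs, chatbot, history=[], system_prompt="", stream=True, additional_fn=None):
    # UI variant (generator); the real bridge would stream tokens and refresh the UI incrementally.
    reply = _chat(inputs, history, system_prompt, llm_kwargs)
    chatbot.append((inputs, reply))
    history.extend([inputs, reply])
    yield chatbot, history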

@@ -69,6 +72,7 @@ def decode(self, *args, **kwargs):
yimodel_endpoint = "https://api.lingyiwanwu.com/v1/chat/completions"
cohere_endpoint = "https://api.cohere.ai/v1/chat"
ollama_endpoint = "http://localhost:11434/api/chat"
deepseek_endpoint = "https://api.deepseek.com/chat/completions"

if not AZURE_ENDPOINT.endswith('/'): AZURE_ENDPOINT += '/'
azure_endpoint = AZURE_ENDPOINT + f'openai/deployments/{AZURE_ENGINE}/chat/completions?api-version=2023-05-15'
@@ -89,6 +93,7 @@ def decode(self, *args, **kwargs):
if yimodel_endpoint in API_URL_REDIRECT: yimodel_endpoint = API_URL_REDIRECT[yimodel_endpoint]
if cohere_endpoint in API_URL_REDIRECT: cohere_endpoint = API_URL_REDIRECT[cohere_endpoint]
if ollama_endpoint in API_URL_REDIRECT: ollama_endpoint = API_URL_REDIRECT[ollama_endpoint]
if deepseek_endpoint in API_URL_REDIRECT: deepseek_endpoint = API_URL_REDIRECT[deepseek_endpoint]

# Get tokenizer
tokenizer_gpt35 = LazyloadTiktoken("gpt-3.5-turbo")
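Because the new deepseek_endpoint is passed through the same API_URL_REDIRECT lookup as the other endpoints, it can be rerouted from config.py like any of them; a sketch with an illustrative proxy URL:

# In config.py -- reroute DeepSeek traffic through a reverse proxy (target URL is illustrative)
API_URL_REDIRECT = {
    "https://api.deepseek.com/chat/completions": "https://my-proxy.example.com/deepseek/chat/completions",
}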
@@ -790,6 +795,29 @@ def decode(self, *args, **kwargs):
except:
print(trimmed_format_exc())

if "deepseek-chat" in AVAIL_LLM_MODELS or "deepseek-coder" in AVAIL_LLM_MODELS: # deepseek online api
try:
model_info.update({
"deepseek-chat": {
"fn_with_ui": deepseek_ui,
"fn_without_ui": deepseek_noui,
"endpoint": deepseek_endpoint,
"max_token": 32000,
"tokenizer": tokenizer_gpt35,
"token_cnt": get_token_num_gpt35,
},
"deepseek-coder": {
"fn_with_ui": deepseek_ui,
"fn_without_ui": deepseek_noui,
"endpoint": deepseek_endpoint,
"max_token": 16000,
"tokenizer": tokenizer_gpt35,
"token_cnt": get_token_num_gpt35,
}
})
except:
print(trimmed_format_exc())
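Once registered, the two entries behave like any other model_info record; a hypothetical helper showing how downstream code could use the registered token counter and budget (the helper itself is illustrative, not part of this PR):

# Illustrative only: check a prompt against the budget registered for a DeepSeek model.
def fits_context(model_name, prompt):
    entry = model_info[model_name]  # e.g. "deepseek-chat" (32000) or "deepseek-coder" (16000)
    return entry["token_cnt"](prompt) < entry["max_token"]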


# -=-=-=-=-=-=- one-api 对齐支持 -=-=-=-=-=-=-
for model in [m for m in AVAIL_LLM_MODELS if m.startswith("one-api-")]: