From f720135e7d6aaf9bb2d8b64c1032aadd1b32d6bc Mon Sep 17 00:00:00 2001
From: sigoden
Date: Wed, 13 Nov 2024 07:58:05 +0800
Subject: [PATCH] feat: remove supports for huggingface (#988)

---
 Argcfile.sh         |  1 -
 config.example.yaml |  6 ------
 models.yaml         | 24 ------------------------
 src/client/mod.rs   |  3 +--
 4 files changed, 1 insertion(+), 33 deletions(-)

diff --git a/Argcfile.sh b/Argcfile.sh
index 558d0565..2c8a830b 100755
--- a/Argcfile.sh
+++ b/Argcfile.sh
@@ -87,7 +87,6 @@ OPENAI_COMPATIBLE_PLATFORMS=( \
     fireworks,accounts/fireworks/models/llama-v3p1-8b-instruct,https://api.fireworks.ai/inference/v1 \
     github,gpt-4o-mini,https://models.inference.ai.azure.com \
     groq,llama3-8b-8192,https://api.groq.com/openai/v1 \
-    huggingface,meta-llama/Meta-Llama-3-8B-Instruct,https://api-inference.huggingface.co/v1 \
     hunyuan,hunyuan-large,https://api.hunyuan.cloud.tencent.com/v1 \
     lingyiwanwu,yi-large,https://api.lingyiwanwu.com/v1 \
     mistral,open-mistral-nemo,https://api.mistral.ai/v1 \
diff --git a/config.example.yaml b/config.example.yaml
index 706c8c6f..f46cddd1 100644
--- a/config.example.yaml
+++ b/config.example.yaml
@@ -244,12 +244,6 @@ clients:
     api_base: https://api.cloudflare.com/client/v4/accounts/{ACCOUNT_ID}/ai/v1
     api_key: xxx
 
-  # See https://huggingface.co/inference-api/serverless
-  - type: openai-compatible
-    name: huggingface
-    api_base: https://api-inference.huggingface.co/v1
-    api_key: xxx
-
   # See https://cloud.baidu.com/doc/WENXINWORKSHOP/index.html
   - type: ernie
     api_key: xxx
diff --git a/models.yaml b/models.yaml
index 80e3fc7f..7c2b2526 100644
--- a/models.yaml
+++ b/models.yaml
@@ -685,30 +685,6 @@
       default_chunk_size: 1000
       max_batch_size: 100
 
-# Links:
-# - https://huggingface.co/models?other=text-generation-inference
-# - https://huggingface.co/docs/text-generation-inference/en/reference/api_reference
-- platform: huggingface
-  models:
-    - name: NousResearch/Hermes-3-Llama-3.1-8B
-      max_input_tokens: 8192
-      max_output_tokens: 4096
-      require_max_tokens: true
-      input_price: 0
-      output_price: 0
-    - name: mistralai/Mistral-Small-Instruct-2409
-      max_input_tokens: 128000
-      max_output_tokens: 4096
-      require_max_tokens: true
-      input_price: 0
-      output_price: 0
-    - name: mistralai/Mistral-Nemo-Instruct-2407
-      max_input_tokens: 128000
-      max_output_tokens: 4096
-      require_max_tokens: true
-      input_price: 0
-      output_price: 0
-
 # Links:
 # - https://cloud.baidu.com/doc/WENXINWORKSHOP/s/Nlks5zkzu
 # - https://cloud.baidu.com/doc/WENXINWORKSHOP/s/hlrk4akp7
diff --git a/src/client/mod.rs b/src/client/mod.rs
index 2430d94c..b22508b5 100644
--- a/src/client/mod.rs
+++ b/src/client/mod.rs
@@ -35,7 +35,7 @@ register_client!(
     (ernie, "ernie", ErnieConfig, ErnieClient),
 );
 
-pub const OPENAI_COMPATIBLE_PLATFORMS: [(&str, &str); 22] = [
+pub const OPENAI_COMPATIBLE_PLATFORMS: [(&str, &str); 21] = [
     ("ai21", "https://api.ai21.com/studio/v1"),
     ("cloudflare", ""),
     ("deepinfra", "https://api.deepinfra.com/v1/openai"),
@@ -43,7 +43,6 @@ pub const OPENAI_COMPATIBLE_PLATFORMS: [(&str, &str); 22] = [
     ("fireworks", "https://api.fireworks.ai/inference/v1"),
     ("github", "https://models.inference.ai.azure.com"),
     ("groq", "https://api.groq.com/openai/v1"),
-    ("huggingface", "https://api-inference.huggingface.co/v1"),
     ("hunyuan", "https://api.hunyuan.cloud.tencent.com/v1"),
     ("lingyiwanwu", "https://api.lingyiwanwu.com/v1"),
     ("mistral", "https://api.mistral.ai/v1"),