Skip to content

Commit

Permalink
feat: remove support for huggingface (#988)
Browse files Browse the repository at this point in the history
  • Loading branch information
sigoden authored Nov 12, 2024
1 parent 36e884c commit f720135
Show file tree
Hide file tree
Showing 4 changed files with 1 addition and 33 deletions.
1 change: 0 additions & 1 deletion Argcfile.sh
Original file line number Diff line number Diff line change
Expand Up @@ -87,7 +87,6 @@ OPENAI_COMPATIBLE_PLATFORMS=( \
fireworks,accounts/fireworks/models/llama-v3p1-8b-instruct,https://api.fireworks.ai/inference/v1 \
github,gpt-4o-mini,https://models.inference.ai.azure.com \
groq,llama3-8b-8192,https://api.groq.com/openai/v1 \
- huggingface,meta-llama/Meta-Llama-3-8B-Instruct,https://api-inference.huggingface.co/v1 \
hunyuan,hunyuan-large,https://api.hunyuan.cloud.tencent.com/v1 \
lingyiwanwu,yi-large,https://api.lingyiwanwu.com/v1 \
mistral,open-mistral-nemo,https://api.mistral.ai/v1 \
Expand Down
6 changes: 0 additions & 6 deletions config.example.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -244,12 +244,6 @@ clients:
api_base: https://api.cloudflare.com/client/v4/accounts/{ACCOUNT_ID}/ai/v1
api_key: xxx

- # See https://huggingface.co/inference-api/serverless
- - type: openai-compatible
- name: huggingface
- api_base: https://api-inference.huggingface.co/v1
- api_key: xxx
-
# See https://cloud.baidu.com/doc/WENXINWORKSHOP/index.html
- type: ernie
api_key: xxx
Expand Down
24 changes: 0 additions & 24 deletions models.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -685,30 +685,6 @@
default_chunk_size: 1000
max_batch_size: 100

- # Links:
- # - https://huggingface.co/models?other=text-generation-inference
- # - https://huggingface.co/docs/text-generation-inference/en/reference/api_reference
- - platform: huggingface
- models:
- - name: NousResearch/Hermes-3-Llama-3.1-8B
- max_input_tokens: 8192
- max_output_tokens: 4096
- require_max_tokens: true
- input_price: 0
- output_price: 0
- - name: mistralai/Mistral-Small-Instruct-2409
- max_input_tokens: 128000
- max_output_tokens: 4096
- require_max_tokens: true
- input_price: 0
- output_price: 0
- - name: mistralai/Mistral-Nemo-Instruct-2407
- max_input_tokens: 128000
- max_output_tokens: 4096
- require_max_tokens: true
- input_price: 0
- output_price: 0
-
# Links:
# - https://cloud.baidu.com/doc/WENXINWORKSHOP/s/Nlks5zkzu
# - https://cloud.baidu.com/doc/WENXINWORKSHOP/s/hlrk4akp7
Expand Down
3 changes: 1 addition & 2 deletions src/client/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -35,15 +35,14 @@ register_client!(
(ernie, "ernie", ErnieConfig, ErnieClient),
);

- pub const OPENAI_COMPATIBLE_PLATFORMS: [(&str, &str); 22] = [
+ pub const OPENAI_COMPATIBLE_PLATFORMS: [(&str, &str); 21] = [
("ai21", "https://api.ai21.com/studio/v1"),
("cloudflare", ""),
("deepinfra", "https://api.deepinfra.com/v1/openai"),
("deepseek", "https://api.deepseek.com"),
("fireworks", "https://api.fireworks.ai/inference/v1"),
("github", "https://models.inference.ai.azure.com"),
("groq", "https://api.groq.com/openai/v1"),
- ("huggingface", "https://api-inference.huggingface.co/v1"),
("hunyuan", "https://api.hunyuan.cloud.tencent.com/v1"),
("lingyiwanwu", "https://api.lingyiwanwu.com/v1"),
("mistral", "https://api.mistral.ai/v1"),
Expand Down

0 comments on commit f720135

Please sign in to comment.