From ffb0af8236331c942f19ae7c4c4da38a6d0e8214 Mon Sep 17 00:00:00 2001 From: sigoden Date: Mon, 29 Apr 2024 20:08:59 +0800 Subject: [PATCH] refactor: add some openai-compatiable platforms to config.example.yaml (#464) --- config.example.yaml | 72 +++++++++++++++++++++++++++++++++++++++------ models.yaml | 4 +++ 2 files changed, 67 insertions(+), 9 deletions(-) diff --git a/config.example.yaml b/config.example.yaml index bc38ef0..f838d04 100644 --- a/config.example.yaml +++ b/config.example.yaml @@ -124,14 +124,7 @@ clients: - type: moonshot api_key: sk-xxx # ENV: {client_name}_API_KEY - # Any platform that is compatible with OpenAI's API can be used here, including: - # - localai: https://github.com/mudler/LocalAI - # - anyscale: https://docs.anyscale.com/endpoints/model-serving/openai-migration-guide - # - deepinfra: https://deepinfra.com/docs/advanced/openai_api - # - fireworks: https://readme.fireworks.ai/docs/openai-compatibility - # - together.ai: https://docs.together.ai/docs/openai-api-compatibility - # - huggingface: https://huggingface.co/docs/text-generation-inference/messages_api - # - OctoAI: https://octo.ai/docs/text-gen-solution/migration-from-openai + # For any platform compatible with OpenAI's API - type: openai-compatible name: localai api_base: http://localhost:8080/v1 # ENV: {client_name}_API_BASE @@ -139,4 +132,65 @@ clients: chat_endpoint: /chat/completions # Optional models: # Required - name: llama3 - max_input_tokens: 8192 \ No newline at end of file + max_input_tokens: 8192 + + # See https://docs.endpoints.anyscale.com/ + - type: openai-compatible + name: anyscale + api_base: https://api.endpoints.anyscale.com/v1 + api_key: xxx + models: + # https://docs.endpoints.anyscale.com/text-generation/query-a-model#select-a-model + - name: meta-llama/Meta-Llama-3-70B-Instruct + max_input_tokens: 8192 + input_price: 1 + output_price: 1 + + # See https://deepinfra.com/docs + - type: openai-compatible + name: deepinfra + api_base: https://api.deepinfra.com/v1/openai + api_key: xxx + models: + # https://deepinfra.com/models + - name: meta-llama/Meta-Llama-3-70B-Instruct + max_input_tokens: 8192 + input_price: 0.59 + output_price: 0.79 + + # See https://readme.fireworks.ai/docs/quickstart + - type: openai-compatible + name: fireworks + api_base: https://api.fireworks.ai/inference/v1 + api_key: xxx + models: + # https://fireworks.ai/models + - name: accounts/fireworks/models/llama-v3-70b-instruct + max_input_tokens: 8192 + input_price: 0.9 + output_price: 0.9 + + + # See https://octo.ai/docs/getting-started/quickstart + - type: openai-compatible + name: octoai + api_base: https://text.octoai.run/v1 + api_key: xxx + models: + # https://octo.ai/docs/getting-started/inference-models + - name: meta-llama-3-70b-instruct + max_input_tokens: 8192 + input_price: 0.86 + output_price: 0.86 + + # See https://docs.together.ai/docs/quickstart + - type: openai-compatible + name: together + api_base: https://api.together.xyz/v1 + api_key: xxx + models: + # https://docs.together.ai/docs/inference-models + - name: meta-llama/Llama-3-70b-chat-hf + max_input_tokens: 8192 + input_price: 0.9 + output_price: 0.9 \ No newline at end of file diff --git a/models.yaml b/models.yaml index 52dffdd..ed53521 100644 --- a/models.yaml +++ b/models.yaml @@ -1,3 +1,7 @@ +# NOTES: +# - This model list is scheduled to be updated with each new aichat release. Please do not submit PR to add new models. +# - This model list does not include models officially marked as legacy or beta. + - type: openai # docs: # - https://platform.openai.com/docs/models