From 4ddccc361c04592d54d796b24f72508a5234ffb5 Mon Sep 17 00:00:00 2001 From: sigoden Date: Mon, 29 Apr 2024 09:05:02 +0000 Subject: [PATCH] refactor: update groq models at models.yaml --- models.yaml | 17 ++++++++++++++--- 1 file changed, 14 insertions(+), 3 deletions(-) diff --git a/models.yaml b/models.yaml index 1ca2c4b..52dffdd 100644 --- a/models.yaml +++ b/models.yaml @@ -208,21 +208,32 @@ - type: groq # docs: # - https://console.groq.com/docs/models + # - https://wow.groq.com # - https://console.groq.com/docs/text-chat # notes: - # - unable to get max_output_tokens info + # - get max_output_tokens info from playground # - all models are free with rate limits models: - name: llama3-8b-8192 max_input_tokens: 8192 + max_output_tokens?: 8192 + input_price: 0.05 + output_price: 0.10 - name: llama3-70b-8192 max_input_tokens: 8192 - - name: llama2-70b-4096 - max_input_tokens: 4096 + max_output_tokens?: 8192 + input_price: 0.59 + output_price: 0.79 - name: mixtral-8x7b-32768 max_input_tokens: 32768 + max_output_tokens?: 32768 + input_price: 0.27 + output_price: 0.27 - name: gemma-7b-it max_input_tokens: 8192 + max_output_tokens?: 8192 + input_price: 0.10 + output_price: 0.10 - type: vertexai # docs: