From c34d11906195d38a8826d308e6db68a03df3a20c Mon Sep 17 00:00:00 2001 From: Ariya Hidayat Date: Sun, 15 Sep 2024 19:05:18 -0700 Subject: [PATCH] CI: Use Llama 3.1 8B whenever possible --- .github/workflows/test-deepinfra.yml | 2 +- .github/workflows/test-fireworks.yml | 2 +- .github/workflows/test-groq.yml | 2 +- .github/workflows/test-lepton.yml | 3 ++- .github/workflows/test-novita.yml | 2 +- .github/workflows/test-octo.yml | 2 +- .github/workflows/test-together.yml | 2 +- 7 files changed, 8 insertions(+), 7 deletions(-) diff --git a/.github/workflows/test-deepinfra.yml b/.github/workflows/test-deepinfra.yml index d7fda09..6c5096f 100644 --- a/.github/workflows/test-deepinfra.yml +++ b/.github/workflows/test-deepinfra.yml @@ -21,6 +21,6 @@ jobs: env: LLM_API_BASE_URL: 'https://api.deepinfra.com/v1/openai' LLM_API_KEY: ${{ secrets.DEEPINFRA_API_KEY }} - LLM_CHAT_MODEL: 'meta-llama/Meta-Llama-3-8B-Instruct' + LLM_CHAT_MODEL: 'meta-llama/Meta-Llama-3.1-8B-Instruct' - run: cat output.txt diff --git a/.github/workflows/test-fireworks.yml b/.github/workflows/test-fireworks.yml index 76e302a..793b0e2 100644 --- a/.github/workflows/test-fireworks.yml +++ b/.github/workflows/test-fireworks.yml @@ -21,6 +21,6 @@ jobs: env: LLM_API_BASE_URL: 'https://api.fireworks.ai/inference/v1' LLM_API_KEY: ${{ secrets.FIREWORKS_API_KEY }} - LLM_CHAT_MODEL: 'accounts/fireworks/models/llama-v3-8b-instruct' + LLM_CHAT_MODEL: 'accounts/fireworks/models/llama-v3p1-8b-instruct' - run: cat output.txt diff --git a/.github/workflows/test-groq.yml b/.github/workflows/test-groq.yml index c0ee277..75f1036 100644 --- a/.github/workflows/test-groq.yml +++ b/.github/workflows/test-groq.yml @@ -21,6 +21,6 @@ jobs: env: LLM_API_BASE_URL: 'https://api.groq.com/openai/v1' LLM_API_KEY: ${{ secrets.GROQ_API_KEY }} - LLM_CHAT_MODEL: 'llama3-8b-8192' + LLM_CHAT_MODEL: 'llama-3.1-8b-instant' - run: cat output.txt diff --git a/.github/workflows/test-lepton.yml b/.github/workflows/test-lepton.yml index 
19ce332..8721453 100644 --- a/.github/workflows/test-lepton.yml +++ b/.github/workflows/test-lepton.yml @@ -19,7 +19,8 @@ jobs: - run: echo 'Which planet in our solar system is the largest?' | ./ask-llm.js | tee output.txt | grep -i jupiter timeout-minutes: 3 env: - LLM_API_BASE_URL: 'https://llama3-8b.lepton.run/api/v1' + LLM_API_BASE_URL: 'https://llama3-1-8b.lepton.run/api/v1' LLM_API_KEY: ${{ secrets.LEPTON_API_KEY }} + LLM_CHAT_MODEL: 'llama3-1-8b' - run: cat output.txt diff --git a/.github/workflows/test-novita.yml b/.github/workflows/test-novita.yml index 4306f3b..7b3568b 100644 --- a/.github/workflows/test-novita.yml +++ b/.github/workflows/test-novita.yml @@ -21,6 +21,6 @@ jobs: env: LLM_API_BASE_URL: 'https://api.novita.ai/v3/openai' LLM_API_KEY: ${{ secrets.NOVITA_API_KEY }} - LLM_CHAT_MODEL: 'meta-llama/llama-3-8b-instruct' + LLM_CHAT_MODEL: 'meta-llama/llama-3.1-8b-instruct' - run: cat output.txt diff --git a/.github/workflows/test-octo.yml b/.github/workflows/test-octo.yml index 83b5e87..a015df5 100644 --- a/.github/workflows/test-octo.yml +++ b/.github/workflows/test-octo.yml @@ -21,7 +21,7 @@ jobs: env: LLM_API_BASE_URL: 'https://text.octoai.run/v1' LLM_API_KEY: ${{ secrets.OCTOAI_API_KEY }} - LLM_CHAT_MODEL: 'hermes-2-pro-mistral-7b' + LLM_CHAT_MODEL: 'meta-llama-3.1-8b-instruct' LLM_STREAMING: 'no' - run: cat output.txt diff --git a/.github/workflows/test-together.yml b/.github/workflows/test-together.yml index 4b2db2b..9b1ece1 100644 --- a/.github/workflows/test-together.yml +++ b/.github/workflows/test-together.yml @@ -21,6 +21,6 @@ jobs: env: LLM_API_BASE_URL: 'https://api.together.xyz/v1' LLM_API_KEY: ${{ secrets.TOGETHER_API_KEY }} - LLM_CHAT_MODEL: 'meta-llama/Llama-3-8b-chat-hf' + LLM_CHAT_MODEL: 'meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo' - run: cat output.txt