From e28c0469f49950e82d9fe5106de73305647466d2 Mon Sep 17 00:00:00 2001
From: timothycarambat <rambat1010@gmail.com>
Date: Thu, 18 Apr 2024 16:28:43 -0700
Subject: [PATCH] Bump TogetherAI models (Apr 18, 2024); resolves #1126

---
 server/utils/AiProviders/togetherAi/models.js | 26 ++++++++++++++++++-
 .../togetherAi/scripts/chat_models.txt        |  6 ++++-
 .../AiProviders/togetherAi/scripts/parse.mjs  |  2 +-
 3 files changed, 31 insertions(+), 3 deletions(-)

diff --git a/server/utils/AiProviders/togetherAi/models.js b/server/utils/AiProviders/togetherAi/models.js
index 6fad3969b..79ab93bab 100644
--- a/server/utils/AiProviders/togetherAi/models.js
+++ b/server/utils/AiProviders/togetherAi/models.js
@@ -39,7 +39,7 @@ const MODELS = {
     id: "databricks/dbrx-instruct",
     organization: "databricks",
     name: "DBRX Instruct",
-    maxLength: 32000,
+    maxLength: 32768,
   },
   "deepseek-ai/deepseek-coder-33b-instruct": {
     id: "deepseek-ai/deepseek-coder-33b-instruct",
@@ -131,6 +131,24 @@ const MODELS = {
     name: "LLaMA-2 Chat (7B)",
     maxLength: 4096,
   },
+  "meta-llama/Llama-3-8b-chat-hf": {
+    id: "meta-llama/Llama-3-8b-chat-hf",
+    organization: "Meta",
+    name: "LLaMA-3 Chat (8B)",
+    maxLength: 8000,
+  },
+  "meta-llama/Llama-3-70b-chat-hf": {
+    id: "meta-llama/Llama-3-70b-chat-hf",
+    organization: "Meta",
+    name: "LLaMA-3 Chat (70B)",
+    maxLength: 8000,
+  },
+  "microsoft/WizardLM-2-8x22B": {
+    id: "microsoft/WizardLM-2-8x22B",
+    organization: "Microsoft",
+    name: "WizardLM-2 (8x22B)",
+    maxLength: 65536,
+  },
   "mistralai/Mistral-7B-Instruct-v0.1": {
     id: "mistralai/Mistral-7B-Instruct-v0.1",
     organization: "mistralai",
@@ -149,6 +167,12 @@ const MODELS = {
     name: "Mixtral-8x7B Instruct (46.7B)",
     maxLength: 32768,
   },
+  "mistralai/Mixtral-8x22B-Instruct-v0.1": {
+    id: "mistralai/Mixtral-8x22B-Instruct-v0.1",
+    organization: "mistralai",
+    name: "Mixtral-8x22B Instruct (141B)",
+    maxLength: 65536,
+  },
   "NousResearch/Nous-Capybara-7B-V1p9": {
     id: "NousResearch/Nous-Capybara-7B-V1p9",
     organization: "NousResearch",
diff --git a/server/utils/AiProviders/togetherAi/scripts/chat_models.txt b/server/utils/AiProviders/togetherAi/scripts/chat_models.txt
index 03f0414cb..499d23549 100644
--- a/server/utils/AiProviders/togetherAi/scripts/chat_models.txt
+++ b/server/utils/AiProviders/togetherAi/scripts/chat_models.txt
@@ -6,7 +6,7 @@
 | Allen AI | OLMo (7B) | allenai/OLMo-7B | 2048 |
 | Austism | Chronos Hermes (13B) | Austism/chronos-hermes-13b | 2048 |
 | cognitivecomputations | Dolphin 2.5 Mixtral 8x7b | cognitivecomputations/dolphin-2.5-mixtral-8x7b | 32768 |
-| databricks | DBRX Instruct | databricks/dbrx-instruct | 32000 |
+| databricks | DBRX Instruct | databricks/dbrx-instruct | 32768 |
 | DeepSeek | Deepseek Coder Instruct (33B) | deepseek-ai/deepseek-coder-33b-instruct | 16384 |
 | DeepSeek | DeepSeek LLM Chat (67B) | deepseek-ai/deepseek-llm-67b-chat | 4096 |
 | garage-bAInd | Platypus2 Instruct (70B) | garage-bAInd/Platypus2-70B-instruct | 4096 |
@@ -22,9 +22,13 @@
 | Meta | LLaMA-2 Chat (70B) | meta-llama/Llama-2-70b-chat-hf | 4096 |
 | Meta | LLaMA-2 Chat (13B) | meta-llama/Llama-2-13b-chat-hf | 4096 |
 | Meta | LLaMA-2 Chat (7B) | meta-llama/Llama-2-7b-chat-hf | 4096 |
+| Meta | LLaMA-3 Chat (8B) | meta-llama/Llama-3-8b-chat-hf | 8000 |
+| Meta | LLaMA-3 Chat (70B) | meta-llama/Llama-3-70b-chat-hf | 8000 |
+| Microsoft | WizardLM-2 (8x22B) | microsoft/WizardLM-2-8x22B | 65536 |
 | mistralai | Mistral (7B) Instruct | mistralai/Mistral-7B-Instruct-v0.1 | 8192 |
 | mistralai | Mistral (7B) Instruct v0.2 | mistralai/Mistral-7B-Instruct-v0.2 | 32768 |
 | mistralai | Mixtral-8x7B Instruct (46.7B) | mistralai/Mixtral-8x7B-Instruct-v0.1 | 32768 |
+| mistralai | Mixtral-8x22B Instruct (141B) | mistralai/Mixtral-8x22B-Instruct-v0.1 | 65536 |
 | NousResearch | Nous Capybara v1.9 (7B) | NousResearch/Nous-Capybara-7B-V1p9 | 8192 |
 | NousResearch | Nous Hermes 2 - Mistral DPO (7B) | NousResearch/Nous-Hermes-2-Mistral-7B-DPO | 32768 |
 | NousResearch | Nous Hermes 2 - Mixtral 8x7B-DPO (46.7B) | NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO | 32768 |
diff --git a/server/utils/AiProviders/togetherAi/scripts/parse.mjs b/server/utils/AiProviders/togetherAi/scripts/parse.mjs
index b78404012..7d5d6277c 100644
--- a/server/utils/AiProviders/togetherAi/scripts/parse.mjs
+++ b/server/utils/AiProviders/togetherAi/scripts/parse.mjs
@@ -8,7 +8,7 @@
 // copy outputs into the export in ../models.js
 
 // Update the date below if you run this again because TogetherAI added new models.
-// Last Collected: Apr 14, 2024
+// Last Collected: Apr 18, 2024
 // Since last collection Together's docs are broken. I just copied the HTML table
 // and had claude3 convert to markdown and it works well enough.
 
-- 
GitLab