From de1f90881dabeeef0677b37f54917372e9ca4b54 Mon Sep 17 00:00:00 2001 From: Yifan Mai Date: Fri, 16 Feb 2024 12:15:48 -0800 Subject: [PATCH] Add openai/gpt-3.5-turbo-instruct model --- src/helm/config/model_deployments.yaml | 8 ++++++++ src/helm/config/model_metadata.yaml | 8 ++++++++ src/helm/proxy/clients/openai_client.py | 6 +++++- 3 files changed, 21 insertions(+), 1 deletion(-) diff --git a/src/helm/config/model_deployments.yaml b/src/helm/config/model_deployments.yaml index 8fed4b64c5..78c7b0e403 100644 --- a/src/helm/config/model_deployments.yaml +++ b/src/helm/config/model_deployments.yaml @@ -1041,6 +1041,14 @@ model_deployments: ## GPT 3.5 Turbo Models # ChatGPT: https://openai.com/blog/chatgpt + - name: openai/gpt-3.5-turbo-instruct + model_name: openai/gpt-3.5-turbo-instruct + tokenizer_name: openai/cl100k_base + max_sequence_length: 4096 + max_request_length: 4097 + client_spec: + class_name: "helm.proxy.clients.openai_client.OpenAIClient" + # The claimed sequence length is 4096, but as of 2023-03-07, the empirical usable # sequence length is smaller at 4087 with one user input message and one assistant # output message because ChatGPT uses special tokens for message roles and boundaries. diff --git a/src/helm/config/model_metadata.yaml b/src/helm/config/model_metadata.yaml index e316c6fcb0..aeed2e0cdb 100644 --- a/src/helm/config/model_metadata.yaml +++ b/src/helm/config/model_metadata.yaml @@ -1360,6 +1360,14 @@ models: ## GPT 3.5 Turbo Models # ChatGPT: https://openai.com/blog/chatgpt + - name: openai/gpt-3.5-turbo-instruct + display_name: GPT-3.5 Turbo Instruct + description: Similar capabilities as GPT-3 era models. Compatible with legacy Completions endpoint and not Chat Completions.
+ creator_organization_name: OpenAI + access: limited + release_date: 2023-09-18 + tags: [TEXT_MODEL_TAG, OPENAI_CHATGPT_MODEL_TAG, LIMITED_FUNCTIONALITY_TEXT_MODEL_TAG, INSTRUCTION_FOLLOWING_MODEL_TAG] + - name: openai/gpt-3.5-turbo-0301 display_name: GPT-3.5 Turbo (0301) description: Sibling model of text-davinci-003 that is optimized for chat but works well for traditional completions tasks as well. Snapshot from 2023-03-01. diff --git a/src/helm/proxy/clients/openai_client.py b/src/helm/proxy/clients/openai_client.py index 37068574f9..a6042678dd 100644 --- a/src/helm/proxy/clients/openai_client.py +++ b/src/helm/proxy/clients/openai_client.py @@ -43,7 +43,11 @@ def __init__( self.api_base: str = "https://api.openai.com/v1" def _is_chat_model_engine(self, model_engine: str): - return model_engine.startswith("gpt-3.5") or model_engine.startswith("gpt-4") + if model_engine == "gpt-3.5-turbo-instruct": + return False + elif model_engine.startswith("gpt-3.5") or model_engine.startswith("gpt-4"): + return True + return False def _set_access_info(self): # Following https://beta.openai.com/docs/api-reference/authentication