sotopia-pi prompt template fix (#66)
Jasonqi146 authored Apr 29, 2024
1 parent 79cc507 commit 1f90e24
Showing 3 changed files with 10 additions and 7 deletions.
13 changes: 8 additions & 5 deletions sotopia_pi_generate.py → sotopia_generate.py
@@ -3,6 +3,7 @@
from typing import TypeVar
from functools import cache
import logging
import json

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
@@ -22,9 +23,10 @@
PromptTemplate,
)
from langchain.schema import BaseOutputParser, OutputParserException
import spaces

from message_classes import ActionType, AgentAction
from utils import format_docstring

from langchain_callback_handler import LoggingCallbackHandler

HF_TOKEN_KEY_FILE="./hf_token.key"
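
The newly added `import spaces` pulls in the Hugging Face Spaces helper package, which on ZeroGPU hardware attaches a GPU only inside a decorated call. A minimal sketch of that usual pattern, assuming the generation entry point is decorated elsewhere in this file (the function below is illustrative, not part of this diff):

```python
import spaces
import torch

@spaces.GPU  # request a GPU for the duration of this call on a ZeroGPU Space
def run_inference(model, tokenizer, prompt: str) -> str:
    # Hypothetical helper, not from this repository: tokenize, generate, decode.
    inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
    with torch.no_grad():
        output_ids = model.generate(**inputs, max_new_tokens=256)
    return tokenizer.decode(output_ids[0], skip_special_tokens=True)
```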
@@ -89,7 +91,7 @@ def prepare_model(model_name):
model = AutoModelForCausalLM.from_pretrained(
"mistralai/Mistral-7B-Instruct-v0.1",
cache_dir="./.cache",
device_map='cuda'
# device_map='cuda'
)
model = PeftModel.from_pretrained(model, model_name).to("cuda")

@@ -98,7 +100,7 @@ def prepare_model(model_name):
model = AutoModelForCausalLM.from_pretrained(
"mistralai/Mistral-7B-Instruct-v0.1",
cache_dir="./.cache",
device_map='cuda',
# device_map='cuda',
quantization_config=BitsAndBytesConfig(
load_in_4bit=True,
bnb_4bit_use_double_quant=True,
@@ -114,7 +116,7 @@ def prepare_model(model_name):
model = AutoModelForCausalLM.from_pretrained(
"mistralai/Mistral-7B-Instruct-v0.1",
cache_dir="./.cache",
device_map='cuda'
# device_map='cuda'
)

else:
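
Across all three `prepare_model` branches, `device_map='cuda'` is commented out at load time. Presumably this is because, on a ZeroGPU Space, CUDA is only attached inside a `@spaces.GPU` call, so pinning weights to the GPU during `from_pretrained` is not viable; the model is instead moved explicitly afterwards, as the `.to("cuda")` in the PEFT branch already does. A sketch of the assumed intent:

```python
from transformers import AutoModelForCausalLM

# Load on CPU at startup; defer GPU placement until a device is available.
model = AutoModelForCausalLM.from_pretrained(
    "mistralai/Mistral-7B-Instruct-v0.1",
    cache_dir="./.cache",
    # device_map='cuda',  # would place weights on CUDA at load time
)
model = model.to("cuda")  # done later, once the GPU has been attached
```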
@@ -131,7 +133,7 @@ def obtain_chain_hf(
max_tokens: int = 2700
) -> LLMChain:
human_message_prompt = HumanMessagePromptTemplate(
prompt=PromptTemplate(template=template, input_variables=input_variables)
prompt=PromptTemplate(template="[INST] " + template + " [/INST]", input_variables=input_variables)
)
chat_prompt_template = ChatPromptTemplate.from_messages([human_message_prompt])
model, tokenizer = prepare_model(model_name)
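
This is the prompt-template fix named in the commit title: the raw template is now wrapped in Mistral's `[INST] ... [/INST]` instruction markers, so the Instruct-tuned model sees the turn format it was trained on. A minimal illustration of the wrapping (the template text and variables below are made-up placeholders, not the project's actual prompt):

```python
from langchain.prompts import PromptTemplate

template = "You are {agent}. Continue the conversation:\n{history}"
prompt = PromptTemplate(
    template="[INST] " + template + " [/INST]",
    input_variables=["agent", "history"],
)
print(prompt.format(agent="Alice", history="Bob: Hi there!"))
# [INST] You are Alice. Continue the conversation:
# Bob: Hi there! [/INST]
```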
@@ -148,6 +150,7 @@ def obtain_chain_hf(
chain = LLMChain(llm=hf, prompt=chat_prompt_template)
return chain


def generate(
model_name: str,
template: str,
2 changes: 1 addition & 1 deletion sotopia_space/chat.py
@@ -6,7 +6,7 @@
import json
from collections import defaultdict
from utils import Environment, Agent, get_context_prompt, dialogue_history_prompt
from sotopia_pi_generate import prepare_model, generate_action
from sotopia_generate import prepare_model, generate_action
from sotopia_space.constants import MODEL_OPTIONS

DEPLOYED = os.getenv("DEPLOYED", "true").lower() == "true"
2 changes: 1 addition & 1 deletion sotopia_space/constants.py
@@ -5,7 +5,7 @@
"cmu-lti/sotopia-pi-mistral-7b-BC_SR",
"cmu-lti/sotopia-pi-mistral-7b-BC_SR_4bit",
"mistralai/Mistral-7B-Instruct-v0.1"
# "mistralai/Mixtral-8x7B-Instruct-v0.1",
# "mistralai/Mixtral-8x7B-Instruct-v0.1", # TODO: Add these model
# "togethercomputer/llama-2-7b-chat",
# "togethercomputer/llama-2-70b-chat",
# "togethercomputer/mpt-30b-chat",
