Spaces:
Runtime error
Wonderplex committed
sotopia-pi prompt template fix (#66)
sotopia_pi_generate.py → sotopia_generate.py
RENAMED
@@ -3,6 +3,7 @@ import os
 from typing import TypeVar
 from functools import cache
 import logging
+import json

 import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
@@ -22,9 +23,10 @@ from langchain.prompts import (
     PromptTemplate,
 )
 from langchain.schema import BaseOutputParser, OutputParserException
+import spaces
+
 from message_classes import ActionType, AgentAction
 from utils import format_docstring
-
 from langchain_callback_handler import LoggingCallbackHandler

 HF_TOKEN_KEY_FILE="./hf_token.key"
@@ -89,7 +91,7 @@ def prepare_model(model_name):
         model = AutoModelForCausalLM.from_pretrained(
             "mistralai/Mistral-7B-Instruct-v0.1",
             cache_dir="./.cache",
-            device_map='cuda'
+            # device_map='cuda'
         )
         model = PeftModel.from_pretrained(model, model_name).to("cuda")

@@ -98,7 +100,7 @@ def prepare_model(model_name):
         model = AutoModelForCausalLM.from_pretrained(
             "mistralai/Mistral-7B-Instruct-v0.1",
             cache_dir="./.cache",
-            device_map='cuda',
+            # device_map='cuda',
             quantization_config=BitsAndBytesConfig(
                 load_in_4bit=True,
                 bnb_4bit_use_double_quant=True,
@@ -114,7 +116,7 @@ def prepare_model(model_name):
         model = AutoModelForCausalLM.from_pretrained(
             "mistralai/Mistral-7B-Instruct-v0.1",
             cache_dir="./.cache",
-            device_map='cuda'
+            # device_map='cuda'
         )

     else:
@@ -131,7 +133,7 @@ def obtain_chain_hf(
     max_tokens: int = 2700
 ) -> LLMChain:
     human_message_prompt = HumanMessagePromptTemplate(
-        prompt=PromptTemplate(template=template, input_variables=input_variables)
+        prompt=PromptTemplate(template="[INST] " + template + " [/INST]", input_variables=input_variables)
     )
     chat_prompt_template = ChatPromptTemplate.from_messages([human_message_prompt])
     model, tokenizer = prepare_model(model_name)
@@ -148,6 +150,7 @@ def obtain_chain_hf(
     chain = LLMChain(llm=hf, prompt=chat_prompt_template)
     return chain

+
 def generate(
     model_name: str,
     template: str,
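The headline change is the prompt template: the human message is now wrapped in Mistral's [INST] ... [/INST] instruction delimiters, which Mistral-7B-Instruct was fine-tuned to expect; without them the model tends to continue the prompt rather than answer it. A minimal sketch of the same format as produced by the model's own chat template (illustrative only, not code from this commit):

# Sketch (not part of this commit): the tokenizer's chat template shows the
# [INST] ... [/INST] wrapping that the fixed PromptTemplate now reproduces.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
messages = [{"role": "user", "content": "Say hi in one word."}]
print(tokenizer.apply_chat_template(messages, tokenize=False))
# -> '<s>[INST] Say hi in one word. [/INST]'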
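The new import spaces together with the commented-out device_map='cuda' arguments suggests the Space is being adapted to Hugging Face ZeroGPU, where a GPU is attached only while a @spaces.GPU-decorated function runs, so models should not be pinned to CUDA at import time. A hedged sketch of that pattern, assuming ZeroGPU hardware (the function respond and its body are hypothetical, not code from this commit):

import spaces  # Hugging Face Spaces helper; provides the @spaces.GPU decorator
from transformers import AutoModelForCausalLM, AutoTokenizer

MODEL = "mistralai/Mistral-7B-Instruct-v0.1"
tokenizer = AutoTokenizer.from_pretrained(MODEL, cache_dir="./.cache")
# Load without device_map='cuda': on ZeroGPU no GPU exists at import time.
model = AutoModelForCausalLM.from_pretrained(MODEL, cache_dir="./.cache")

@spaces.GPU  # hypothetical usage: a GPU is attached only for this call
def respond(prompt: str) -> str:
    model.to("cuda")
    inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
    out = model.generate(**inputs, max_new_tokens=64)
    return tokenizer.decode(out[0], skip_special_tokens=True)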
sotopia_space/chat.py
CHANGED
@@ -6,7 +6,7 @@ from typing import Literal
 import json
 from collections import defaultdict
 from utils import Environment, Agent, get_context_prompt, dialogue_history_prompt
-from sotopia_pi_generate import prepare_model, generate_action
+from sotopia_generate import prepare_model, generate_action
 from sotopia_space.constants import MODEL_OPTIONS

 DEPLOYED = os.getenv("DEPLOYED", "true").lower() == "true"
sotopia_space/constants.py
CHANGED
@@ -5,7 +5,7 @@ MODEL_OPTIONS = [
     "cmu-lti/sotopia-pi-mistral-7b-BC_SR",
     "cmu-lti/sotopia-pi-mistral-7b-BC_SR_4bit",
     "mistralai/Mistral-7B-Instruct-v0.1"
-    # "mistralai/Mixtral-8x7B-Instruct-v0.1",
+    # "mistralai/Mixtral-8x7B-Instruct-v0.1", # TODO: Add these model
     # "togethercomputer/llama-2-7b-chat",
     # "togethercomputer/llama-2-70b-chat",
     # "togethercomputer/mpt-30b-chat",